109c6f1ddSLingrui98/*************************************************************************************** 209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory 409c6f1ddSLingrui98* 509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2. 609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2. 709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at: 809c6f1ddSLingrui98* http://license.coscl.org.cn/MulanPSL2 909c6f1ddSLingrui98* 1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 1309c6f1ddSLingrui98* 1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details. 1509c6f1ddSLingrui98***************************************************************************************/ 1609c6f1ddSLingrui98 1709c6f1ddSLingrui98package xiangshan.frontend 1809c6f1ddSLingrui98 198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters 2009c6f1ddSLingrui98import chisel3._ 2109c6f1ddSLingrui98import chisel3.util._ 221ca0e4f3SYinan Xuimport utils._ 233c02ee8fSwakafaimport utility._ 2409c6f1ddSLingrui98import xiangshan._ 25e30430c2SJayimport xiangshan.frontend.icache._ 261ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO 272e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion 283c02ee8fSwakafaimport utility.ChiselDB 2951532d8bSGuokai Chen 3051532d8bSGuokai Chenclass FtqDebugBundle extends Bundle { 3151532d8bSGuokai Chen val pc = UInt(39.W) 3251532d8bSGuokai Chen val target = UInt(39.W) 3351532d8bSGuokai Chen val isBr = Bool() 3451532d8bSGuokai Chen val isJmp = Bool() 3551532d8bSGuokai Chen val isCall = Bool() 3651532d8bSGuokai Chen val isRet = Bool() 3751532d8bSGuokai Chen val misPred = Bool() 3851532d8bSGuokai Chen val isTaken = Bool() 3951532d8bSGuokai Chen val predStage = UInt(2.W) 4051532d8bSGuokai Chen} 4109c6f1ddSLingrui98 423b739f49SXuan Huclass FtqPtr(entries: Int) extends CircularQueuePtr[FtqPtr]( 433b739f49SXuan Hu entries 4409c6f1ddSLingrui98){ 453b739f49SXuan Hu def this()(implicit p: Parameters) = this(p(XSCoreParamsKey).FtqSize) 4609c6f1ddSLingrui98} 4709c6f1ddSLingrui98 4809c6f1ddSLingrui98object FtqPtr { 4909c6f1ddSLingrui98 def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = { 5009c6f1ddSLingrui98 val ptr = Wire(new FtqPtr) 5109c6f1ddSLingrui98 ptr.flag := f 5209c6f1ddSLingrui98 ptr.value := v 5309c6f1ddSLingrui98 ptr 5409c6f1ddSLingrui98 } 5509c6f1ddSLingrui98 def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr = { 5609c6f1ddSLingrui98 apply(!ptr.flag, ptr.value) 5709c6f1ddSLingrui98 } 5809c6f1ddSLingrui98} 5909c6f1ddSLingrui98 6009c6f1ddSLingrui98class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule { 6109c6f1ddSLingrui98 6209c6f1ddSLingrui98 val io = IO(new Bundle() { 6309c6f1ddSLingrui98 val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W))) 6409c6f1ddSLingrui98 val ren = Input(Vec(numRead, Bool())) 6509c6f1ddSLingrui98 val rdata = Output(Vec(numRead, gen)) 6609c6f1ddSLingrui98 val waddr = Input(UInt(log2Up(FtqSize).W)) 6709c6f1ddSLingrui98 val wen = Input(Bool()) 6809c6f1ddSLingrui98 val wdata = Input(gen) 6909c6f1ddSLingrui98 }) 7009c6f1ddSLingrui98 7109c6f1ddSLingrui98 for(i <- 0 until numRead){ 7209c6f1ddSLingrui98 val sram = Module(new SRAMTemplate(gen, FtqSize)) 7309c6f1ddSLingrui98 sram.io.r.req.valid := io.ren(i) 7409c6f1ddSLingrui98 sram.io.r.req.bits.setIdx := io.raddr(i) 7509c6f1ddSLingrui98 io.rdata(i) := sram.io.r.resp.data(0) 7609c6f1ddSLingrui98 sram.io.w.req.valid := io.wen 7709c6f1ddSLingrui98 sram.io.w.req.bits.setIdx := io.waddr 7809c6f1ddSLingrui98 sram.io.w.req.bits.data := VecInit(io.wdata) 7909c6f1ddSLingrui98 } 8009c6f1ddSLingrui98 8109c6f1ddSLingrui98} 8209c6f1ddSLingrui98 8309c6f1ddSLingrui98class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils { 8409c6f1ddSLingrui98 val startAddr = UInt(VAddrBits.W) 85b37e4b45SLingrui98 val nextLineAddr = UInt(VAddrBits.W) 8609c6f1ddSLingrui98 val isNextMask = Vec(PredictWidth, Bool()) 87b37e4b45SLingrui98 val fallThruError = Bool() 88b37e4b45SLingrui98 // val carry = Bool() 8909c6f1ddSLingrui98 def getPc(offset: UInt) = { 9085215037SLingrui98 def getHigher(pc: UInt) = pc(VAddrBits-1, log2Ceil(PredictWidth)+instOffsetBits+1) 9185215037SLingrui98 def getOffset(pc: UInt) = pc(log2Ceil(PredictWidth)+instOffsetBits, instOffsetBits) 92b37e4b45SLingrui98 Cat(getHigher(Mux(isNextMask(offset) && startAddr(log2Ceil(PredictWidth)+instOffsetBits), nextLineAddr, startAddr)), 9309c6f1ddSLingrui98 getOffset(startAddr)+offset, 0.U(instOffsetBits.W)) 9409c6f1ddSLingrui98 } 9509c6f1ddSLingrui98 def fromBranchPrediction(resp: BranchPredictionBundle) = { 96a229ab6cSLingrui98 def carryPos(addr: UInt) = addr(instOffsetBits+log2Ceil(PredictWidth)+1) 97adc0b8dfSGuokai Chen this.startAddr := resp.pc(3) 98adc0b8dfSGuokai Chen this.nextLineAddr := resp.pc(3) + (FetchWidth * 4 * 2).U // may be broken on other configs 9909c6f1ddSLingrui98 this.isNextMask := VecInit((0 until PredictWidth).map(i => 100935edac4STang Haojin (resp.pc(3)(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool 10109c6f1ddSLingrui98 )) 102adc0b8dfSGuokai Chen this.fallThruError := resp.fallThruError(3) 10309c6f1ddSLingrui98 this 10409c6f1ddSLingrui98 } 10509c6f1ddSLingrui98 override def toPrintable: Printable = { 106b37e4b45SLingrui98 p"startAddr:${Hexadecimal(startAddr)}" 10709c6f1ddSLingrui98 } 10809c6f1ddSLingrui98} 10909c6f1ddSLingrui98 11009c6f1ddSLingrui98class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle { 11109c6f1ddSLingrui98 val brMask = Vec(PredictWidth, Bool()) 11209c6f1ddSLingrui98 val jmpInfo = ValidUndirectioned(Vec(3, Bool())) 11309c6f1ddSLingrui98 val jmpOffset = UInt(log2Ceil(PredictWidth).W) 11409c6f1ddSLingrui98 val jalTarget = UInt(VAddrBits.W) 11509c6f1ddSLingrui98 val rvcMask = Vec(PredictWidth, Bool()) 11609c6f1ddSLingrui98 def hasJal = jmpInfo.valid && !jmpInfo.bits(0) 11709c6f1ddSLingrui98 def hasJalr = jmpInfo.valid && jmpInfo.bits(0) 11809c6f1ddSLingrui98 def hasCall = jmpInfo.valid && jmpInfo.bits(1) 11909c6f1ddSLingrui98 def hasRet = jmpInfo.valid && jmpInfo.bits(2) 12009c6f1ddSLingrui98 12109c6f1ddSLingrui98 def fromPdWb(pdWb: PredecodeWritebackBundle) = { 12209c6f1ddSLingrui98 val pds = pdWb.pd 12309c6f1ddSLingrui98 this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid)) 12409c6f1ddSLingrui98 this.jmpInfo.valid := VecInit(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)).asUInt.orR 12509c6f1ddSLingrui98 this.jmpInfo.bits := ParallelPriorityMux(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid), 12609c6f1ddSLingrui98 pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet))) 12709c6f1ddSLingrui98 this.jmpOffset := ParallelPriorityEncoder(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)) 12809c6f1ddSLingrui98 this.rvcMask := VecInit(pds.map(pd => pd.isRVC)) 12909c6f1ddSLingrui98 this.jalTarget := pdWb.jalTarget 13009c6f1ddSLingrui98 } 13109c6f1ddSLingrui98 13209c6f1ddSLingrui98 def toPd(offset: UInt) = { 13309c6f1ddSLingrui98 require(offset.getWidth == log2Ceil(PredictWidth)) 13409c6f1ddSLingrui98 val pd = Wire(new PreDecodeInfo) 13509c6f1ddSLingrui98 pd.valid := true.B 13609c6f1ddSLingrui98 pd.isRVC := rvcMask(offset) 13709c6f1ddSLingrui98 val isBr = brMask(offset) 13809c6f1ddSLingrui98 val isJalr = offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(0) 13909c6f1ddSLingrui98 pd.brType := Cat(offset === jmpOffset && jmpInfo.valid, isJalr || isBr) 14009c6f1ddSLingrui98 pd.isCall := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(1) 14109c6f1ddSLingrui98 pd.isRet := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(2) 14209c6f1ddSLingrui98 pd 14309c6f1ddSLingrui98 } 14409c6f1ddSLingrui98} 14509c6f1ddSLingrui98 146f9c51548Sssszwicclass PrefetchPtrDB(implicit p: Parameters) extends Bundle { 147f9c51548Sssszwic val fromFtqPtr = UInt(log2Up(p(XSCoreParamsKey).FtqSize).W) 148f9c51548Sssszwic val fromIfuPtr = UInt(log2Up(p(XSCoreParamsKey).FtqSize).W) 149f9c51548Sssszwic} 15009c6f1ddSLingrui98 1513711cf36S小造xu_zhclass Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo { 152abdc3a32Sxu_zh val sc_disagree = if (!env.FPGAPlatform) Some(Vec(numBr, Bool())) else None 1533711cf36S小造xu_zh} 15409c6f1ddSLingrui98 15509c6f1ddSLingrui98class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst { 15609c6f1ddSLingrui98 val meta = UInt(MaxMetaLength.W) 157deb3a97eSGao-Zeyu val ftb_entry = new FTBEntry 15809c6f1ddSLingrui98} 15909c6f1ddSLingrui98 16009c6f1ddSLingrui98class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle { 16109c6f1ddSLingrui98 val target = UInt(VAddrBits.W) 16209c6f1ddSLingrui98 val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)) 16309c6f1ddSLingrui98} 16409c6f1ddSLingrui98 16509c6f1ddSLingrui98 16609c6f1ddSLingrui98class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle { 16754c6d89dSxiaofeibao-xjtu val valid = Output(Bool()) 16809c6f1ddSLingrui98 val ptr = Output(new FtqPtr) 16909c6f1ddSLingrui98 val offset = Output(UInt(log2Ceil(PredictWidth).W)) 17009c6f1ddSLingrui98 val data = Input(gen) 17154c6d89dSxiaofeibao-xjtu def apply(valid: Bool, ptr: FtqPtr, offset: UInt) = { 17254c6d89dSxiaofeibao-xjtu this.valid := valid 17309c6f1ddSLingrui98 this.ptr := ptr 17409c6f1ddSLingrui98 this.offset := offset 17509c6f1ddSLingrui98 this.data 17609c6f1ddSLingrui98 } 17709c6f1ddSLingrui98} 17809c6f1ddSLingrui98 17909c6f1ddSLingrui98 18009c6f1ddSLingrui98class FtqToBpuIO(implicit p: Parameters) extends XSBundle { 18109c6f1ddSLingrui98 val redirect = Valid(new BranchPredictionRedirect) 18209c6f1ddSLingrui98 val update = Valid(new BranchPredictionUpdate) 18309c6f1ddSLingrui98 val enq_ptr = Output(new FtqPtr) 184fd3aa057SYuandongliang val redirctFromIFU = Output(Bool()) 18509c6f1ddSLingrui98} 18609c6f1ddSLingrui98 1872c9f4a9fSxu_zhclass BpuFlushInfo(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper { 18809c6f1ddSLingrui98 // when ifu pipeline is not stalled, 18909c6f1ddSLingrui98 // a packet from bpu s3 can reach f1 at most 19009c6f1ddSLingrui98 val s2 = Valid(new FtqPtr) 191cb4f77ceSLingrui98 val s3 = Valid(new FtqPtr) 19209c6f1ddSLingrui98 def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = { 19309c6f1ddSLingrui98 src.valid && !isAfter(src.bits, idx_to_flush) 19409c6f1ddSLingrui98 } 19509c6f1ddSLingrui98 def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx) 196cb4f77ceSLingrui98 def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx) 19709c6f1ddSLingrui98} 1982c9f4a9fSxu_zh 1992c9f4a9fSxu_zhclass FtqToIfuIO(implicit p: Parameters) extends XSBundle { 2002c9f4a9fSxu_zh val req = Decoupled(new FetchRequestBundle) 2012c9f4a9fSxu_zh val redirect = Valid(new BranchPredictionRedirect) 2022c9f4a9fSxu_zh val topdown_redirect = Valid(new BranchPredictionRedirect) 2032c9f4a9fSxu_zh val flushFromBpu = new BpuFlushInfo 20409c6f1ddSLingrui98} 20509c6f1ddSLingrui98 2062c9f4a9fSxu_zhclass FtqToICacheIO(implicit p: Parameters) extends XSBundle { 207c5c5edaeSJenius //NOTE: req.bits must be prepare in T cycle 208c5c5edaeSJenius // while req.valid is set true in T + 1 cycle 209c5c5edaeSJenius val req = Decoupled(new FtqToICacheRequestBundle) 210c5c5edaeSJenius} 211c5c5edaeSJenius 2122c9f4a9fSxu_zhclass FtqToPrefetchIO(implicit p: Parameters) extends XSBundle { 213b92f8445Sssszwic val req = Decoupled(new FtqICacheInfo) 2142c9f4a9fSxu_zh val flushFromBpu = new BpuFlushInfo 215b92f8445Sssszwic} 216b92f8445Sssszwic 21709c6f1ddSLingrui98trait HasBackendRedirectInfo extends HasXSParameter { 21809c6f1ddSLingrui98 def isLoadReplay(r: Valid[Redirect]) = r.bits.flushItself() 21909c6f1ddSLingrui98} 22009c6f1ddSLingrui98 22109c6f1ddSLingrui98class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo { 222b56f947eSYinan Xu // write to backend pc mem 223b56f947eSYinan Xu val pc_mem_wen = Output(Bool()) 224f533cba7SHuSipeng val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W)) 225b56f947eSYinan Xu val pc_mem_wdata = Output(new Ftq_RF_Components) 226873dc383SLingrui98 // newest target 2276022c595SsinceforYy val newest_entry_en = Output(Bool()) 228873dc383SLingrui98 val newest_entry_target = Output(UInt(VAddrBits.W)) 229873dc383SLingrui98 val newest_entry_ptr = Output(new FtqPtr) 23009c6f1ddSLingrui98} 23109c6f1ddSLingrui98 23209c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter { 23309c6f1ddSLingrui98 val io = IO(new Bundle { 23409c6f1ddSLingrui98 val start_addr = Input(UInt(VAddrBits.W)) 23509c6f1ddSLingrui98 val old_entry = Input(new FTBEntry) 23609c6f1ddSLingrui98 val pd = Input(new Ftq_pd_Entry) 23709c6f1ddSLingrui98 val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W))) 23809c6f1ddSLingrui98 val target = Input(UInt(VAddrBits.W)) 23909c6f1ddSLingrui98 val hit = Input(Bool()) 24009c6f1ddSLingrui98 val mispredict_vec = Input(Vec(PredictWidth, Bool())) 24109c6f1ddSLingrui98 24209c6f1ddSLingrui98 val new_entry = Output(new FTBEntry) 24309c6f1ddSLingrui98 val new_br_insert_pos = Output(Vec(numBr, Bool())) 24409c6f1ddSLingrui98 val taken_mask = Output(Vec(numBr, Bool())) 245803124a6SLingrui98 val jmp_taken = Output(Bool()) 24609c6f1ddSLingrui98 val mispred_mask = Output(Vec(numBr+1, Bool())) 24709c6f1ddSLingrui98 24809c6f1ddSLingrui98 // for perf counters 24909c6f1ddSLingrui98 val is_init_entry = Output(Bool()) 25009c6f1ddSLingrui98 val is_old_entry = Output(Bool()) 25109c6f1ddSLingrui98 val is_new_br = Output(Bool()) 25209c6f1ddSLingrui98 val is_jalr_target_modified = Output(Bool()) 25309c6f1ddSLingrui98 val is_always_taken_modified = Output(Bool()) 25409c6f1ddSLingrui98 val is_br_full = Output(Bool()) 25509c6f1ddSLingrui98 }) 25609c6f1ddSLingrui98 25709c6f1ddSLingrui98 // no mispredictions detected at predecode 25809c6f1ddSLingrui98 val hit = io.hit 25909c6f1ddSLingrui98 val pd = io.pd 26009c6f1ddSLingrui98 26109c6f1ddSLingrui98 val init_entry = WireInit(0.U.asTypeOf(new FTBEntry)) 26209c6f1ddSLingrui98 26309c6f1ddSLingrui98 26409c6f1ddSLingrui98 val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid 26509c6f1ddSLingrui98 val entry_has_jmp = pd.jmpInfo.valid 26609c6f1ddSLingrui98 val new_jmp_is_jal = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid 26709c6f1ddSLingrui98 val new_jmp_is_jalr = entry_has_jmp && pd.jmpInfo.bits(0) && io.cfiIndex.valid 26809c6f1ddSLingrui98 val new_jmp_is_call = entry_has_jmp && pd.jmpInfo.bits(1) && io.cfiIndex.valid 26909c6f1ddSLingrui98 val new_jmp_is_ret = entry_has_jmp && pd.jmpInfo.bits(2) && io.cfiIndex.valid 27009c6f1ddSLingrui98 val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last 271a60a2901SLingrui98 // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last 27209c6f1ddSLingrui98 27309c6f1ddSLingrui98 val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal 27409c6f1ddSLingrui98 val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr 27509c6f1ddSLingrui98 276a60a2901SLingrui98 def carryPos = log2Ceil(PredictWidth)+instOffsetBits 27709c6f1ddSLingrui98 def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits) 27809c6f1ddSLingrui98 // if not hit, establish a new entry 27909c6f1ddSLingrui98 init_entry.valid := true.B 28009c6f1ddSLingrui98 // tag is left for ftb to assign 281eeb5ff92SLingrui98 282eeb5ff92SLingrui98 // case br 283eeb5ff92SLingrui98 val init_br_slot = init_entry.getSlotForBr(0) 284eeb5ff92SLingrui98 when (cfi_is_br) { 285eeb5ff92SLingrui98 init_br_slot.valid := true.B 286eeb5ff92SLingrui98 init_br_slot.offset := io.cfiIndex.bits 287b37e4b45SLingrui98 init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1) 288eeb5ff92SLingrui98 init_entry.always_taken(0) := true.B // set to always taken on init 289eeb5ff92SLingrui98 } 290eeb5ff92SLingrui98 291eeb5ff92SLingrui98 // case jmp 292eeb5ff92SLingrui98 when (entry_has_jmp) { 293eeb5ff92SLingrui98 init_entry.tailSlot.offset := pd.jmpOffset 294eeb5ff92SLingrui98 init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr 295eeb5ff92SLingrui98 init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false) 296eeb5ff92SLingrui98 } 297eeb5ff92SLingrui98 29809c6f1ddSLingrui98 val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U) 299a60a2901SLingrui98 init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr)) 300a60a2901SLingrui98 init_entry.carry := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B) 30109c6f1ddSLingrui98 init_entry.isJalr := new_jmp_is_jalr 30209c6f1ddSLingrui98 init_entry.isCall := new_jmp_is_call 30309c6f1ddSLingrui98 init_entry.isRet := new_jmp_is_ret 304f4ebc4b2SLingrui98 // that means fall thru points to the middle of an inst 305ae409b75SSteve Gou init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset) 30609c6f1ddSLingrui98 30709c6f1ddSLingrui98 // if hit, check whether a new cfi(only br is possible) is detected 30809c6f1ddSLingrui98 val oe = io.old_entry 309eeb5ff92SLingrui98 val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits) 31009c6f1ddSLingrui98 val br_recorded = br_recorded_vec.asUInt.orR 31109c6f1ddSLingrui98 val is_new_br = cfi_is_br && !br_recorded 31209c6f1ddSLingrui98 val new_br_offset = io.cfiIndex.bits 31309c6f1ddSLingrui98 // vec(i) means new br will be inserted BEFORE old br(i) 314eeb5ff92SLingrui98 val allBrSlotsVec = oe.allSlotsForBr 31509c6f1ddSLingrui98 val new_br_insert_onehot = VecInit((0 until numBr).map{ 31609c6f1ddSLingrui98 i => i match { 317eeb5ff92SLingrui98 case 0 => 318eeb5ff92SLingrui98 !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset 319eeb5ff92SLingrui98 case idx => 320eeb5ff92SLingrui98 allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset && 321eeb5ff92SLingrui98 (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset) 32209c6f1ddSLingrui98 } 32309c6f1ddSLingrui98 }) 32409c6f1ddSLingrui98 32509c6f1ddSLingrui98 val old_entry_modified = WireInit(io.old_entry) 32609c6f1ddSLingrui98 for (i <- 0 until numBr) { 327eeb5ff92SLingrui98 val slot = old_entry_modified.allSlotsForBr(i) 328eeb5ff92SLingrui98 when (new_br_insert_onehot(i)) { 329eeb5ff92SLingrui98 slot.valid := true.B 330eeb5ff92SLingrui98 slot.offset := new_br_offset 331b37e4b45SLingrui98 slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1) 332eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := true.B 333eeb5ff92SLingrui98 }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) { 334eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := false.B 335eeb5ff92SLingrui98 // all other fields remain unchanged 336eeb5ff92SLingrui98 }.otherwise { 337eeb5ff92SLingrui98 // case i == 0, remain unchanged 338eeb5ff92SLingrui98 if (i != 0) { 339b37e4b45SLingrui98 val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid 340eeb5ff92SLingrui98 when (!noNeedToMoveFromFormerSlot) { 341eeb5ff92SLingrui98 slot.fromAnotherSlot(oe.allSlotsForBr(i-1)) 342eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := oe.always_taken(i) 34309c6f1ddSLingrui98 } 344eeb5ff92SLingrui98 } 345eeb5ff92SLingrui98 } 346eeb5ff92SLingrui98 } 34709c6f1ddSLingrui98 348eeb5ff92SLingrui98 // two circumstances: 349eeb5ff92SLingrui98 // 1. oe: | br | j |, new br should be in front of j, thus addr of j should be new pft 350eeb5ff92SLingrui98 // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either 351eeb5ff92SLingrui98 // the previous last br or the new br 352eeb5ff92SLingrui98 val may_have_to_replace = oe.noEmptySlotForNewBr 353eeb5ff92SLingrui98 val pft_need_to_change = is_new_br && may_have_to_replace 35409c6f1ddSLingrui98 // it should either be the given last br or the new br 35509c6f1ddSLingrui98 when (pft_need_to_change) { 356eeb5ff92SLingrui98 val new_pft_offset = 357710a8720SLingrui98 Mux(!new_br_insert_onehot.asUInt.orR, 358710a8720SLingrui98 new_br_offset, oe.allSlotsForBr.last.offset) 359eeb5ff92SLingrui98 360710a8720SLingrui98 // set jmp to invalid 36109c6f1ddSLingrui98 old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset 36209c6f1ddSLingrui98 old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool 363f4ebc4b2SLingrui98 old_entry_modified.last_may_be_rvi_call := false.B 36409c6f1ddSLingrui98 old_entry_modified.isCall := false.B 36509c6f1ddSLingrui98 old_entry_modified.isRet := false.B 366eeb5ff92SLingrui98 old_entry_modified.isJalr := false.B 36709c6f1ddSLingrui98 } 36809c6f1ddSLingrui98 36909c6f1ddSLingrui98 val old_entry_jmp_target_modified = WireInit(oe) 370710a8720SLingrui98 val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits 371b37e4b45SLingrui98 val old_tail_is_jmp = !oe.tailSlot.sharing 372eeb5ff92SLingrui98 val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target 3733bcae573SLingrui98 when (jalr_target_modified) { 37409c6f1ddSLingrui98 old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target) 37509c6f1ddSLingrui98 old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool())) 37609c6f1ddSLingrui98 } 37709c6f1ddSLingrui98 37809c6f1ddSLingrui98 val old_entry_always_taken = WireInit(oe) 37909c6f1ddSLingrui98 val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not 38009c6f1ddSLingrui98 for (i <- 0 until numBr) { 38109c6f1ddSLingrui98 old_entry_always_taken.always_taken(i) := 38209c6f1ddSLingrui98 oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i) 383710a8720SLingrui98 always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i) 38409c6f1ddSLingrui98 } 38509c6f1ddSLingrui98 val always_taken_modified = always_taken_modified_vec.reduce(_||_) 38609c6f1ddSLingrui98 38709c6f1ddSLingrui98 38809c6f1ddSLingrui98 38909c6f1ddSLingrui98 val derived_from_old_entry = 39009c6f1ddSLingrui98 Mux(is_new_br, old_entry_modified, 3913bcae573SLingrui98 Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken)) 39209c6f1ddSLingrui98 39309c6f1ddSLingrui98 39409c6f1ddSLingrui98 io.new_entry := Mux(!hit, init_entry, derived_from_old_entry) 39509c6f1ddSLingrui98 39609c6f1ddSLingrui98 io.new_br_insert_pos := new_br_insert_onehot 39709c6f1ddSLingrui98 io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{ 39809c6f1ddSLingrui98 case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v 39909c6f1ddSLingrui98 }) 400803124a6SLingrui98 io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits 40109c6f1ddSLingrui98 for (i <- 0 until numBr) { 40209c6f1ddSLingrui98 io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i)) 40309c6f1ddSLingrui98 } 40409c6f1ddSLingrui98 io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset) 40509c6f1ddSLingrui98 40609c6f1ddSLingrui98 // for perf counters 40709c6f1ddSLingrui98 io.is_init_entry := !hit 4083bcae573SLingrui98 io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified 40909c6f1ddSLingrui98 io.is_new_br := hit && is_new_br 4103bcae573SLingrui98 io.is_jalr_target_modified := hit && jalr_target_modified 41109c6f1ddSLingrui98 io.is_always_taken_modified := hit && always_taken_modified 412eeb5ff92SLingrui98 io.is_br_full := hit && is_new_br && may_have_to_replace 41309c6f1ddSLingrui98} 41409c6f1ddSLingrui98 415c5c5edaeSJeniusclass FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo { 416c5c5edaeSJenius val io = IO(new Bundle { 417c5c5edaeSJenius val ifuPtr_w = Input(new FtqPtr) 418c5c5edaeSJenius val ifuPtrPlus1_w = Input(new FtqPtr) 4196bf9b30dSLingrui98 val ifuPtrPlus2_w = Input(new FtqPtr) 420b92f8445Sssszwic val pfPtr_w = Input(new FtqPtr) 421b92f8445Sssszwic val pfPtrPlus1_w = Input(new FtqPtr) 422c5c5edaeSJenius val commPtr_w = Input(new FtqPtr) 4236bf9b30dSLingrui98 val commPtrPlus1_w = Input(new FtqPtr) 424c5c5edaeSJenius val ifuPtr_rdata = Output(new Ftq_RF_Components) 425c5c5edaeSJenius val ifuPtrPlus1_rdata = Output(new Ftq_RF_Components) 4266bf9b30dSLingrui98 val ifuPtrPlus2_rdata = Output(new Ftq_RF_Components) 427b92f8445Sssszwic val pfPtr_rdata = Output(new Ftq_RF_Components) 428b92f8445Sssszwic val pfPtrPlus1_rdata = Output(new Ftq_RF_Components) 429c5c5edaeSJenius val commPtr_rdata = Output(new Ftq_RF_Components) 4306bf9b30dSLingrui98 val commPtrPlus1_rdata = Output(new Ftq_RF_Components) 431c5c5edaeSJenius 432c5c5edaeSJenius val wen = Input(Bool()) 433c5c5edaeSJenius val waddr = Input(UInt(log2Ceil(FtqSize).W)) 434c5c5edaeSJenius val wdata = Input(new Ftq_RF_Components) 435c5c5edaeSJenius }) 436c5c5edaeSJenius 4376bf9b30dSLingrui98 val num_pc_read = numOtherReads + 5 438c5c5edaeSJenius val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize, 43928f2cf58SLingrui98 num_pc_read, 1, "FtqPC")) 440c5c5edaeSJenius mem.io.wen(0) := io.wen 441c5c5edaeSJenius mem.io.waddr(0) := io.waddr 442c5c5edaeSJenius mem.io.wdata(0) := io.wdata 443c5c5edaeSJenius 4446bf9b30dSLingrui98 // read one cycle ahead for ftq local reads 445b92f8445Sssszwic val raddr_vec = VecInit(Seq(io.ifuPtr_w.value, io.ifuPtrPlus1_w.value, io.ifuPtrPlus2_w.value, 446b92f8445Sssszwic io.pfPtr_w.value, io.pfPtrPlus1_w.value, 447b92f8445Sssszwic io.commPtrPlus1_w.value, io.commPtr_w.value)) 448c5c5edaeSJenius 449c5c5edaeSJenius mem.io.raddr := raddr_vec 450c5c5edaeSJenius 451b92f8445Sssszwic io.ifuPtr_rdata := mem.io.rdata.dropRight(6).last 452b92f8445Sssszwic io.ifuPtrPlus1_rdata := mem.io.rdata.dropRight(5).last 453b92f8445Sssszwic io.ifuPtrPlus2_rdata := mem.io.rdata.dropRight(4).last 454b92f8445Sssszwic io.pfPtr_rdata := mem.io.rdata.dropRight(3).last 455b92f8445Sssszwic io.pfPtrPlus1_rdata := mem.io.rdata.dropRight(2).last 4566bf9b30dSLingrui98 io.commPtrPlus1_rdata := mem.io.rdata.dropRight(1).last 457c5c5edaeSJenius io.commPtr_rdata := mem.io.rdata.last 458c5c5edaeSJenius} 459c5c5edaeSJenius 46009c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper 461e30430c2SJay with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents 462e30430c2SJay with HasICacheParameters{ 46309c6f1ddSLingrui98 val io = IO(new Bundle { 46409c6f1ddSLingrui98 val fromBpu = Flipped(new BpuToFtqIO) 46509c6f1ddSLingrui98 val fromIfu = Flipped(new IfuToFtqIO) 46609c6f1ddSLingrui98 val fromBackend = Flipped(new CtrlToFtqIO) 46709c6f1ddSLingrui98 46809c6f1ddSLingrui98 val toBpu = new FtqToBpuIO 46909c6f1ddSLingrui98 val toIfu = new FtqToIfuIO 470c5c5edaeSJenius val toICache = new FtqToICacheIO 47109c6f1ddSLingrui98 val toBackend = new FtqToCtrlIO 472b92f8445Sssszwic val toPrefetch = new FtqToPrefetchIO 473b92f8445Sssszwic val icacheFlush = Output(Bool()) 4747052722fSJay 47509c6f1ddSLingrui98 val bpuInfo = new Bundle { 47609c6f1ddSLingrui98 val bpRight = Output(UInt(XLEN.W)) 47709c6f1ddSLingrui98 val bpWrong = Output(UInt(XLEN.W)) 47809c6f1ddSLingrui98 } 4791d1e6d4dSJenius 4801d1e6d4dSJenius val mmioCommitRead = Flipped(new mmioCommitRead) 481d2b20d1aSTang Haojin 482d2b20d1aSTang Haojin // for perf 483d2b20d1aSTang Haojin val ControlBTBMissBubble = Output(Bool()) 484d2b20d1aSTang Haojin val TAGEMissBubble = Output(Bool()) 485d2b20d1aSTang Haojin val SCMissBubble = Output(Bool()) 486d2b20d1aSTang Haojin val ITTAGEMissBubble = Output(Bool()) 487d2b20d1aSTang Haojin val RASMissBubble = Output(Bool()) 48809c6f1ddSLingrui98 }) 48909c6f1ddSLingrui98 io.bpuInfo := DontCare 49009c6f1ddSLingrui98 491d2b20d1aSTang Haojin val topdown_stage = RegInit(0.U.asTypeOf(new FrontendTopDownBundle)) 492d2b20d1aSTang Haojin // only driven by clock, not valid-ready 493d2b20d1aSTang Haojin topdown_stage := io.fromBpu.resp.bits.topdown_info 494d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info := topdown_stage 495d2b20d1aSTang Haojin 496d2b20d1aSTang Haojin val ifuRedirected = RegInit(VecInit(Seq.fill(FtqSize)(false.B))) 497d2b20d1aSTang Haojin 498bace178aSGao-Zeyu 49942dddaceSXuan Hu // io.fromBackend.ftqIdxAhead: bju(BjuCnt) + ldReplay + exception 50042dddaceSXuan Hu val ftqIdxAhead = VecInit(Seq.tabulate(FtqRedirectAheadNum)(i => io.fromBackend.ftqIdxAhead(i))) // only bju 50142dddaceSXuan Hu val ftqIdxSelOH = io.fromBackend.ftqIdxSelOH.bits(FtqRedirectAheadNum - 1, 0) 502bace178aSGao-Zeyu 503bace178aSGao-Zeyu val aheadValid = ftqIdxAhead.map(_.valid).reduce(_|_) && !io.fromBackend.redirect.valid 504bace178aSGao-Zeyu val realAhdValid = io.fromBackend.redirect.valid && (ftqIdxSelOH > 0.U) && RegNext(aheadValid) 505d2b20d1aSTang Haojin val backendRedirect = Wire(Valid(new BranchPredictionRedirect)) 5061c6fc24aSEaston Man val backendRedirectReg = Wire(Valid(new BranchPredictionRedirect)) 5071c6fc24aSEaston Man backendRedirectReg.valid := RegNext(Mux(realAhdValid, false.B, backendRedirect.valid)) 5081c6fc24aSEaston Man backendRedirectReg.bits := RegEnable(backendRedirect.bits, backendRedirect.valid) 509bace178aSGao-Zeyu val fromBackendRedirect = Wire(Valid(new BranchPredictionRedirect)) 510bace178aSGao-Zeyu fromBackendRedirect := Mux(realAhdValid, backendRedirect, backendRedirectReg) 51109c6f1ddSLingrui98 512df5b4b8eSYinan Xu val stage2Flush = backendRedirect.valid 51309c6f1ddSLingrui98 val backendFlush = stage2Flush || RegNext(stage2Flush) 51409c6f1ddSLingrui98 val ifuFlush = Wire(Bool()) 51509c6f1ddSLingrui98 51609c6f1ddSLingrui98 val flush = stage2Flush || RegNext(stage2Flush) 51709c6f1ddSLingrui98 51809c6f1ddSLingrui98 val allowBpuIn, allowToIfu = WireInit(false.B) 51909c6f1ddSLingrui98 val flushToIfu = !allowToIfu 520bace178aSGao-Zeyu allowBpuIn := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid 521bace178aSGao-Zeyu allowToIfu := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid 52209c6f1ddSLingrui98 523f56177cbSJenius def copyNum = 5 524b92f8445Sssszwic val bpuPtr, ifuPtr, pfPtr, ifuWbPtr, commPtr, robCommPtr = RegInit(FtqPtr(false.B, 0.U)) 525c9bc5480SLingrui98 val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U)) 5266bf9b30dSLingrui98 val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U)) 527b92f8445Sssszwic val pfPtrPlus1 = RegInit(FtqPtr(false.B, 1.U)) 5286bf9b30dSLingrui98 val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U)) 529f56177cbSJenius val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U))) 530dc270d3bSJenius val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U))) 5316bf9b30dSLingrui98 require(FtqSize >= 4) 532c5c5edaeSJenius val ifuPtr_write = WireInit(ifuPtr) 533c5c5edaeSJenius val ifuPtrPlus1_write = WireInit(ifuPtrPlus1) 5346bf9b30dSLingrui98 val ifuPtrPlus2_write = WireInit(ifuPtrPlus2) 535b92f8445Sssszwic val pfPtr_write = WireInit(pfPtr) 536b92f8445Sssszwic val pfPtrPlus1_write = WireInit(pfPtrPlus1) 537c5c5edaeSJenius val ifuWbPtr_write = WireInit(ifuWbPtr) 538c5c5edaeSJenius val commPtr_write = WireInit(commPtr) 5396bf9b30dSLingrui98 val commPtrPlus1_write = WireInit(commPtrPlus1) 54089cc69c1STang Haojin val robCommPtr_write = WireInit(robCommPtr) 541c5c5edaeSJenius ifuPtr := ifuPtr_write 542c5c5edaeSJenius ifuPtrPlus1 := ifuPtrPlus1_write 5436bf9b30dSLingrui98 ifuPtrPlus2 := ifuPtrPlus2_write 544b92f8445Sssszwic pfPtr := pfPtr_write 545b92f8445Sssszwic pfPtrPlus1 := pfPtrPlus1_write 546c5c5edaeSJenius ifuWbPtr := ifuWbPtr_write 547c5c5edaeSJenius commPtr := commPtr_write 548f83ef67eSLingrui98 commPtrPlus1 := commPtrPlus1_write 549f56177cbSJenius copied_ifu_ptr.map{ptr => 550f56177cbSJenius ptr := ifuPtr_write 551f56177cbSJenius dontTouch(ptr) 552f56177cbSJenius } 55389cc69c1STang Haojin robCommPtr := robCommPtr_write 55409c6f1ddSLingrui98 val validEntries = distanceBetween(bpuPtr, commPtr) 55543aca6c2SGuokai Chen val canCommit = Wire(Bool()) 55609c6f1ddSLingrui98 557c1b28b66STang Haojin // Instruction page fault and instruction access fault are sent from backend with redirect requests. 558c1b28b66STang Haojin // When IPF and IAF are sent, backendPcFaultIfuPtr points to the FTQ entry whose first instruction 559c1b28b66STang Haojin // raises IPF or IAF, which is ifuWbPtr_write or IfuPtr_write. 560c1b28b66STang Haojin // Only when IFU has written back that FTQ entry can backendIpf and backendIaf be false because this 561c1b28b66STang Haojin // makes sure that IAF and IPF are correctly raised instead of being flushed by redirect requests. 562c1b28b66STang Haojin val backendIpf = RegInit(false.B) 563c1b28b66STang Haojin val backendIgpf = RegInit(false.B) 564c1b28b66STang Haojin val backendIaf = RegInit(false.B) 565c1b28b66STang Haojin val backendPcFaultPtr = RegInit(FtqPtr(false.B, 0.U)) 566c1b28b66STang Haojin when (fromBackendRedirect.valid) { 567c1b28b66STang Haojin backendIpf := fromBackendRedirect.bits.cfiUpdate.backendIPF 568c1b28b66STang Haojin backendIgpf := fromBackendRedirect.bits.cfiUpdate.backendIGPF 569c1b28b66STang Haojin backendIaf := fromBackendRedirect.bits.cfiUpdate.backendIAF 570c1b28b66STang Haojin when (fromBackendRedirect.bits.cfiUpdate.backendIPF || fromBackendRedirect.bits.cfiUpdate.backendIGPF || fromBackendRedirect.bits.cfiUpdate.backendIAF) { 571c1b28b66STang Haojin backendPcFaultPtr := ifuWbPtr_write 572c1b28b66STang Haojin } 573c1b28b66STang Haojin } .elsewhen (ifuWbPtr =/= backendPcFaultPtr) { 574c1b28b66STang Haojin backendIpf := false.B 575c1b28b66STang Haojin backendIgpf := false.B 576c1b28b66STang Haojin backendIaf := false.B 577c1b28b66STang Haojin } 578c1b28b66STang Haojin 57909c6f1ddSLingrui98 // ********************************************************************** 58009c6f1ddSLingrui98 // **************************** enq from bpu **************************** 58109c6f1ddSLingrui98 // ********************************************************************** 58243aca6c2SGuokai Chen val new_entry_ready = validEntries < FtqSize.U || canCommit 58309c6f1ddSLingrui98 io.fromBpu.resp.ready := new_entry_ready 58409c6f1ddSLingrui98 58509c6f1ddSLingrui98 val bpu_s2_resp = io.fromBpu.resp.bits.s2 586cb4f77ceSLingrui98 val bpu_s3_resp = io.fromBpu.resp.bits.s3 587adc0b8dfSGuokai Chen val bpu_s2_redirect = bpu_s2_resp.valid(3) && bpu_s2_resp.hasRedirect(3) 588adc0b8dfSGuokai Chen val bpu_s3_redirect = bpu_s3_resp.valid(3) && bpu_s3_resp.hasRedirect(3) 58909c6f1ddSLingrui98 59009c6f1ddSLingrui98 io.toBpu.enq_ptr := bpuPtr 591935edac4STang Haojin val enq_fire = io.fromBpu.resp.fire && allowBpuIn // from bpu s1 592935edac4STang Haojin val bpu_in_fire = (io.fromBpu.resp.fire || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn 59309c6f1ddSLingrui98 594b37e4b45SLingrui98 val bpu_in_resp = io.fromBpu.resp.bits.selectedResp 595adc0b8dfSGuokai Chen val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdxForFtq 59609c6f1ddSLingrui98 val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx) 59709c6f1ddSLingrui98 val bpu_in_resp_idx = bpu_in_resp_ptr.value 59809c6f1ddSLingrui98 599b92f8445Sssszwic // read ports: pfReq1 + pfReq2 ++ ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate 600b92f8445Sssszwic val ftq_pc_mem = Module(new FtqPcMemWrapper(2)) 6016bf9b30dSLingrui98 // resp from uBTB 602c5c5edaeSJenius ftq_pc_mem.io.wen := bpu_in_fire 603c5c5edaeSJenius ftq_pc_mem.io.waddr := bpu_in_resp_idx 604c5c5edaeSJenius ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp) 60509c6f1ddSLingrui98 60609c6f1ddSLingrui98 // ifuRedirect + backendRedirect + commit 60716a171eeSEaston Man val ftq_redirect_mem = Module(new SyncDataModuleTemplate(new Ftq_Redirect_SRAMEntry, 60895a47398SGao-Zeyu FtqSize, IfuRedirectNum+FtqRedirectAheadNum+1, 1, hasRen = true)) 60909c6f1ddSLingrui98 // these info is intended to enq at the last stage of bpu 610deb3a97eSGao-Zeyu ftq_redirect_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid(3) 611deb3a97eSGao-Zeyu ftq_redirect_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value 612deb3a97eSGao-Zeyu ftq_redirect_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_spec_info 613deb3a97eSGao-Zeyu println(f"ftq redirect MEM: entry ${ftq_redirect_mem.io.wdata(0).getWidth} * ${FtqSize} * 3") 61409c6f1ddSLingrui98 61509c6f1ddSLingrui98 val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1)) 61609c6f1ddSLingrui98 // these info is intended to enq at the last stage of bpu 617adc0b8dfSGuokai Chen ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid(3) 61809c6f1ddSLingrui98 ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value 619c2d1ec7dSLingrui98 ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta 620deb3a97eSGao-Zeyu ftq_meta_1r_sram.io.wdata.ftb_entry := io.fromBpu.resp.bits.last_stage_ftb_entry 62195a47398SGao-Zeyu // ifuRedirect + backendRedirect (commit moved to ftq_meta_1r_sram) 622241781f0SEaston Man val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry_FtqMem, 62395a47398SGao-Zeyu FtqSize, IfuRedirectNum+FtqRedirectAheadNum, 1, hasRen = true)) 624adc0b8dfSGuokai Chen ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid(3) 62509c6f1ddSLingrui98 ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value 626c2d1ec7dSLingrui98 ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry 62709c6f1ddSLingrui98 62809c6f1ddSLingrui98 62909c6f1ddSLingrui98 // multi-write 630b0ed7239SLingrui98 val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this 6316bf9b30dSLingrui98 val newest_entry_target = Reg(UInt(VAddrBits.W)) 6321c6fc24aSEaston Man val newest_entry_target_modified = RegInit(false.B) 6336bf9b30dSLingrui98 val newest_entry_ptr = Reg(new FtqPtr) 6341c6fc24aSEaston Man val newest_entry_ptr_modified = RegInit(false.B) 63509c6f1ddSLingrui98 val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)))) 63609c6f1ddSLingrui98 val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool()))) 63709c6f1ddSLingrui98 val pred_stage = Reg(Vec(FtqSize, UInt(2.W))) 638209a4cafSSteve Gou val pred_s1_cycle = if (!env.FPGAPlatform) Some(Reg(Vec(FtqSize, UInt(64.W)))) else None 63909c6f1ddSLingrui98 64091346769SMuzi val c_empty :: c_toCommit :: c_committed :: c_flushed :: Nil = Enum(4) 6411c6fc24aSEaston Man val commitStateQueueReg = RegInit(VecInit(Seq.fill(FtqSize) { 64291346769SMuzi VecInit(Seq.fill(PredictWidth)(c_empty)) 64309c6f1ddSLingrui98 })) 6441c6fc24aSEaston Man val commitStateQueueEnable = WireInit(VecInit(Seq.fill(FtqSize)(false.B))) 6451c6fc24aSEaston Man val commitStateQueueNext = WireInit(commitStateQueueReg) 6461c6fc24aSEaston Man 6471c6fc24aSEaston Man for (f <- 0 until FtqSize) { 6481c6fc24aSEaston Man when(commitStateQueueEnable(f)) { 6491c6fc24aSEaston Man commitStateQueueReg(f) := commitStateQueueNext(f) 6501c6fc24aSEaston Man } 6511c6fc24aSEaston Man } 65209c6f1ddSLingrui98 65309c6f1ddSLingrui98 val f_to_send :: f_sent :: Nil = Enum(2) 65409c6f1ddSLingrui98 val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent))) 65509c6f1ddSLingrui98 65609c6f1ddSLingrui98 val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3) 65709c6f1ddSLingrui98 val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit))) 65809c6f1ddSLingrui98 659f63797a4SLingrui98 // modify registers one cycle later to cut critical path 660f63797a4SLingrui98 val last_cycle_bpu_in = RegNext(bpu_in_fire) 6611c6fc24aSEaston Man val last_cycle_bpu_in_ptr = RegEnable(bpu_in_resp_ptr, bpu_in_fire) 6626bf9b30dSLingrui98 val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value 6631c6fc24aSEaston Man val last_cycle_bpu_target = RegEnable(bpu_in_resp.getTarget(3), bpu_in_fire) 6641c6fc24aSEaston Man val last_cycle_cfiIndex = RegEnable(bpu_in_resp.cfiIndex(3), bpu_in_fire) 6651c6fc24aSEaston Man val last_cycle_bpu_in_stage = RegEnable(bpu_in_stage, bpu_in_fire) 666f56177cbSJenius 6677be982afSLingrui98 def extra_copyNum_for_commitStateQueue = 2 6681c6fc24aSEaston Man val copied_last_cycle_bpu_in = 6691c6fc24aSEaston Man VecInit(Seq.fill(copyNum + extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire))) 6701c6fc24aSEaston Man val copied_last_cycle_bpu_in_ptr_for_ftq = 6711c6fc24aSEaston Man VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegEnable(bpu_in_resp_ptr, bpu_in_fire))) 672f56177cbSJenius 6731c6fc24aSEaston Man newest_entry_target_modified := false.B 6741c6fc24aSEaston Man newest_entry_ptr_modified := false.B 675f63797a4SLingrui98 when (last_cycle_bpu_in) { 676f63797a4SLingrui98 entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send 677f63797a4SLingrui98 cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex 678f63797a4SLingrui98 pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage 6796bf9b30dSLingrui98 680b0ed7239SLingrui98 update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this 6811c6fc24aSEaston Man newest_entry_target_modified := true.B 6826bf9b30dSLingrui98 newest_entry_target := last_cycle_bpu_target 6831c6fc24aSEaston Man newest_entry_ptr_modified := true.B 6846bf9b30dSLingrui98 newest_entry_ptr := last_cycle_bpu_in_ptr 68509c6f1ddSLingrui98 } 68609c6f1ddSLingrui98 6877be982afSLingrui98 // reduce fanout by delay write for a cycle 6887be982afSLingrui98 when (RegNext(last_cycle_bpu_in)) { 6891c6fc24aSEaston Man mispredict_vec(RegEnable(last_cycle_bpu_in_idx, last_cycle_bpu_in)) := 6901c6fc24aSEaston Man WireInit(VecInit(Seq.fill(PredictWidth)(false.B))) 6917be982afSLingrui98 } 6927be982afSLingrui98 693209a4cafSSteve Gou // record s1 pred cycles 694209a4cafSSteve Gou pred_s1_cycle.map(vec => { 695209a4cafSSteve Gou when (bpu_in_fire && (bpu_in_stage === BP_S1)) { 696209a4cafSSteve Gou vec(bpu_in_resp_ptr.value) := bpu_in_resp.full_pred(0).predCycle.getOrElse(0.U) 697209a4cafSSteve Gou } 698209a4cafSSteve Gou }) 699209a4cafSSteve Gou 7007be982afSLingrui98 // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr 7017be982afSLingrui98 val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue) 7027be982afSLingrui98 copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map { 7037be982afSLingrui98 case ((in, ptr), i) => 7047be982afSLingrui98 when (in) { 7057be982afSLingrui98 val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32 7067be982afSLingrui98 require(FtqSize % extra_copyNum_for_commitStateQueue == 0) 7077be982afSLingrui98 for (j <- 0 until perSetEntries) { 7089361b0c5SLingrui98 when (ptr.value === (i * perSetEntries + j).U) { 70991346769SMuzi commitStateQueueNext(i * perSetEntries + j) := VecInit(Seq.fill(PredictWidth)(c_empty)) 7101c6fc24aSEaston Man // Clock gating optimization, use 1 gate cell to control a row 7111c6fc24aSEaston Man commitStateQueueEnable(i * perSetEntries + j) := true.B 7127be982afSLingrui98 } 7137be982afSLingrui98 } 7147be982afSLingrui98 } 7159361b0c5SLingrui98 } 7167be982afSLingrui98 71709c6f1ddSLingrui98 bpuPtr := bpuPtr + enq_fire 718dc270d3bSJenius copied_bpu_ptr.map(_ := bpuPtr + enq_fire) 719c9bc5480SLingrui98 when (io.toIfu.req.fire && allowToIfu) { 720c5c5edaeSJenius ifuPtr_write := ifuPtrPlus1 7216bf9b30dSLingrui98 ifuPtrPlus1_write := ifuPtrPlus2 7226bf9b30dSLingrui98 ifuPtrPlus2_write := ifuPtrPlus2 + 1.U 723c9bc5480SLingrui98 } 724b92f8445Sssszwic when (io.toPrefetch.req.fire && allowToIfu) { 725b92f8445Sssszwic pfPtr_write := pfPtrPlus1 726b92f8445Sssszwic pfPtrPlus1_write := pfPtrPlus1 + 1.U 727b92f8445Sssszwic } 72809c6f1ddSLingrui98 72909c6f1ddSLingrui98 // only use ftb result to assign hit status 730adc0b8dfSGuokai Chen when (bpu_s2_resp.valid(3)) { 731adc0b8dfSGuokai Chen entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred(3).hit, h_hit, h_not_hit) 73209c6f1ddSLingrui98 } 73309c6f1ddSLingrui98 73409c6f1ddSLingrui98 7352f4a3aa4SLingrui98 io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect 73609c6f1ddSLingrui98 io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx 737b92f8445Sssszwic io.toPrefetch.flushFromBpu.s2.valid := bpu_s2_redirect 738b92f8445Sssszwic io.toPrefetch.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx 739adc0b8dfSGuokai Chen when (bpu_s2_redirect) { 74009c6f1ddSLingrui98 bpuPtr := bpu_s2_resp.ftq_idx + 1.U 741dc270d3bSJenius copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U) 74209c6f1ddSLingrui98 // only when ifuPtr runs ahead of bpu s2 resp should we recover it 74309c6f1ddSLingrui98 when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) { 744c5c5edaeSJenius ifuPtr_write := bpu_s2_resp.ftq_idx 745c5c5edaeSJenius ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U 7466bf9b30dSLingrui98 ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U 74709c6f1ddSLingrui98 } 748b92f8445Sssszwic when (!isBefore(pfPtr, bpu_s2_resp.ftq_idx)) { 749b92f8445Sssszwic pfPtr_write := bpu_s2_resp.ftq_idx 750b92f8445Sssszwic pfPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U 751b92f8445Sssszwic } 75209c6f1ddSLingrui98 } 75309c6f1ddSLingrui98 754cb4f77ceSLingrui98 io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect 755cb4f77ceSLingrui98 io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx 756b92f8445Sssszwic io.toPrefetch.flushFromBpu.s3.valid := bpu_s3_redirect 757b92f8445Sssszwic io.toPrefetch.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx 758adc0b8dfSGuokai Chen when (bpu_s3_redirect) { 759cb4f77ceSLingrui98 bpuPtr := bpu_s3_resp.ftq_idx + 1.U 760dc270d3bSJenius copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U) 761cb4f77ceSLingrui98 // only when ifuPtr runs ahead of bpu s2 resp should we recover it 762cb4f77ceSLingrui98 when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) { 763c5c5edaeSJenius ifuPtr_write := bpu_s3_resp.ftq_idx 764c5c5edaeSJenius ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U 7656bf9b30dSLingrui98 ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U 766cb4f77ceSLingrui98 } 767b92f8445Sssszwic when (!isBefore(pfPtr, bpu_s3_resp.ftq_idx)) { 768b92f8445Sssszwic pfPtr_write := bpu_s3_resp.ftq_idx 769b92f8445Sssszwic pfPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U 770b92f8445Sssszwic } 771cb4f77ceSLingrui98 } 772cb4f77ceSLingrui98 77309c6f1ddSLingrui98 XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n") 774b92f8445Sssszwic XSError(isBefore(bpuPtr, pfPtr) && !isFull(bpuPtr, pfPtr), "\npfPtr is before bpuPtr!\n") 7752448f137SGuokai Chen XSError(isBefore(ifuWbPtr, commPtr) && !isFull(ifuWbPtr, commPtr), "\ncommPtr is before ifuWbPtr!\n") 77609c6f1ddSLingrui98 777dc270d3bSJenius (0 until copyNum).map{i => 778dc270d3bSJenius XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n") 779dc270d3bSJenius } 780dc270d3bSJenius 78109c6f1ddSLingrui98 // **************************************************************** 78209c6f1ddSLingrui98 // **************************** to ifu **************************** 78309c6f1ddSLingrui98 // **************************************************************** 784f22cf846SJenius // 0 for ifu, and 1-4 for ICache 785935edac4STang Haojin val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire) 786935edac4STang Haojin val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire))) 787f56177cbSJenius val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf 7881c6fc24aSEaston Man val bpu_in_bypass_ptr = RegEnable(bpu_in_resp_ptr, bpu_in_fire) 78909c6f1ddSLingrui98 val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire) 790b92f8445Sssszwic val last_cycle_to_pf_fire = RegNext(io.toPrefetch.req.fire) 79109c6f1ddSLingrui98 7921c6fc24aSEaston Man val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegEnable(bpu_in_resp_ptr, bpu_in_fire))) 793f56177cbSJenius val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire))) 79488bc4f90SLingrui98 79509c6f1ddSLingrui98 // read pc and target 7966bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtr_w := ifuPtr_write 7976bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtrPlus1_w := ifuPtrPlus1_write 7986bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtrPlus2_w := ifuPtrPlus2_write 799b92f8445Sssszwic ftq_pc_mem.io.pfPtr_w := pfPtr_write 800b92f8445Sssszwic ftq_pc_mem.io.pfPtrPlus1_w := pfPtrPlus1_write 8016bf9b30dSLingrui98 ftq_pc_mem.io.commPtr_w := commPtr_write 8026bf9b30dSLingrui98 ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write 803c5c5edaeSJenius 80409c6f1ddSLingrui98 8055ff19bd8SLingrui98 io.toIfu.req.bits.ftqIdx := ifuPtr 806f63797a4SLingrui98 807f56177cbSJenius val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components)) 808dc270d3bSJenius val toICacheEntryToSend = Wire(Vec(copyNum,Bool())) 809*3e1dbb17SMuzi val nextCycleToPrefetchPcBundle = Wire(new Ftq_RF_Components) 810*3e1dbb17SMuzi val nextCycleToPrefetchEntryToSend = Wire(Bool()) 811*3e1dbb17SMuzi val toPrefetchPcBundle = RegNext(nextCycleToPrefetchPcBundle) 812*3e1dbb17SMuzi val toPrefetchEntryToSend = RegNext(nextCycleToPrefetchEntryToSend) 813b37e4b45SLingrui98 val toIfuPcBundle = Wire(new Ftq_RF_Components) 814f63797a4SLingrui98 val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send) 815f63797a4SLingrui98 val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value)) 8166bf9b30dSLingrui98 val entry_next_addr = Wire(UInt(VAddrBits.W)) 817b004fa13SJenius 818f56177cbSJenius val pc_mem_ifu_ptr_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata))) 819f56177cbSJenius val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata))) 820b0ed7239SLingrui98 val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this 821f63797a4SLingrui98 822dc270d3bSJenius val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)))) 823dc270d3bSJenius val copied_ifu_ptr_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr))) 824dc270d3bSJenius 825f56177cbSJenius for(i <- 0 until copyNum){ 826f56177cbSJenius when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){ 827f56177cbSJenius toICachePcBundle(i) := copied_bpu_in_bypass_buf(i) 828dc270d3bSJenius toICacheEntryToSend(i) := true.B 829f56177cbSJenius }.elsewhen(copied_last_cycle_to_ifu_fire(i)){ 830f56177cbSJenius toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i) 831dc270d3bSJenius toICacheEntryToSend(i) := copied_ifu_plus1_to_send(i) 832f56177cbSJenius }.otherwise{ 833f56177cbSJenius toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i) 834dc270d3bSJenius toICacheEntryToSend(i) := copied_ifu_ptr_to_send(i) 835f56177cbSJenius } 836f56177cbSJenius } 837f56177cbSJenius 838*3e1dbb17SMuzi // Calculate requests sent to prefetcher one cycle in advance to cut critical path 839*3e1dbb17SMuzi when(bpu_in_fire && bpu_in_resp_ptr === pfPtr_write) { 840*3e1dbb17SMuzi nextCycleToPrefetchPcBundle := ftq_pc_mem.io.wdata 841*3e1dbb17SMuzi nextCycleToPrefetchEntryToSend := true.B 842*3e1dbb17SMuzi }.elsewhen(io.toPrefetch.req.fire) { 843*3e1dbb17SMuzi nextCycleToPrefetchPcBundle := ftq_pc_mem.io.pfPtrPlus1_rdata 844*3e1dbb17SMuzi nextCycleToPrefetchEntryToSend := entry_fetch_status(pfPtrPlus1.value) === f_to_send || 845*3e1dbb17SMuzi last_cycle_bpu_in && bpu_in_bypass_ptr === pfPtrPlus1 846b92f8445Sssszwic }.otherwise { 847*3e1dbb17SMuzi nextCycleToPrefetchPcBundle := ftq_pc_mem.io.pfPtr_rdata 848*3e1dbb17SMuzi nextCycleToPrefetchEntryToSend := entry_fetch_status(pfPtr.value) === f_to_send || 849*3e1dbb17SMuzi last_cycle_bpu_in && bpu_in_bypass_ptr === pfPtr // reduce potential bubbles 850b92f8445Sssszwic } 851b92f8445Sssszwic 852873dc383SLingrui98 // TODO: reconsider target address bypass logic 85309c6f1ddSLingrui98 when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) { 85488bc4f90SLingrui98 toIfuPcBundle := bpu_in_bypass_buf_for_ifu 855f678dd91SSteve Gou entry_is_to_send := true.B 8566bf9b30dSLingrui98 entry_next_addr := last_cycle_bpu_target 857f63797a4SLingrui98 entry_ftq_offset := last_cycle_cfiIndex 858b0ed7239SLingrui98 diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this 85909c6f1ddSLingrui98 }.elsewhen (last_cycle_to_ifu_fire) { 860c5c5edaeSJenius toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata) 861c5c5edaeSJenius entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || 862c5c5edaeSJenius RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles 863ed434d67SLingrui98 entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1), 86488bc4f90SLingrui98 bpu_in_bypass_buf_for_ifu.startAddr, 865fef810c0SLingrui98 Mux(ifuPtr === newest_entry_ptr, 8666bf9b30dSLingrui98 newest_entry_target, 867f83ef67eSLingrui98 RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2 868c5c5edaeSJenius }.otherwise { 869c5c5edaeSJenius toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata) 87028f2cf58SLingrui98 entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || 87128f2cf58SLingrui98 RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles 8726bf9b30dSLingrui98 entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1), 87388bc4f90SLingrui98 bpu_in_bypass_buf_for_ifu.startAddr, 874fef810c0SLingrui98 Mux(ifuPtr === newest_entry_ptr, 8756bf9b30dSLingrui98 newest_entry_target, 876f83ef67eSLingrui98 RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1 87709c6f1ddSLingrui98 } 87809c6f1ddSLingrui98 879f678dd91SSteve Gou io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr 880f63797a4SLingrui98 io.toIfu.req.bits.nextStartAddr := entry_next_addr 881f63797a4SLingrui98 io.toIfu.req.bits.ftqOffset := entry_ftq_offset 882b37e4b45SLingrui98 io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle) 883c5c5edaeSJenius 884c5c5edaeSJenius io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr 885dc270d3bSJenius io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)} 886b92f8445Sssszwic io.toICache.req.bits.pcMemRead.zipWithIndex.foreach{case(copy,i) => 887b92f8445Sssszwic copy.fromFtqPcBundle(toICachePcBundle(i)) 888b92f8445Sssszwic copy.ftqIdx := ifuPtr 889b92f8445Sssszwic } 890c1b28b66STang Haojin io.toICache.req.bits.backendIpf := backendIpf && backendPcFaultPtr === ifuPtr 891c1b28b66STang Haojin io.toICache.req.bits.backendIgpf := backendIgpf && backendPcFaultPtr === ifuPtr 892c1b28b66STang Haojin io.toICache.req.bits.backendIaf := backendIaf && backendPcFaultPtr === ifuPtr 893b92f8445Sssszwic 894b92f8445Sssszwic io.toPrefetch.req.valid := toPrefetchEntryToSend && pfPtr =/= bpuPtr 895b92f8445Sssszwic io.toPrefetch.req.bits.fromFtqPcBundle(toPrefetchPcBundle) 896b92f8445Sssszwic io.toPrefetch.req.bits.ftqIdx := pfPtr 897b004fa13SJenius // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr 898b004fa13SJenius // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) => 899b004fa13SJenius // bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr 900b004fa13SJenius // bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr 901b004fa13SJenius // } 902f22cf846SJenius 903b0ed7239SLingrui98 // TODO: remove this 904b0ed7239SLingrui98 XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr, 9055a674179SLingrui98 p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n") 906b0ed7239SLingrui98 90709c6f1ddSLingrui98 // when fall through is smaller in value than start address, there must be a false hit 908b37e4b45SLingrui98 when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) { 90909c6f1ddSLingrui98 when (io.toIfu.req.fire && 910cb4f77ceSLingrui98 !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && 911cb4f77ceSLingrui98 !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr) 91209c6f1ddSLingrui98 ) { 91309c6f1ddSLingrui98 entry_hit_status(ifuPtr.value) := h_false_hit 914352db50aSLingrui98 // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr) 91509c6f1ddSLingrui98 } 916b37e4b45SLingrui98 XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr) 91709c6f1ddSLingrui98 } 91809c6f1ddSLingrui98 919a60a2901SLingrui98 XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit && 920a60a2901SLingrui98 io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)) 921a60a2901SLingrui98 92209c6f1ddSLingrui98 val ifu_req_should_be_flushed = 923cb4f77ceSLingrui98 io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) || 924cb4f77ceSLingrui98 io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx) 92509c6f1ddSLingrui98 92609c6f1ddSLingrui98 when (io.toIfu.req.fire && !ifu_req_should_be_flushed) { 92709c6f1ddSLingrui98 entry_fetch_status(ifuPtr.value) := f_sent 92809c6f1ddSLingrui98 } 92909c6f1ddSLingrui98 93009c6f1ddSLingrui98 // ********************************************************************* 93109c6f1ddSLingrui98 // **************************** wb from ifu **************************** 93209c6f1ddSLingrui98 // ********************************************************************* 93309c6f1ddSLingrui98 val pdWb = io.fromIfu.pdWb 93409c6f1ddSLingrui98 val pds = pdWb.bits.pd 93509c6f1ddSLingrui98 val ifu_wb_valid = pdWb.valid 93609c6f1ddSLingrui98 val ifu_wb_idx = pdWb.bits.ftqIdx.value 93709c6f1ddSLingrui98 // read ports: commit update 938c776f0d5Smy-mayfly val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, FtqRedirectAheadNum+1, 1, hasRen = true)) 93909c6f1ddSLingrui98 ftq_pd_mem.io.wen(0) := ifu_wb_valid 94009c6f1ddSLingrui98 ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value 94109c6f1ddSLingrui98 ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits) 94209c6f1ddSLingrui98 94309c6f1ddSLingrui98 val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid 94409c6f1ddSLingrui98 val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid 94509c6f1ddSLingrui98 val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B) 946005e809bSJiuyang Liu val pd_reg = RegEnable(pds, pdWb.valid) 947005e809bSJiuyang Liu val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid) 948005e809bSJiuyang Liu val wb_idx_reg = RegEnable(ifu_wb_idx, pdWb.valid) 94909c6f1ddSLingrui98 95009c6f1ddSLingrui98 when (ifu_wb_valid) { 95109c6f1ddSLingrui98 val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{ 95209c6f1ddSLingrui98 case (v, inRange) => v && inRange 95309c6f1ddSLingrui98 }) 9541c6fc24aSEaston Man commitStateQueueEnable(ifu_wb_idx) := true.B 9551c6fc24aSEaston Man (commitStateQueueNext(ifu_wb_idx) zip comm_stq_wen).map { 9561c6fc24aSEaston Man case (qe, v) => when(v) { 95791346769SMuzi qe := c_toCommit 9581c6fc24aSEaston Man } 95909c6f1ddSLingrui98 } 96009c6f1ddSLingrui98 } 96109c6f1ddSLingrui98 962c5c5edaeSJenius when (ifu_wb_valid) { 963c5c5edaeSJenius ifuWbPtr_write := ifuWbPtr + 1.U 964c5c5edaeSJenius } 96509c6f1ddSLingrui98 966f21bbcb2SGuokai Chen XSError(ifu_wb_valid && isAfter(pdWb.bits.ftqIdx, ifuPtr), "IFU returned a predecode before its req, check IFU") 967f21bbcb2SGuokai Chen 9681c6fc24aSEaston Man ftb_entry_mem.io.ren.get.head := ifu_wb_valid 96909c6f1ddSLingrui98 ftb_entry_mem.io.raddr.head := ifu_wb_idx 97009c6f1ddSLingrui98 val has_false_hit = WireInit(false.B) 97109c6f1ddSLingrui98 when (RegNext(hit_pd_valid)) { 97209c6f1ddSLingrui98 // check for false hit 97309c6f1ddSLingrui98 val pred_ftb_entry = ftb_entry_mem.io.rdata.head 974eeb5ff92SLingrui98 val brSlots = pred_ftb_entry.brSlots 975eeb5ff92SLingrui98 val tailSlot = pred_ftb_entry.tailSlot 97609c6f1ddSLingrui98 // we check cfis that bpu predicted 97709c6f1ddSLingrui98 978eeb5ff92SLingrui98 // bpu predicted branches but denied by predecode 979eeb5ff92SLingrui98 val br_false_hit = 980eeb5ff92SLingrui98 brSlots.map{ 981eeb5ff92SLingrui98 s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr) 982eeb5ff92SLingrui98 }.reduce(_||_) || 983b37e4b45SLingrui98 (tailSlot.valid && pred_ftb_entry.tailSlot.sharing && 984eeb5ff92SLingrui98 !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr)) 985eeb5ff92SLingrui98 986eeb5ff92SLingrui98 val jmpOffset = tailSlot.offset 98709c6f1ddSLingrui98 val jmp_pd = pd_reg(jmpOffset) 98809c6f1ddSLingrui98 val jal_false_hit = pred_ftb_entry.jmpValid && 98909c6f1ddSLingrui98 ((pred_ftb_entry.isJal && !(jmp_pd.valid && jmp_pd.isJal)) || 99009c6f1ddSLingrui98 (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) || 99109c6f1ddSLingrui98 (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) || 99209c6f1ddSLingrui98 (pred_ftb_entry.isRet && !(jmp_pd.valid && jmp_pd.isRet)) 99309c6f1ddSLingrui98 ) 99409c6f1ddSLingrui98 99509c6f1ddSLingrui98 has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg 99665fddcf0Szoujr XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", pdWb.bits.pc(0)) 99765fddcf0Szoujr 998352db50aSLingrui98 // assert(!has_false_hit) 99909c6f1ddSLingrui98 } 100009c6f1ddSLingrui98 100109c6f1ddSLingrui98 when (has_false_hit) { 100209c6f1ddSLingrui98 entry_hit_status(wb_idx_reg) := h_false_hit 100309c6f1ddSLingrui98 } 100409c6f1ddSLingrui98 100509c6f1ddSLingrui98 // ******************************************************************************* 100609c6f1ddSLingrui98 // **************************** redirect from backend **************************** 100709c6f1ddSLingrui98 // ******************************************************************************* 100809c6f1ddSLingrui98 100909c6f1ddSLingrui98 // redirect read cfiInfo, couples to redirectGen s2 101095a47398SGao-Zeyu // ftqIdxAhead(0-3) => ftq_redirect_mem(1-4), reuse ftq_redirect_mem(1) 1011bace178aSGao-Zeyu val ftq_redirect_rdata = Wire(Vec(FtqRedirectAheadNum, new Ftq_Redirect_SRAMEntry)) 1012deb3a97eSGao-Zeyu val ftb_redirect_rdata = Wire(Vec(FtqRedirectAheadNum, new FTBEntry_FtqMem)) 1013c776f0d5Smy-mayfly 1014c776f0d5Smy-mayfly val ftq_pd_rdata = Wire(Vec(FtqRedirectAheadNum, new Ftq_pd_Entry)) 101595a47398SGao-Zeyu for (i <- 1 until FtqRedirectAheadNum) { 101695a47398SGao-Zeyu ftq_redirect_mem.io.ren.get(i + IfuRedirectNum) := ftqIdxAhead(i).valid 101795a47398SGao-Zeyu ftq_redirect_mem.io.raddr(i + IfuRedirectNum) := ftqIdxAhead(i).bits.value 101895a47398SGao-Zeyu ftb_entry_mem.io.ren.get(i + IfuRedirectNum) := ftqIdxAhead(i).valid 101995a47398SGao-Zeyu ftb_entry_mem.io.raddr(i + IfuRedirectNum) := ftqIdxAhead(i).bits.value 1020c776f0d5Smy-mayfly 1021c776f0d5Smy-mayfly ftq_pd_mem.io.ren.get(i) := ftqIdxAhead(i).valid 1022c776f0d5Smy-mayfly ftq_pd_mem.io.raddr(i) := ftqIdxAhead(i).bits.value 10239342624fSGao-Zeyu } 102495a47398SGao-Zeyu ftq_redirect_mem.io.ren.get(IfuRedirectNum) := Mux(aheadValid, ftqIdxAhead(0).valid, backendRedirect.valid) 102595a47398SGao-Zeyu ftq_redirect_mem.io.raddr(IfuRedirectNum) := Mux(aheadValid, ftqIdxAhead(0).bits.value, backendRedirect.bits.ftqIdx.value) 102695a47398SGao-Zeyu ftb_entry_mem.io.ren.get(IfuRedirectNum) := Mux(aheadValid, ftqIdxAhead(0).valid, backendRedirect.valid) 102795a47398SGao-Zeyu ftb_entry_mem.io.raddr(IfuRedirectNum) := Mux(aheadValid, ftqIdxAhead(0).bits.value, backendRedirect.bits.ftqIdx.value) 1028bace178aSGao-Zeyu 1029c776f0d5Smy-mayfly ftq_pd_mem.io.ren.get(0) := Mux(aheadValid, ftqIdxAhead(0).valid, backendRedirect.valid) 1030c776f0d5Smy-mayfly ftq_pd_mem.io.raddr(0) := Mux(aheadValid, ftqIdxAhead(0).bits.value, backendRedirect.bits.ftqIdx.value) 1031c776f0d5Smy-mayfly 1032bace178aSGao-Zeyu for (i <- 0 until FtqRedirectAheadNum) { 103395a47398SGao-Zeyu ftq_redirect_rdata(i) := ftq_redirect_mem.io.rdata(i + IfuRedirectNum) 103495a47398SGao-Zeyu ftb_redirect_rdata(i) := ftb_entry_mem.io.rdata(i + IfuRedirectNum) 1035c776f0d5Smy-mayfly 1036c776f0d5Smy-mayfly ftq_pd_rdata(i) := ftq_pd_mem.io.rdata(i) 1037bace178aSGao-Zeyu } 103895a47398SGao-Zeyu val stage3CfiInfo = Mux(realAhdValid, Mux1H(ftqIdxSelOH, ftq_redirect_rdata), ftq_redirect_mem.io.rdata(IfuRedirectNum)) 1039c776f0d5Smy-mayfly val stage3PdInfo = Mux(realAhdValid, Mux1H(ftqIdxSelOH, ftq_pd_rdata), ftq_pd_mem.io.rdata(0)) 104009c6f1ddSLingrui98 val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate 104109c6f1ddSLingrui98 backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo) 1042c776f0d5Smy-mayfly backendRedirectCfi.pd := stage3PdInfo.toPd(fromBackendRedirect.bits.ftqOffset) 104309c6f1ddSLingrui98 1044d2b20d1aSTang Haojin 104595a47398SGao-Zeyu val r_ftb_entry = Mux(realAhdValid, Mux1H(ftqIdxSelOH, ftb_redirect_rdata), ftb_entry_mem.io.rdata(IfuRedirectNum)) 104609c6f1ddSLingrui98 val r_ftqOffset = fromBackendRedirect.bits.ftqOffset 104709c6f1ddSLingrui98 1048d2b20d1aSTang Haojin backendRedirectCfi.br_hit := r_ftb_entry.brIsSaved(r_ftqOffset) 1049d2b20d1aSTang Haojin backendRedirectCfi.jr_hit := r_ftb_entry.isJalr && r_ftb_entry.tailSlot.offset === r_ftqOffset 10503711cf36S小造xu_zh // FIXME: not portable 1051abdc3a32Sxu_zh val sc_disagree = stage3CfiInfo.sc_disagree.getOrElse(VecInit(Seq.fill(numBr)(false.B))) 1052d2b20d1aSTang Haojin backendRedirectCfi.sc_hit := backendRedirectCfi.br_hit && Mux(r_ftb_entry.brSlots(0).offset === r_ftqOffset, 1053abdc3a32Sxu_zh sc_disagree(0), sc_disagree(1)) 1054d2b20d1aSTang Haojin 105509c6f1ddSLingrui98 when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) { 105609c6f1ddSLingrui98 backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +& 105709c6f1ddSLingrui98 (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) && 1058eeb5ff92SLingrui98 !r_ftb_entry.newBrCanNotInsert(r_ftqOffset)) 105909c6f1ddSLingrui98 106009c6f1ddSLingrui98 backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) || 1061eeb5ff92SLingrui98 !r_ftb_entry.newBrCanNotInsert(r_ftqOffset)) 106209c6f1ddSLingrui98 }.otherwise { 106309c6f1ddSLingrui98 backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt 106409c6f1ddSLingrui98 backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt 106509c6f1ddSLingrui98 } 106609c6f1ddSLingrui98 106709c6f1ddSLingrui98 106809c6f1ddSLingrui98 // *************************************************************************** 106909c6f1ddSLingrui98 // **************************** redirect from ifu **************************** 107009c6f1ddSLingrui98 // *************************************************************************** 1071d2b20d1aSTang Haojin val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new BranchPredictionRedirect))) 107209c6f1ddSLingrui98 fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush 107309c6f1ddSLingrui98 fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx 107409c6f1ddSLingrui98 fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits 107509c6f1ddSLingrui98 fromIfuRedirect.bits.level := RedirectLevel.flushAfter 1076d2b20d1aSTang Haojin fromIfuRedirect.bits.BTBMissBubble := true.B 1077d2b20d1aSTang Haojin fromIfuRedirect.bits.debugIsMemVio := false.B 1078d2b20d1aSTang Haojin fromIfuRedirect.bits.debugIsCtrl := false.B 107909c6f1ddSLingrui98 108009c6f1ddSLingrui98 val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate 108109c6f1ddSLingrui98 ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits) 108209c6f1ddSLingrui98 ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits) 108309c6f1ddSLingrui98 ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid 108409c6f1ddSLingrui98 ifuRedirectCfiUpdate.target := pdWb.bits.target 108509c6f1ddSLingrui98 ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid 108609c6f1ddSLingrui98 ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid 108709c6f1ddSLingrui98 10881c6fc24aSEaston Man val ifuRedirectReg = RegNextWithEnable(fromIfuRedirect, hasInit = true) 108909c6f1ddSLingrui98 val ifuRedirectToBpu = WireInit(ifuRedirectReg) 109009c6f1ddSLingrui98 ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid 109109c6f1ddSLingrui98 109216a171eeSEaston Man ftq_redirect_mem.io.ren.get.head := fromIfuRedirect.valid 1093deb3a97eSGao-Zeyu ftq_redirect_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value 109409c6f1ddSLingrui98 109509c6f1ddSLingrui98 val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate 1096deb3a97eSGao-Zeyu toBpuCfi.fromFtqRedirectSram(ftq_redirect_mem.io.rdata.head) 1097f1267a13SEaston Man when (ifuRedirectReg.bits.cfiUpdate.pd.isRet && ifuRedirectReg.bits.cfiUpdate.pd.valid) { 1098c89b4642SGuokai Chen toBpuCfi.target := toBpuCfi.topAddr 109909c6f1ddSLingrui98 } 110009c6f1ddSLingrui98 1101d2b20d1aSTang Haojin when (ifuRedirectReg.valid) { 1102d2b20d1aSTang Haojin ifuRedirected(ifuRedirectReg.bits.ftqIdx.value) := true.B 1103d2b20d1aSTang Haojin } .elsewhen(RegNext(pdWb.valid)) { 1104d2b20d1aSTang Haojin // if pdWb and no redirect, set to false 1105d2b20d1aSTang Haojin ifuRedirected(last_cycle_bpu_in_ptr.value) := false.B 1106d2b20d1aSTang Haojin } 1107d2b20d1aSTang Haojin 11086022c595SsinceforYy // ********************************************************************** 11096022c595SsinceforYy // ***************************** to backend ***************************** 11106022c595SsinceforYy // ********************************************************************** 11116022c595SsinceforYy // to backend pc mem / target 11126022c595SsinceforYy io.toBackend.pc_mem_wen := RegNext(last_cycle_bpu_in) 1113f533cba7SHuSipeng io.toBackend.pc_mem_waddr := RegEnable(last_cycle_bpu_in_idx, last_cycle_bpu_in) 11146022c595SsinceforYy io.toBackend.pc_mem_wdata := RegEnable(bpu_in_bypass_buf_for_ifu, last_cycle_bpu_in) 11156022c595SsinceforYy 11166022c595SsinceforYy // num cycle is fixed 11176022c595SsinceforYy val newest_entry_en: Bool = RegNext(last_cycle_bpu_in || backendRedirect.valid || ifuRedirectToBpu.valid) 11186022c595SsinceforYy io.toBackend.newest_entry_en := RegNext(newest_entry_en) 11196022c595SsinceforYy io.toBackend.newest_entry_ptr := RegEnable(newest_entry_ptr, newest_entry_en) 11206022c595SsinceforYy io.toBackend.newest_entry_target := RegEnable(newest_entry_target, newest_entry_en) 11216022c595SsinceforYy 112209c6f1ddSLingrui98 // ********************************************************************* 112309c6f1ddSLingrui98 // **************************** wb from exu **************************** 112409c6f1ddSLingrui98 // ********************************************************************* 112509c6f1ddSLingrui98 1126d2b20d1aSTang Haojin backendRedirect.valid := io.fromBackend.redirect.valid 1127d2b20d1aSTang Haojin backendRedirect.bits.connectRedirect(io.fromBackend.redirect.bits) 1128d2b20d1aSTang Haojin backendRedirect.bits.BTBMissBubble := false.B 1129d2b20d1aSTang Haojin 11302e1be6e1SSteve Gou 113109c6f1ddSLingrui98 def extractRedirectInfo(wb: Valid[Redirect]) = { 11326bf9b30dSLingrui98 val ftqPtr = wb.bits.ftqIdx 113309c6f1ddSLingrui98 val ftqOffset = wb.bits.ftqOffset 113409c6f1ddSLingrui98 val taken = wb.bits.cfiUpdate.taken 113509c6f1ddSLingrui98 val mispred = wb.bits.cfiUpdate.isMisPred 11366bf9b30dSLingrui98 (wb.valid, ftqPtr, ftqOffset, taken, mispred) 113709c6f1ddSLingrui98 } 113809c6f1ddSLingrui98 113909c6f1ddSLingrui98 // fix mispredict entry 114009c6f1ddSLingrui98 val lastIsMispredict = RegNext( 1141df5b4b8eSYinan Xu backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B 114209c6f1ddSLingrui98 ) 114309c6f1ddSLingrui98 114409c6f1ddSLingrui98 def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = { 11456bf9b30dSLingrui98 val (r_valid, r_ptr, r_offset, r_taken, r_mispred) = extractRedirectInfo(redirect) 11466bf9b30dSLingrui98 val r_idx = r_ptr.value 114709c6f1ddSLingrui98 val cfiIndex_bits_wen = r_valid && r_taken && r_offset < cfiIndex_vec(r_idx).bits 114809c6f1ddSLingrui98 val cfiIndex_valid_wen = r_valid && r_offset === cfiIndex_vec(r_idx).bits 114909c6f1ddSLingrui98 when (cfiIndex_bits_wen || cfiIndex_valid_wen) { 115009c6f1ddSLingrui98 cfiIndex_vec(r_idx).valid := cfiIndex_bits_wen || cfiIndex_valid_wen && r_taken 11513f88c020SGuokai Chen } .elsewhen (r_valid && !r_taken && r_offset =/= cfiIndex_vec(r_idx).bits) { 11523f88c020SGuokai Chen cfiIndex_vec(r_idx).valid :=false.B 115309c6f1ddSLingrui98 } 115409c6f1ddSLingrui98 when (cfiIndex_bits_wen) { 115509c6f1ddSLingrui98 cfiIndex_vec(r_idx).bits := r_offset 115609c6f1ddSLingrui98 } 11571c6fc24aSEaston Man newest_entry_target_modified := true.B 11586bf9b30dSLingrui98 newest_entry_target := redirect.bits.cfiUpdate.target 11591c6fc24aSEaston Man newest_entry_ptr_modified := true.B 1160873dc383SLingrui98 newest_entry_ptr := r_ptr 11611c6fc24aSEaston Man 1162b0ed7239SLingrui98 update_target(r_idx) := redirect.bits.cfiUpdate.target // TODO: remove this 116309c6f1ddSLingrui98 if (isBackend) { 116409c6f1ddSLingrui98 mispredict_vec(r_idx)(r_offset) := r_mispred 116509c6f1ddSLingrui98 } 116609c6f1ddSLingrui98 } 116709c6f1ddSLingrui98 1168bace178aSGao-Zeyu when(fromBackendRedirect.valid) { 1169bace178aSGao-Zeyu updateCfiInfo(fromBackendRedirect) 117009c6f1ddSLingrui98 }.elsewhen (ifuRedirectToBpu.valid) { 117109c6f1ddSLingrui98 updateCfiInfo(ifuRedirectToBpu, isBackend=false) 117209c6f1ddSLingrui98 } 117309c6f1ddSLingrui98 1174bace178aSGao-Zeyu when (fromBackendRedirect.valid) { 1175bace178aSGao-Zeyu when (fromBackendRedirect.bits.ControlRedirectBubble) { 1176d2b20d1aSTang Haojin when (fromBackendRedirect.bits.ControlBTBMissBubble) { 1177d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1178d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1179d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.TAGEMissBubble) { 1180d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.TAGEMissBubble.id) := true.B 1181d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.TAGEMissBubble.id) := true.B 1182d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.SCMissBubble) { 1183d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.SCMissBubble.id) := true.B 1184d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.SCMissBubble.id) := true.B 1185d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.ITTAGEMissBubble) { 1186d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B 1187d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B 1188d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.RASMissBubble) { 1189d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.RASMissBubble.id) := true.B 1190d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.RASMissBubble.id) := true.B 1191d2b20d1aSTang Haojin } 1192d2b20d1aSTang Haojin 1193d2b20d1aSTang Haojin 11949342624fSGao-Zeyu } .elsewhen (backendRedirect.bits.MemVioRedirectBubble) { 1195d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B 1196d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B 1197d2b20d1aSTang Haojin } .otherwise { 1198d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B 1199d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B 1200d2b20d1aSTang Haojin } 1201d2b20d1aSTang Haojin } .elsewhen (ifuRedirectReg.valid) { 1202d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1203d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1204d2b20d1aSTang Haojin } 1205d2b20d1aSTang Haojin 1206d2b20d1aSTang Haojin io.ControlBTBMissBubble := fromBackendRedirect.bits.ControlBTBMissBubble 1207d2b20d1aSTang Haojin io.TAGEMissBubble := fromBackendRedirect.bits.TAGEMissBubble 1208d2b20d1aSTang Haojin io.SCMissBubble := fromBackendRedirect.bits.SCMissBubble 1209d2b20d1aSTang Haojin io.ITTAGEMissBubble := fromBackendRedirect.bits.ITTAGEMissBubble 1210d2b20d1aSTang Haojin io.RASMissBubble := fromBackendRedirect.bits.RASMissBubble 1211d2b20d1aSTang Haojin 121209c6f1ddSLingrui98 // *********************************************************************************** 121309c6f1ddSLingrui98 // **************************** flush ptr and state queue **************************** 121409c6f1ddSLingrui98 // *********************************************************************************** 121509c6f1ddSLingrui98 1216df5b4b8eSYinan Xu val redirectVec = VecInit(backendRedirect, fromIfuRedirect) 121709c6f1ddSLingrui98 121809c6f1ddSLingrui98 // when redirect, we should reset ptrs and status queues 1219b92f8445Sssszwic io.icacheFlush := redirectVec.map(r => r.valid).reduce(_||_) 1220b92f8445Sssszwic XSPerfAccumulate("icacheFlushFromBackend", backendRedirect.valid) 1221b92f8445Sssszwic XSPerfAccumulate("icacheFlushFromIFU", fromIfuRedirect.valid) 122209c6f1ddSLingrui98 when(redirectVec.map(r => r.valid).reduce(_||_)){ 12232f4a3aa4SLingrui98 val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits))) 122409c6f1ddSLingrui98 val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_) 12252f4a3aa4SLingrui98 val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level)) 122609c6f1ddSLingrui98 val next = idx + 1.U 122709c6f1ddSLingrui98 bpuPtr := next 1228dc270d3bSJenius copied_bpu_ptr.map(_ := next) 1229c5c5edaeSJenius ifuPtr_write := next 1230c5c5edaeSJenius ifuWbPtr_write := next 1231c5c5edaeSJenius ifuPtrPlus1_write := idx + 2.U 12326bf9b30dSLingrui98 ifuPtrPlus2_write := idx + 3.U 1233b92f8445Sssszwic pfPtr_write := next 1234b92f8445Sssszwic pfPtrPlus1_write := idx + 2.U 12353f88c020SGuokai Chen } 12363f88c020SGuokai Chen when(RegNext(redirectVec.map(r => r.valid).reduce(_||_))){ 12373f88c020SGuokai Chen val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits))) 12383f88c020SGuokai Chen val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_) 12393f88c020SGuokai Chen val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level)) 12403f88c020SGuokai Chen when (RegNext(notIfu)) { 12411c6fc24aSEaston Man commitStateQueueEnable(RegNext(idx.value)) := true.B 12421c6fc24aSEaston Man commitStateQueueNext(RegNext(idx.value)).zipWithIndex.foreach({ case (s, i) => 124391346769SMuzi when(i.U > RegNext(offset)) { 124491346769SMuzi s := c_empty 124591346769SMuzi } 124691346769SMuzi when (i.U === RegNext(offset) && RegNext(flushItSelf)) { 124791346769SMuzi s := c_flushed 124809c6f1ddSLingrui98 } 124909c6f1ddSLingrui98 }) 125009c6f1ddSLingrui98 } 125109c6f1ddSLingrui98 } 125209c6f1ddSLingrui98 12533f88c020SGuokai Chen 125409c6f1ddSLingrui98 // only the valid bit is actually needed 1255df5b4b8eSYinan Xu io.toIfu.redirect.bits := backendRedirect.bits 125609c6f1ddSLingrui98 io.toIfu.redirect.valid := stage2Flush 1257d2b20d1aSTang Haojin io.toIfu.topdown_redirect := fromBackendRedirect 125809c6f1ddSLingrui98 125909c6f1ddSLingrui98 // commit 12609aca92b9SYinan Xu for (c <- io.fromBackend.rob_commits) { 126109c6f1ddSLingrui98 when(c.valid) { 12621c6fc24aSEaston Man commitStateQueueEnable(c.bits.ftqIdx.value) := true.B 126391346769SMuzi commitStateQueueNext(c.bits.ftqIdx.value)(c.bits.ftqOffset) := c_committed 126488825c5cSYinan Xu // TODO: remove this 126588825c5cSYinan Xu // For instruction fusions, we also update the next instruction 1266c3abb8b6SYinan Xu when (c.bits.commitType === 4.U) { 126791346769SMuzi commitStateQueueNext(c.bits.ftqIdx.value)(c.bits.ftqOffset + 1.U) := c_committed 1268c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 5.U) { 126991346769SMuzi commitStateQueueNext(c.bits.ftqIdx.value)(c.bits.ftqOffset + 2.U) := c_committed 1270c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 6.U) { 127188825c5cSYinan Xu val index = (c.bits.ftqIdx + 1.U).value 12721c6fc24aSEaston Man commitStateQueueEnable(index) := true.B 127391346769SMuzi commitStateQueueNext(index)(0) := c_committed 1274c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 7.U) { 127588825c5cSYinan Xu val index = (c.bits.ftqIdx + 1.U).value 12761c6fc24aSEaston Man commitStateQueueEnable(index) := true.B 127791346769SMuzi commitStateQueueNext(index)(1) := c_committed 127888825c5cSYinan Xu } 127909c6f1ddSLingrui98 } 128009c6f1ddSLingrui98 } 128109c6f1ddSLingrui98 128209c6f1ddSLingrui98 // **************************************************************** 128309c6f1ddSLingrui98 // **************************** to bpu **************************** 128409c6f1ddSLingrui98 // **************************************************************** 128509c6f1ddSLingrui98 1286fd3aa057SYuandongliang io.toBpu.redirctFromIFU := ifuRedirectToBpu.valid 128751981c77SbugGenerator io.toBpu.redirect := Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu) 1288209a4cafSSteve Gou val dummy_s1_pred_cycle_vec = VecInit(List.tabulate(FtqSize)(_=>0.U(64.W))) 1289209a4cafSSteve Gou val redirect_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(io.toBpu.redirect.bits.ftqIdx.value) + 1.U 1290209a4cafSSteve Gou XSPerfHistogram("backend_redirect_latency", redirect_latency, fromBackendRedirect.valid, 0, 60, 1) 1291209a4cafSSteve Gou XSPerfHistogram("ifu_redirect_latency", redirect_latency, !fromBackendRedirect.valid && ifuRedirectToBpu.valid, 0, 60, 1) 129209c6f1ddSLingrui98 1293f21bbcb2SGuokai Chen XSError(io.toBpu.redirect.valid && isBefore(io.toBpu.redirect.bits.ftqIdx, commPtr), "Ftq received a redirect after its commit, check backend or replay") 129409c6f1ddSLingrui98 129502f21c16SLingrui98 val may_have_stall_from_bpu = Wire(Bool()) 129602f21c16SLingrui98 val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states 129702f21c16SLingrui98 may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U 12989230e379SMuzi 12999230e379SMuzi val validInstructions = commitStateQueueReg(commPtr.value).map(s => s === c_toCommit || s === c_committed) 13009230e379SMuzi val lastInstructionStatus = PriorityMux(validInstructions.reverse.zip(commitStateQueueReg(commPtr.value).reverse)) 13019230e379SMuzi val firstInstructionFlushed = commitStateQueueReg(commPtr.value)(0) === c_flushed 13029230e379SMuzi canCommit := commPtr =/= ifuWbPtr && !may_have_stall_from_bpu && 13039230e379SMuzi (isAfter(robCommPtr, commPtr) || 13049230e379SMuzi validInstructions.reduce(_ || _) && lastInstructionStatus === c_committed) 13059230e379SMuzi val canMoveCommPtr = commPtr =/= ifuWbPtr && !may_have_stall_from_bpu && 13069230e379SMuzi (isAfter(robCommPtr, commPtr) || 13079230e379SMuzi validInstructions.reduce(_ || _) && lastInstructionStatus === c_committed || 13089230e379SMuzi firstInstructionFlushed) 130991346769SMuzi 131091346769SMuzi when (io.fromBackend.rob_commits.map(_.valid).reduce(_ | _)) { 131191346769SMuzi robCommPtr_write := ParallelPriorityMux(io.fromBackend.rob_commits.map(_.valid).reverse, io.fromBackend.rob_commits.map(_.bits.ftqIdx).reverse) 13129230e379SMuzi } .elsewhen (isAfter(commPtr, robCommPtr)) { 131391346769SMuzi robCommPtr_write := commPtr 131491346769SMuzi } .otherwise { 131591346769SMuzi robCommPtr_write := robCommPtr 131691346769SMuzi } 131709c6f1ddSLingrui98 1318ba5ba1dcSmy-mayfly /** 1319ba5ba1dcSmy-mayfly ************************************************************************************* 1320ba5ba1dcSmy-mayfly * MMIO instruction fetch is allowed only if MMIO is the oldest instruction. 1321ba5ba1dcSmy-mayfly ************************************************************************************* 1322ba5ba1dcSmy-mayfly */ 13231d1e6d4dSJenius val mmioReadPtr = io.mmioCommitRead.mmioFtqPtr 13249230e379SMuzi val mmioLastCommit = isAfter(commPtr, mmioReadPtr) || 13259230e379SMuzi commPtr === mmioReadPtr && validInstructions.reduce(_ || _) && lastInstructionStatus === c_committed 13261d1e6d4dSJenius io.mmioCommitRead.mmioLastCommit := RegNext(mmioLastCommit) 13271d1e6d4dSJenius 132809c6f1ddSLingrui98 // commit reads 1329c5c5edaeSJenius val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata) 133081101dc4SLingrui98 val commit_target = 133134cf890eSLingrui98 Mux(RegNext(commPtr === newest_entry_ptr), 13321c6fc24aSEaston Man RegEnable(newest_entry_target, newest_entry_target_modified), 133381101dc4SLingrui98 RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr)) 13341c6fc24aSEaston Man ftq_pd_mem.io.ren.get.last := canCommit 133509c6f1ddSLingrui98 ftq_pd_mem.io.raddr.last := commPtr.value 133609c6f1ddSLingrui98 val commit_pd = ftq_pd_mem.io.rdata.last 133716a171eeSEaston Man ftq_redirect_mem.io.ren.get.last := canCommit 1338deb3a97eSGao-Zeyu ftq_redirect_mem.io.raddr.last := commPtr.value 1339deb3a97eSGao-Zeyu val commit_spec_meta = ftq_redirect_mem.io.rdata.last 134009c6f1ddSLingrui98 ftq_meta_1r_sram.io.ren(0) := canCommit 134109c6f1ddSLingrui98 ftq_meta_1r_sram.io.raddr(0) := commPtr.value 1342deb3a97eSGao-Zeyu val commit_meta = ftq_meta_1r_sram.io.rdata(0).meta 1343deb3a97eSGao-Zeyu val commit_ftb_entry = ftq_meta_1r_sram.io.rdata(0).ftb_entry 134409c6f1ddSLingrui98 134509c6f1ddSLingrui98 // need one cycle to read mem and srams 13461c6fc24aSEaston Man val do_commit_ptr = RegEnable(commPtr, canCommit) 13475371700eSzoujr val do_commit = RegNext(canCommit, init=false.B) 13489230e379SMuzi when (canMoveCommPtr) { 13496bf9b30dSLingrui98 commPtr_write := commPtrPlus1 13506bf9b30dSLingrui98 commPtrPlus1_write := commPtrPlus1 + 1.U 13516bf9b30dSLingrui98 } 13521c6fc24aSEaston Man val commit_state = RegEnable(commitStateQueueReg(commPtr.value), canCommit) 13535371700eSzoujr val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value)) 1354d4fcfc3eSGuokai Chen val do_commit_cfi = WireInit(cfiIndex_vec(do_commit_ptr.value)) 13553f88c020SGuokai Chen // 13563f88c020SGuokai Chen //when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) { 13573f88c020SGuokai Chen // can_commit_cfi.valid := false.B 13583f88c020SGuokai Chen //} 13591c6fc24aSEaston Man val commit_cfi = RegEnable(can_commit_cfi, canCommit) 136091346769SMuzi val debug_cfi = commitStateQueueReg(do_commit_ptr.value)(do_commit_cfi.bits) =/= c_committed && do_commit_cfi.valid 136109c6f1ddSLingrui98 13621c6fc24aSEaston Man val commit_mispredict : Vec[Bool] = VecInit((RegEnable(mispredict_vec(commPtr.value), canCommit) zip commit_state).map { 136391346769SMuzi case (mis, state) => mis && state === c_committed 136409c6f1ddSLingrui98 }) 136591346769SMuzi val commit_instCommited: Vec[Bool] = VecInit(commit_state.map(_ === c_committed)) // [PredictWidth] 13665371700eSzoujr val can_commit_hit = entry_hit_status(commPtr.value) 13671c6fc24aSEaston Man val commit_hit = RegEnable(can_commit_hit, canCommit) 13681c6fc24aSEaston Man val diff_commit_target = RegEnable(update_target(commPtr.value), canCommit) // TODO: remove this 13691c6fc24aSEaston Man val commit_stage = RegEnable(pred_stage(commPtr.value), canCommit) 137009c6f1ddSLingrui98 val commit_valid = commit_hit === h_hit || commit_cfi.valid // hit or taken 137109c6f1ddSLingrui98 13725371700eSzoujr val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit 137302f21c16SLingrui98 switch (bpu_ftb_update_stall) { 137402f21c16SLingrui98 is (0.U) { 137502f21c16SLingrui98 when (can_commit_cfi.valid && !to_bpu_hit && canCommit) { 137602f21c16SLingrui98 bpu_ftb_update_stall := 2.U // 2-cycle stall 137702f21c16SLingrui98 } 137802f21c16SLingrui98 } 137902f21c16SLingrui98 is (2.U) { 138002f21c16SLingrui98 bpu_ftb_update_stall := 1.U 138102f21c16SLingrui98 } 138202f21c16SLingrui98 is (1.U) { 138302f21c16SLingrui98 bpu_ftb_update_stall := 0.U 138402f21c16SLingrui98 } 138502f21c16SLingrui98 is (3.U) { 138602f21c16SLingrui98 XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2") 138702f21c16SLingrui98 } 138802f21c16SLingrui98 } 138909c6f1ddSLingrui98 1390b0ed7239SLingrui98 // TODO: remove this 1391b0ed7239SLingrui98 XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n") 1392b0ed7239SLingrui98 1393b2f6ed0aSSteve Gou // update latency stats 1394b2f6ed0aSSteve Gou val update_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(do_commit_ptr.value) + 1.U 1395b2f6ed0aSSteve Gou XSPerfHistogram("bpu_update_latency", update_latency, io.toBpu.update.valid, 0, 64, 2) 1396b2f6ed0aSSteve Gou 139709c6f1ddSLingrui98 io.toBpu.update := DontCare 139809c6f1ddSLingrui98 io.toBpu.update.valid := commit_valid && do_commit 139909c6f1ddSLingrui98 val update = io.toBpu.update.bits 140009c6f1ddSLingrui98 update.false_hit := commit_hit === h_false_hit 140109c6f1ddSLingrui98 update.pc := commit_pc_bundle.startAddr 1402deb3a97eSGao-Zeyu update.meta := commit_meta 1403803124a6SLingrui98 update.cfi_idx := commit_cfi 14048ffcd86aSLingrui98 update.full_target := commit_target 1405edc18578SLingrui98 update.from_stage := commit_stage 1406c2d1ec7dSLingrui98 update.spec_info := commit_spec_meta 14073f88c020SGuokai Chen XSError(commit_valid && do_commit && debug_cfi, "\ncommit cfi can be non c_commited\n") 140809c6f1ddSLingrui98 140909c6f1ddSLingrui98 val commit_real_hit = commit_hit === h_hit 141009c6f1ddSLingrui98 val update_ftb_entry = update.ftb_entry 141109c6f1ddSLingrui98 141209c6f1ddSLingrui98 val ftbEntryGen = Module(new FTBEntryGen).io 141309c6f1ddSLingrui98 ftbEntryGen.start_addr := commit_pc_bundle.startAddr 141409c6f1ddSLingrui98 ftbEntryGen.old_entry := commit_ftb_entry 141509c6f1ddSLingrui98 ftbEntryGen.pd := commit_pd 141609c6f1ddSLingrui98 ftbEntryGen.cfiIndex := commit_cfi 141709c6f1ddSLingrui98 ftbEntryGen.target := commit_target 141809c6f1ddSLingrui98 ftbEntryGen.hit := commit_real_hit 141909c6f1ddSLingrui98 ftbEntryGen.mispredict_vec := commit_mispredict 142009c6f1ddSLingrui98 142109c6f1ddSLingrui98 update_ftb_entry := ftbEntryGen.new_entry 142209c6f1ddSLingrui98 update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos 142309c6f1ddSLingrui98 update.mispred_mask := ftbEntryGen.mispred_mask 142409c6f1ddSLingrui98 update.old_entry := ftbEntryGen.is_old_entry 1425edc18578SLingrui98 update.pred_hit := commit_hit === h_hit || commit_hit === h_false_hit 1426803124a6SLingrui98 update.br_taken_mask := ftbEntryGen.taken_mask 1427cc2d1573SEaston Man update.br_committed := (ftbEntryGen.new_entry.brValids zip ftbEntryGen.new_entry.brOffset) map { 1428cc2d1573SEaston Man case (valid, offset) => valid && commit_instCommited(offset) 1429cc2d1573SEaston Man } 1430803124a6SLingrui98 update.jmp_taken := ftbEntryGen.jmp_taken 1431b37e4b45SLingrui98 1432803124a6SLingrui98 // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc) 1433803124a6SLingrui98 // update.full_pred.jalr_target := commit_target 1434803124a6SLingrui98 // update.full_pred.hit := true.B 1435803124a6SLingrui98 // when (update.full_pred.is_jalr) { 1436803124a6SLingrui98 // update.full_pred.targets.last := commit_target 1437803124a6SLingrui98 // } 143809c6f1ddSLingrui98 143909c6f1ddSLingrui98 // ****************************************************************************** 144009c6f1ddSLingrui98 // **************************** commit perf counters **************************** 144109c6f1ddSLingrui98 // ****************************************************************************** 144209c6f1ddSLingrui98 144391346769SMuzi val commit_inst_mask = VecInit(commit_state.map(c => c === c_committed && do_commit)).asUInt 144409c6f1ddSLingrui98 val commit_mispred_mask = commit_mispredict.asUInt 144509c6f1ddSLingrui98 val commit_not_mispred_mask = ~commit_mispred_mask 144609c6f1ddSLingrui98 144709c6f1ddSLingrui98 val commit_br_mask = commit_pd.brMask.asUInt 144809c6f1ddSLingrui98 val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W))) 144909c6f1ddSLingrui98 val commit_cfi_mask = (commit_br_mask | commit_jmp_mask) 145009c6f1ddSLingrui98 145109c6f1ddSLingrui98 val mbpInstrs = commit_inst_mask & commit_cfi_mask 145209c6f1ddSLingrui98 145309c6f1ddSLingrui98 val mbpRights = mbpInstrs & commit_not_mispred_mask 145409c6f1ddSLingrui98 val mbpWrongs = mbpInstrs & commit_mispred_mask 145509c6f1ddSLingrui98 145609c6f1ddSLingrui98 io.bpuInfo.bpRight := PopCount(mbpRights) 145709c6f1ddSLingrui98 io.bpuInfo.bpWrong := PopCount(mbpWrongs) 145809c6f1ddSLingrui98 1459b92f8445Sssszwic val hartId = p(XSCoreParamsKey).HartId 1460c686adcdSYinan Xu val isWriteFTQTable = Constantin.createRecord(s"isWriteFTQTable$hartId") 1461c686adcdSYinan Xu val ftqBranchTraceDB = ChiselDB.createTable(s"FTQTable$hartId", new FtqDebugBundle) 146209c6f1ddSLingrui98 // Cfi Info 146309c6f1ddSLingrui98 for (i <- 0 until PredictWidth) { 146409c6f1ddSLingrui98 val pc = commit_pc_bundle.startAddr + (i * instBytes).U 146591346769SMuzi val v = commit_state(i) === c_committed 146609c6f1ddSLingrui98 val isBr = commit_pd.brMask(i) 146709c6f1ddSLingrui98 val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U 146809c6f1ddSLingrui98 val isCfi = isBr || isJmp 146909c6f1ddSLingrui98 val isTaken = commit_cfi.valid && commit_cfi.bits === i.U 147009c6f1ddSLingrui98 val misPred = commit_mispredict(i) 1471c2ad24ebSLingrui98 // val ghist = commit_spec_meta.ghist.predHist 1472c2ad24ebSLingrui98 val histPtr = commit_spec_meta.histPtr 1473deb3a97eSGao-Zeyu val predCycle = commit_meta(63, 0) 147409c6f1ddSLingrui98 val target = commit_target 147509c6f1ddSLingrui98 147609c6f1ddSLingrui98 val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}))) 147709c6f1ddSLingrui98 val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_) 147809c6f1ddSLingrui98 val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid)) 147909c6f1ddSLingrui98 XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " + 1480c2ad24ebSLingrui98 p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " + 148109c6f1ddSLingrui98 p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " + 148209c6f1ddSLingrui98 p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n") 148351532d8bSGuokai Chen 148451532d8bSGuokai Chen val logbundle = Wire(new FtqDebugBundle) 148551532d8bSGuokai Chen logbundle.pc := pc 148651532d8bSGuokai Chen logbundle.target := target 148751532d8bSGuokai Chen logbundle.isBr := isBr 148851532d8bSGuokai Chen logbundle.isJmp := isJmp 148951532d8bSGuokai Chen logbundle.isCall := isJmp && commit_pd.hasCall 149051532d8bSGuokai Chen logbundle.isRet := isJmp && commit_pd.hasRet 149151532d8bSGuokai Chen logbundle.misPred := misPred 149251532d8bSGuokai Chen logbundle.isTaken := isTaken 149351532d8bSGuokai Chen logbundle.predStage := commit_stage 149451532d8bSGuokai Chen 149551532d8bSGuokai Chen ftqBranchTraceDB.log( 149651532d8bSGuokai Chen data = logbundle /* hardware of type T */, 1497da3bf434SMaxpicca-Li en = isWriteFTQTable.orR && v && do_commit && isCfi, 149851532d8bSGuokai Chen site = "FTQ" + p(XSCoreParamsKey).HartId.toString, 149951532d8bSGuokai Chen clock = clock, 150051532d8bSGuokai Chen reset = reset 150151532d8bSGuokai Chen ) 150209c6f1ddSLingrui98 } 150309c6f1ddSLingrui98 150409c6f1ddSLingrui98 val enq = io.fromBpu.resp 15052e1be6e1SSteve Gou val perf_redirect = backendRedirect 150609c6f1ddSLingrui98 150709c6f1ddSLingrui98 XSPerfAccumulate("entry", validEntries) 150809c6f1ddSLingrui98 XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready) 150909c6f1ddSLingrui98 XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level) 151009c6f1ddSLingrui98 XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)) 151109c6f1ddSLingrui98 XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid) 151209c6f1ddSLingrui98 151309c6f1ddSLingrui98 XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid) 151409c6f1ddSLingrui98 151509c6f1ddSLingrui98 XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready) 151609c6f1ddSLingrui98 XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn) 151712cedb6fSLingrui98 XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr) 1518b2f6ed0aSSteve Gou XSPerfAccumulate("bpu_to_ifu_bubble_when_ftq_full", (bpuPtr === ifuPtr) && isFull(bpuPtr, commPtr) && io.toIfu.req.ready) 151909c6f1ddSLingrui98 1520bace178aSGao-Zeyu XSPerfAccumulate("redirectAhead_ValidNum", ftqIdxAhead.map(_.valid).reduce(_|_)) 15219342624fSGao-Zeyu XSPerfAccumulate("fromBackendRedirect_ValidNum", io.fromBackend.redirect.valid) 15229342624fSGao-Zeyu XSPerfAccumulate("toBpuRedirect_ValidNum", io.toBpu.redirect.valid) 15239342624fSGao-Zeyu 152409c6f1ddSLingrui98 val from_bpu = io.fromBpu.resp.bits 152509c6f1ddSLingrui98 val to_ifu = io.toIfu.req.bits 152609c6f1ddSLingrui98 152709c6f1ddSLingrui98 1528209a4cafSSteve Gou XSPerfHistogram("commit_num_inst", PopCount(commit_inst_mask), do_commit, 0, PredictWidth+1, 1) 152909c6f1ddSLingrui98 153009c6f1ddSLingrui98 153109c6f1ddSLingrui98 153209c6f1ddSLingrui98 153309c6f1ddSLingrui98 val commit_jal_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W))) 153409c6f1ddSLingrui98 val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W))) 153509c6f1ddSLingrui98 val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W))) 153609c6f1ddSLingrui98 val commit_ret_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W))) 153709c6f1ddSLingrui98 153809c6f1ddSLingrui98 153909c6f1ddSLingrui98 val mbpBRights = mbpRights & commit_br_mask 154009c6f1ddSLingrui98 val mbpJRights = mbpRights & commit_jal_mask 154109c6f1ddSLingrui98 val mbpIRights = mbpRights & commit_jalr_mask 154209c6f1ddSLingrui98 val mbpCRights = mbpRights & commit_call_mask 154309c6f1ddSLingrui98 val mbpRRights = mbpRights & commit_ret_mask 154409c6f1ddSLingrui98 154509c6f1ddSLingrui98 val mbpBWrongs = mbpWrongs & commit_br_mask 154609c6f1ddSLingrui98 val mbpJWrongs = mbpWrongs & commit_jal_mask 154709c6f1ddSLingrui98 val mbpIWrongs = mbpWrongs & commit_jalr_mask 154809c6f1ddSLingrui98 val mbpCWrongs = mbpWrongs & commit_call_mask 154909c6f1ddSLingrui98 val mbpRWrongs = mbpWrongs & commit_ret_mask 155009c6f1ddSLingrui98 15511d7e5011SLingrui98 val commit_pred_stage = RegNext(pred_stage(commPtr.value)) 15521d7e5011SLingrui98 15531d7e5011SLingrui98 def pred_stage_map(src: UInt, name: String) = { 15541d7e5011SLingrui98 (0 until numBpStages).map(i => 15551d7e5011SLingrui98 f"${name}_stage_${i+1}" -> PopCount(src.asBools.map(_ && commit_pred_stage === BP_STAGES(i))) 15561d7e5011SLingrui98 ).foldLeft(Map[String, UInt]())(_+_) 15571d7e5011SLingrui98 } 15581d7e5011SLingrui98 15591d7e5011SLingrui98 val mispred_stage_map = pred_stage_map(mbpWrongs, "mispredict") 15601d7e5011SLingrui98 val br_mispred_stage_map = pred_stage_map(mbpBWrongs, "br_mispredict") 15611d7e5011SLingrui98 val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict") 15621d7e5011SLingrui98 val correct_stage_map = pred_stage_map(mbpRights, "correct") 15631d7e5011SLingrui98 val br_correct_stage_map = pred_stage_map(mbpBRights, "br_correct") 15641d7e5011SLingrui98 val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct") 15651d7e5011SLingrui98 156609c6f1ddSLingrui98 val update_valid = io.toBpu.update.valid 156709c6f1ddSLingrui98 def u(cond: Bool) = update_valid && cond 156809c6f1ddSLingrui98 val ftb_false_hit = u(update.false_hit) 156965fddcf0Szoujr // assert(!ftb_false_hit) 157009c6f1ddSLingrui98 val ftb_hit = u(commit_hit === h_hit) 157109c6f1ddSLingrui98 157209c6f1ddSLingrui98 val ftb_new_entry = u(ftbEntryGen.is_init_entry) 1573b37e4b45SLingrui98 val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid 1574b37e4b45SLingrui98 val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0) 1575b37e4b45SLingrui98 val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid 157609c6f1ddSLingrui98 157709c6f1ddSLingrui98 val ftb_old_entry = u(ftbEntryGen.is_old_entry) 157809c6f1ddSLingrui98 157909c6f1ddSLingrui98 val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified) 158009c6f1ddSLingrui98 val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br) 1581d2b20d1aSTang Haojin val ftb_modified_entry_ifu_redirected = u(ifuRedirected(do_commit_ptr.value)) 158209c6f1ddSLingrui98 val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified) 158309c6f1ddSLingrui98 val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full 158409c6f1ddSLingrui98 val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified 158509c6f1ddSLingrui98 1586209a4cafSSteve Gou def getFtbEntryLen(pc: UInt, entry: FTBEntry) = (entry.getFallThrough(pc) - pc) >> instOffsetBits 1587209a4cafSSteve Gou val gen_ftb_entry_len = getFtbEntryLen(update.pc, ftbEntryGen.new_entry) 1588209a4cafSSteve Gou XSPerfHistogram("ftb_init_entry_len", gen_ftb_entry_len, ftb_new_entry, 0, PredictWidth+1, 1) 1589209a4cafSSteve Gou XSPerfHistogram("ftb_modified_entry_len", gen_ftb_entry_len, ftb_modified_entry, 0, PredictWidth+1, 1) 1590209a4cafSSteve Gou val s3_ftb_entry_len = getFtbEntryLen(from_bpu.s3.pc(0), from_bpu.last_stage_ftb_entry) 1591209a4cafSSteve Gou XSPerfHistogram("s3_ftb_entry_len", s3_ftb_entry_len, from_bpu.s3.valid(0), 0, PredictWidth+1, 1) 159209c6f1ddSLingrui98 1593209a4cafSSteve Gou XSPerfHistogram("ftq_has_entry", validEntries, true.B, 0, FtqSize+1, 1) 159409c6f1ddSLingrui98 159509c6f1ddSLingrui98 val perfCountsMap = Map( 159609c6f1ddSLingrui98 "BpInstr" -> PopCount(mbpInstrs), 159709c6f1ddSLingrui98 "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs), 159809c6f1ddSLingrui98 "BpRight" -> PopCount(mbpRights), 159909c6f1ddSLingrui98 "BpWrong" -> PopCount(mbpWrongs), 160009c6f1ddSLingrui98 "BpBRight" -> PopCount(mbpBRights), 160109c6f1ddSLingrui98 "BpBWrong" -> PopCount(mbpBWrongs), 160209c6f1ddSLingrui98 "BpJRight" -> PopCount(mbpJRights), 160309c6f1ddSLingrui98 "BpJWrong" -> PopCount(mbpJWrongs), 160409c6f1ddSLingrui98 "BpIRight" -> PopCount(mbpIRights), 160509c6f1ddSLingrui98 "BpIWrong" -> PopCount(mbpIWrongs), 160609c6f1ddSLingrui98 "BpCRight" -> PopCount(mbpCRights), 160709c6f1ddSLingrui98 "BpCWrong" -> PopCount(mbpCWrongs), 160809c6f1ddSLingrui98 "BpRRight" -> PopCount(mbpRRights), 160909c6f1ddSLingrui98 "BpRWrong" -> PopCount(mbpRWrongs), 161009c6f1ddSLingrui98 161109c6f1ddSLingrui98 "ftb_false_hit" -> PopCount(ftb_false_hit), 161209c6f1ddSLingrui98 "ftb_hit" -> PopCount(ftb_hit), 161309c6f1ddSLingrui98 "ftb_new_entry" -> PopCount(ftb_new_entry), 161409c6f1ddSLingrui98 "ftb_new_entry_only_br" -> PopCount(ftb_new_entry_only_br), 161509c6f1ddSLingrui98 "ftb_new_entry_only_jmp" -> PopCount(ftb_new_entry_only_jmp), 161609c6f1ddSLingrui98 "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp), 161709c6f1ddSLingrui98 "ftb_old_entry" -> PopCount(ftb_old_entry), 161809c6f1ddSLingrui98 "ftb_modified_entry" -> PopCount(ftb_modified_entry), 161909c6f1ddSLingrui98 "ftb_modified_entry_new_br" -> PopCount(ftb_modified_entry_new_br), 162009c6f1ddSLingrui98 "ftb_jalr_target_modified" -> PopCount(ftb_modified_entry_jalr_target_modified), 162109c6f1ddSLingrui98 "ftb_modified_entry_br_full" -> PopCount(ftb_modified_entry_br_full), 162209c6f1ddSLingrui98 "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken) 1623209a4cafSSteve Gou ) ++ mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++ 16241d7e5011SLingrui98 correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map 162509c6f1ddSLingrui98 162609c6f1ddSLingrui98 for((key, value) <- perfCountsMap) { 162709c6f1ddSLingrui98 XSPerfAccumulate(key, value) 162809c6f1ddSLingrui98 } 162909c6f1ddSLingrui98 163009c6f1ddSLingrui98 // --------------------------- Debug -------------------------------- 163109c6f1ddSLingrui98 // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable) 163209c6f1ddSLingrui98 XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable) 163309c6f1ddSLingrui98 XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n") 163409c6f1ddSLingrui98 XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n") 163509c6f1ddSLingrui98 XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " + 163609c6f1ddSLingrui98 p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n") 163709c6f1ddSLingrui98 XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n") 163809c6f1ddSLingrui98 163909c6f1ddSLingrui98 // def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 164009c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 164109c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 164209c6f1ddSLingrui98 // Mux(valid && pd.isBr, 164309c6f1ddSLingrui98 // isWrong ^ Mux(ans.hit.asBool, 164409c6f1ddSLingrui98 // Mux(ans.taken.asBool, taken && ans.target === commitEntry.target, 164509c6f1ddSLingrui98 // !taken), 164609c6f1ddSLingrui98 // !taken), 164709c6f1ddSLingrui98 // false.B) 164809c6f1ddSLingrui98 // } 164909c6f1ddSLingrui98 // } 165009c6f1ddSLingrui98 165109c6f1ddSLingrui98 // def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 165209c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 165309c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 165409c6f1ddSLingrui98 // Mux(valid && pd.isBr, 165509c6f1ddSLingrui98 // isWrong ^ Mux(ans.hit.asBool, 165609c6f1ddSLingrui98 // Mux(ans.taken.asBool, taken && ans.target === commitEntry.target, 165709c6f1ddSLingrui98 // !taken), 165809c6f1ddSLingrui98 // !taken), 165909c6f1ddSLingrui98 // false.B) 166009c6f1ddSLingrui98 // } 166109c6f1ddSLingrui98 // } 166209c6f1ddSLingrui98 166309c6f1ddSLingrui98 // def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 166409c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 166509c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 166609c6f1ddSLingrui98 // Mux(valid && pd.isBr, 166709c6f1ddSLingrui98 // isWrong ^ (ans.taken.asBool === taken), 166809c6f1ddSLingrui98 // false.B) 166909c6f1ddSLingrui98 // } 167009c6f1ddSLingrui98 // } 167109c6f1ddSLingrui98 167209c6f1ddSLingrui98 // def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 167309c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 167409c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 167509c6f1ddSLingrui98 // Mux(valid && (pd.isBr) && ans.hit.asBool, 167609c6f1ddSLingrui98 // isWrong ^ (!taken), 167709c6f1ddSLingrui98 // false.B) 167809c6f1ddSLingrui98 // } 167909c6f1ddSLingrui98 // } 168009c6f1ddSLingrui98 168109c6f1ddSLingrui98 // def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 168209c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 168309c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 168409c6f1ddSLingrui98 // Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool, 168509c6f1ddSLingrui98 // isWrong ^ (ans.target === commitEntry.target), 168609c6f1ddSLingrui98 // false.B) 168709c6f1ddSLingrui98 // } 168809c6f1ddSLingrui98 // } 168909c6f1ddSLingrui98 169009c6f1ddSLingrui98 // val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B) 169109c6f1ddSLingrui98 // val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B) 169209c6f1ddSLingrui98 // // btb and ubtb pred jal and jalr as well 169309c6f1ddSLingrui98 // val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B) 169409c6f1ddSLingrui98 // val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B) 169509c6f1ddSLingrui98 // val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B) 169609c6f1ddSLingrui98 // val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B) 169709c6f1ddSLingrui98 169809c6f1ddSLingrui98 // val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B) 169909c6f1ddSLingrui98 // val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B) 170009c6f1ddSLingrui98 170109c6f1ddSLingrui98 // val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B) 170209c6f1ddSLingrui98 // val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B) 17031ca0e4f3SYinan Xu 1704cd365d4cSrvcoresjw val perfEvents = Seq( 1705cd365d4cSrvcoresjw ("bpu_s2_redirect ", bpu_s2_redirect ), 1706cb4f77ceSLingrui98 ("bpu_s3_redirect ", bpu_s3_redirect ), 1707cd365d4cSrvcoresjw ("bpu_to_ftq_stall ", enq.valid && ~enq.ready ), 1708cd365d4cSrvcoresjw ("mispredictRedirect ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level), 1709cd365d4cSrvcoresjw ("replayRedirect ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level) ), 1710cd365d4cSrvcoresjw ("predecodeRedirect ", fromIfuRedirect.valid ), 1711cd365d4cSrvcoresjw ("to_ifu_bubble ", io.toIfu.req.ready && !io.toIfu.req.valid ), 1712cd365d4cSrvcoresjw ("from_bpu_real_bubble ", !enq.valid && enq.ready && allowBpuIn ), 1713cd365d4cSrvcoresjw ("BpInstr ", PopCount(mbpInstrs) ), 1714cd365d4cSrvcoresjw ("BpBInstr ", PopCount(mbpBRights | mbpBWrongs) ), 1715cd365d4cSrvcoresjw ("BpRight ", PopCount(mbpRights) ), 1716cd365d4cSrvcoresjw ("BpWrong ", PopCount(mbpWrongs) ), 1717cd365d4cSrvcoresjw ("BpBRight ", PopCount(mbpBRights) ), 1718cd365d4cSrvcoresjw ("BpBWrong ", PopCount(mbpBWrongs) ), 1719cd365d4cSrvcoresjw ("BpJRight ", PopCount(mbpJRights) ), 1720cd365d4cSrvcoresjw ("BpJWrong ", PopCount(mbpJWrongs) ), 1721cd365d4cSrvcoresjw ("BpIRight ", PopCount(mbpIRights) ), 1722cd365d4cSrvcoresjw ("BpIWrong ", PopCount(mbpIWrongs) ), 1723cd365d4cSrvcoresjw ("BpCRight ", PopCount(mbpCRights) ), 1724cd365d4cSrvcoresjw ("BpCWrong ", PopCount(mbpCWrongs) ), 1725cd365d4cSrvcoresjw ("BpRRight ", PopCount(mbpRRights) ), 1726cd365d4cSrvcoresjw ("BpRWrong ", PopCount(mbpRWrongs) ), 1727cd365d4cSrvcoresjw ("ftb_false_hit ", PopCount(ftb_false_hit) ), 1728cd365d4cSrvcoresjw ("ftb_hit ", PopCount(ftb_hit) ), 1729cd365d4cSrvcoresjw ) 17301ca0e4f3SYinan Xu generatePerfEvent() 173109c6f1ddSLingrui98} 1732