109c6f1ddSLingrui98/*************************************************************************************** 209c6f1ddSLingrui98* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 309c6f1ddSLingrui98* Copyright (c) 2020-2021 Peng Cheng Laboratory 409c6f1ddSLingrui98* 509c6f1ddSLingrui98* XiangShan is licensed under Mulan PSL v2. 609c6f1ddSLingrui98* You can use this software according to the terms and conditions of the Mulan PSL v2. 709c6f1ddSLingrui98* You may obtain a copy of Mulan PSL v2 at: 809c6f1ddSLingrui98* http://license.coscl.org.cn/MulanPSL2 909c6f1ddSLingrui98* 1009c6f1ddSLingrui98* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 1109c6f1ddSLingrui98* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 1209c6f1ddSLingrui98* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 1309c6f1ddSLingrui98* 1409c6f1ddSLingrui98* See the Mulan PSL v2 for more details. 1509c6f1ddSLingrui98***************************************************************************************/ 1609c6f1ddSLingrui98 1709c6f1ddSLingrui98package xiangshan.frontend 1809c6f1ddSLingrui98 198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters 2009c6f1ddSLingrui98import chisel3._ 2109c6f1ddSLingrui98import chisel3.util._ 221ca0e4f3SYinan Xuimport utils._ 233c02ee8fSwakafaimport utility._ 2409c6f1ddSLingrui98import xiangshan._ 25e30430c2SJayimport xiangshan.frontend.icache._ 261ca0e4f3SYinan Xuimport xiangshan.backend.CtrlToFtqIO 272e1be6e1SSteve Gouimport xiangshan.backend.decode.ImmUnion 283c02ee8fSwakafaimport utility.ChiselDB 2951532d8bSGuokai Chen 3051532d8bSGuokai Chenclass FtqDebugBundle extends Bundle { 3151532d8bSGuokai Chen val pc = UInt(39.W) 3251532d8bSGuokai Chen val target = UInt(39.W) 3351532d8bSGuokai Chen val isBr = Bool() 3451532d8bSGuokai Chen val isJmp = Bool() 3551532d8bSGuokai Chen val isCall = Bool() 3651532d8bSGuokai Chen val isRet = Bool() 3751532d8bSGuokai Chen val misPred = Bool() 3851532d8bSGuokai Chen val isTaken = Bool() 3951532d8bSGuokai Chen val predStage = UInt(2.W) 4051532d8bSGuokai Chen} 4109c6f1ddSLingrui98 423b739f49SXuan Huclass FtqPtr(entries: Int) extends CircularQueuePtr[FtqPtr]( 433b739f49SXuan Hu entries 4409c6f1ddSLingrui98){ 453b739f49SXuan Hu def this()(implicit p: Parameters) = this(p(XSCoreParamsKey).FtqSize) 4609c6f1ddSLingrui98} 4709c6f1ddSLingrui98 4809c6f1ddSLingrui98object FtqPtr { 4909c6f1ddSLingrui98 def apply(f: Bool, v: UInt)(implicit p: Parameters): FtqPtr = { 5009c6f1ddSLingrui98 val ptr = Wire(new FtqPtr) 5109c6f1ddSLingrui98 ptr.flag := f 5209c6f1ddSLingrui98 ptr.value := v 5309c6f1ddSLingrui98 ptr 5409c6f1ddSLingrui98 } 5509c6f1ddSLingrui98 def inverse(ptr: FtqPtr)(implicit p: Parameters): FtqPtr = { 5609c6f1ddSLingrui98 apply(!ptr.flag, ptr.value) 5709c6f1ddSLingrui98 } 5809c6f1ddSLingrui98} 5909c6f1ddSLingrui98 6009c6f1ddSLingrui98class FtqNRSRAM[T <: Data](gen: T, numRead: Int)(implicit p: Parameters) extends XSModule { 6109c6f1ddSLingrui98 6209c6f1ddSLingrui98 val io = IO(new Bundle() { 6309c6f1ddSLingrui98 val raddr = Input(Vec(numRead, UInt(log2Up(FtqSize).W))) 6409c6f1ddSLingrui98 val ren = Input(Vec(numRead, Bool())) 6509c6f1ddSLingrui98 val rdata = Output(Vec(numRead, gen)) 6609c6f1ddSLingrui98 val waddr = Input(UInt(log2Up(FtqSize).W)) 6709c6f1ddSLingrui98 val wen = Input(Bool()) 6809c6f1ddSLingrui98 val wdata = Input(gen) 6909c6f1ddSLingrui98 }) 7009c6f1ddSLingrui98 7109c6f1ddSLingrui98 for(i <- 0 until numRead){ 7209c6f1ddSLingrui98 val sram = Module(new SRAMTemplate(gen, FtqSize)) 7309c6f1ddSLingrui98 sram.io.r.req.valid := io.ren(i) 7409c6f1ddSLingrui98 sram.io.r.req.bits.setIdx := io.raddr(i) 7509c6f1ddSLingrui98 io.rdata(i) := sram.io.r.resp.data(0) 7609c6f1ddSLingrui98 sram.io.w.req.valid := io.wen 7709c6f1ddSLingrui98 sram.io.w.req.bits.setIdx := io.waddr 7809c6f1ddSLingrui98 sram.io.w.req.bits.data := VecInit(io.wdata) 7909c6f1ddSLingrui98 } 8009c6f1ddSLingrui98 8109c6f1ddSLingrui98} 8209c6f1ddSLingrui98 8309c6f1ddSLingrui98class Ftq_RF_Components(implicit p: Parameters) extends XSBundle with BPUUtils { 8409c6f1ddSLingrui98 val startAddr = UInt(VAddrBits.W) 85b37e4b45SLingrui98 val nextLineAddr = UInt(VAddrBits.W) 8609c6f1ddSLingrui98 val isNextMask = Vec(PredictWidth, Bool()) 87b37e4b45SLingrui98 val fallThruError = Bool() 88b37e4b45SLingrui98 // val carry = Bool() 8909c6f1ddSLingrui98 def getPc(offset: UInt) = { 9085215037SLingrui98 def getHigher(pc: UInt) = pc(VAddrBits-1, log2Ceil(PredictWidth)+instOffsetBits+1) 9185215037SLingrui98 def getOffset(pc: UInt) = pc(log2Ceil(PredictWidth)+instOffsetBits, instOffsetBits) 92b37e4b45SLingrui98 Cat(getHigher(Mux(isNextMask(offset) && startAddr(log2Ceil(PredictWidth)+instOffsetBits), nextLineAddr, startAddr)), 9309c6f1ddSLingrui98 getOffset(startAddr)+offset, 0.U(instOffsetBits.W)) 9409c6f1ddSLingrui98 } 9509c6f1ddSLingrui98 def fromBranchPrediction(resp: BranchPredictionBundle) = { 96a229ab6cSLingrui98 def carryPos(addr: UInt) = addr(instOffsetBits+log2Ceil(PredictWidth)+1) 97adc0b8dfSGuokai Chen this.startAddr := resp.pc(3) 98adc0b8dfSGuokai Chen this.nextLineAddr := resp.pc(3) + (FetchWidth * 4 * 2).U // may be broken on other configs 9909c6f1ddSLingrui98 this.isNextMask := VecInit((0 until PredictWidth).map(i => 100935edac4STang Haojin (resp.pc(3)(log2Ceil(PredictWidth), 1) +& i.U)(log2Ceil(PredictWidth)).asBool 10109c6f1ddSLingrui98 )) 102adc0b8dfSGuokai Chen this.fallThruError := resp.fallThruError(3) 10309c6f1ddSLingrui98 this 10409c6f1ddSLingrui98 } 10509c6f1ddSLingrui98 override def toPrintable: Printable = { 106b37e4b45SLingrui98 p"startAddr:${Hexadecimal(startAddr)}" 10709c6f1ddSLingrui98 } 10809c6f1ddSLingrui98} 10909c6f1ddSLingrui98 11009c6f1ddSLingrui98class Ftq_pd_Entry(implicit p: Parameters) extends XSBundle { 11109c6f1ddSLingrui98 val brMask = Vec(PredictWidth, Bool()) 11209c6f1ddSLingrui98 val jmpInfo = ValidUndirectioned(Vec(3, Bool())) 11309c6f1ddSLingrui98 val jmpOffset = UInt(log2Ceil(PredictWidth).W) 11409c6f1ddSLingrui98 val jalTarget = UInt(VAddrBits.W) 11509c6f1ddSLingrui98 val rvcMask = Vec(PredictWidth, Bool()) 11609c6f1ddSLingrui98 def hasJal = jmpInfo.valid && !jmpInfo.bits(0) 11709c6f1ddSLingrui98 def hasJalr = jmpInfo.valid && jmpInfo.bits(0) 11809c6f1ddSLingrui98 def hasCall = jmpInfo.valid && jmpInfo.bits(1) 11909c6f1ddSLingrui98 def hasRet = jmpInfo.valid && jmpInfo.bits(2) 12009c6f1ddSLingrui98 12109c6f1ddSLingrui98 def fromPdWb(pdWb: PredecodeWritebackBundle) = { 12209c6f1ddSLingrui98 val pds = pdWb.pd 12309c6f1ddSLingrui98 this.brMask := VecInit(pds.map(pd => pd.isBr && pd.valid)) 12409c6f1ddSLingrui98 this.jmpInfo.valid := VecInit(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)).asUInt.orR 12509c6f1ddSLingrui98 this.jmpInfo.bits := ParallelPriorityMux(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid), 12609c6f1ddSLingrui98 pds.map(pd => VecInit(pd.isJalr, pd.isCall, pd.isRet))) 12709c6f1ddSLingrui98 this.jmpOffset := ParallelPriorityEncoder(pds.map(pd => (pd.isJal || pd.isJalr) && pd.valid)) 12809c6f1ddSLingrui98 this.rvcMask := VecInit(pds.map(pd => pd.isRVC)) 12909c6f1ddSLingrui98 this.jalTarget := pdWb.jalTarget 13009c6f1ddSLingrui98 } 13109c6f1ddSLingrui98 13209c6f1ddSLingrui98 def toPd(offset: UInt) = { 13309c6f1ddSLingrui98 require(offset.getWidth == log2Ceil(PredictWidth)) 13409c6f1ddSLingrui98 val pd = Wire(new PreDecodeInfo) 13509c6f1ddSLingrui98 pd.valid := true.B 13609c6f1ddSLingrui98 pd.isRVC := rvcMask(offset) 13709c6f1ddSLingrui98 val isBr = brMask(offset) 13809c6f1ddSLingrui98 val isJalr = offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(0) 13909c6f1ddSLingrui98 pd.brType := Cat(offset === jmpOffset && jmpInfo.valid, isJalr || isBr) 14009c6f1ddSLingrui98 pd.isCall := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(1) 14109c6f1ddSLingrui98 pd.isRet := offset === jmpOffset && jmpInfo.valid && jmpInfo.bits(2) 14209c6f1ddSLingrui98 pd 14309c6f1ddSLingrui98 } 14409c6f1ddSLingrui98} 14509c6f1ddSLingrui98 146f9c51548Sssszwicclass PrefetchPtrDB(implicit p: Parameters) extends Bundle { 147f9c51548Sssszwic val fromFtqPtr = UInt(log2Up(p(XSCoreParamsKey).FtqSize).W) 148f9c51548Sssszwic val fromIfuPtr = UInt(log2Up(p(XSCoreParamsKey).FtqSize).W) 149f9c51548Sssszwic} 15009c6f1ddSLingrui98 1513711cf36S小造xu_zhclass Ftq_Redirect_SRAMEntry(implicit p: Parameters) extends SpeculativeInfo { 152abdc3a32Sxu_zh val sc_disagree = if (!env.FPGAPlatform) Some(Vec(numBr, Bool())) else None 1533711cf36S小造xu_zh} 15409c6f1ddSLingrui98 15509c6f1ddSLingrui98class Ftq_1R_SRAMEntry(implicit p: Parameters) extends XSBundle with HasBPUConst { 15609c6f1ddSLingrui98 val meta = UInt(MaxMetaLength.W) 15709c6f1ddSLingrui98} 15809c6f1ddSLingrui98 15909c6f1ddSLingrui98class Ftq_Pred_Info(implicit p: Parameters) extends XSBundle { 16009c6f1ddSLingrui98 val target = UInt(VAddrBits.W) 16109c6f1ddSLingrui98 val cfiIndex = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)) 16209c6f1ddSLingrui98} 16309c6f1ddSLingrui98 16409c6f1ddSLingrui98 16509c6f1ddSLingrui98class FtqRead[T <: Data](private val gen: T)(implicit p: Parameters) extends XSBundle { 166*9477429fSsinceforYy val vld = Output(Bool()) 16709c6f1ddSLingrui98 val ptr = Output(new FtqPtr) 16809c6f1ddSLingrui98 val offset = Output(UInt(log2Ceil(PredictWidth).W)) 16909c6f1ddSLingrui98 val data = Input(gen) 170*9477429fSsinceforYy def apply(vld: Bool, ptr: FtqPtr, offset: UInt) = { 171*9477429fSsinceforYy this.vld := vld 17209c6f1ddSLingrui98 this.ptr := ptr 17309c6f1ddSLingrui98 this.offset := offset 17409c6f1ddSLingrui98 this.data 17509c6f1ddSLingrui98 } 17609c6f1ddSLingrui98} 17709c6f1ddSLingrui98 17809c6f1ddSLingrui98 17909c6f1ddSLingrui98class FtqToBpuIO(implicit p: Parameters) extends XSBundle { 18009c6f1ddSLingrui98 val redirect = Valid(new BranchPredictionRedirect) 18109c6f1ddSLingrui98 val update = Valid(new BranchPredictionUpdate) 18209c6f1ddSLingrui98 val enq_ptr = Output(new FtqPtr) 18309c6f1ddSLingrui98} 18409c6f1ddSLingrui98 18509c6f1ddSLingrui98class FtqToIfuIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper { 18609c6f1ddSLingrui98 val req = Decoupled(new FetchRequestBundle) 187d2b20d1aSTang Haojin val redirect = Valid(new BranchPredictionRedirect) 188d2b20d1aSTang Haojin val topdown_redirect = Valid(new BranchPredictionRedirect) 18909c6f1ddSLingrui98 val flushFromBpu = new Bundle { 19009c6f1ddSLingrui98 // when ifu pipeline is not stalled, 19109c6f1ddSLingrui98 // a packet from bpu s3 can reach f1 at most 19209c6f1ddSLingrui98 val s2 = Valid(new FtqPtr) 193cb4f77ceSLingrui98 val s3 = Valid(new FtqPtr) 19409c6f1ddSLingrui98 def shouldFlushBy(src: Valid[FtqPtr], idx_to_flush: FtqPtr) = { 19509c6f1ddSLingrui98 src.valid && !isAfter(src.bits, idx_to_flush) 19609c6f1ddSLingrui98 } 19709c6f1ddSLingrui98 def shouldFlushByStage2(idx: FtqPtr) = shouldFlushBy(s2, idx) 198cb4f77ceSLingrui98 def shouldFlushByStage3(idx: FtqPtr) = shouldFlushBy(s3, idx) 19909c6f1ddSLingrui98 } 20009c6f1ddSLingrui98} 20109c6f1ddSLingrui98 202c5c5edaeSJeniusclass FtqToICacheIO(implicit p: Parameters) extends XSBundle with HasCircularQueuePtrHelper { 203c5c5edaeSJenius //NOTE: req.bits must be prepare in T cycle 204c5c5edaeSJenius // while req.valid is set true in T + 1 cycle 205c5c5edaeSJenius val req = Decoupled(new FtqToICacheRequestBundle) 206c5c5edaeSJenius} 207c5c5edaeSJenius 20809c6f1ddSLingrui98trait HasBackendRedirectInfo extends HasXSParameter { 20909c6f1ddSLingrui98 def isLoadReplay(r: Valid[Redirect]) = r.bits.flushItself() 21009c6f1ddSLingrui98} 21109c6f1ddSLingrui98 21209c6f1ddSLingrui98class FtqToCtrlIO(implicit p: Parameters) extends XSBundle with HasBackendRedirectInfo { 213b56f947eSYinan Xu // write to backend pc mem 214b56f947eSYinan Xu val pc_mem_wen = Output(Bool()) 215b56f947eSYinan Xu val pc_mem_waddr = Output(UInt(log2Ceil(FtqSize).W)) 216b56f947eSYinan Xu val pc_mem_wdata = Output(new Ftq_RF_Components) 217873dc383SLingrui98 // newest target 2186022c595SsinceforYy val newest_entry_en = Output(Bool()) 219873dc383SLingrui98 val newest_entry_target = Output(UInt(VAddrBits.W)) 220873dc383SLingrui98 val newest_entry_ptr = Output(new FtqPtr) 22109c6f1ddSLingrui98} 22209c6f1ddSLingrui98 22309c6f1ddSLingrui98 22409c6f1ddSLingrui98class FTBEntryGen(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo with HasBPUParameter { 22509c6f1ddSLingrui98 val io = IO(new Bundle { 22609c6f1ddSLingrui98 val start_addr = Input(UInt(VAddrBits.W)) 22709c6f1ddSLingrui98 val old_entry = Input(new FTBEntry) 22809c6f1ddSLingrui98 val pd = Input(new Ftq_pd_Entry) 22909c6f1ddSLingrui98 val cfiIndex = Flipped(Valid(UInt(log2Ceil(PredictWidth).W))) 23009c6f1ddSLingrui98 val target = Input(UInt(VAddrBits.W)) 23109c6f1ddSLingrui98 val hit = Input(Bool()) 23209c6f1ddSLingrui98 val mispredict_vec = Input(Vec(PredictWidth, Bool())) 23309c6f1ddSLingrui98 23409c6f1ddSLingrui98 val new_entry = Output(new FTBEntry) 23509c6f1ddSLingrui98 val new_br_insert_pos = Output(Vec(numBr, Bool())) 23609c6f1ddSLingrui98 val taken_mask = Output(Vec(numBr, Bool())) 237803124a6SLingrui98 val jmp_taken = Output(Bool()) 23809c6f1ddSLingrui98 val mispred_mask = Output(Vec(numBr+1, Bool())) 23909c6f1ddSLingrui98 24009c6f1ddSLingrui98 // for perf counters 24109c6f1ddSLingrui98 val is_init_entry = Output(Bool()) 24209c6f1ddSLingrui98 val is_old_entry = Output(Bool()) 24309c6f1ddSLingrui98 val is_new_br = Output(Bool()) 24409c6f1ddSLingrui98 val is_jalr_target_modified = Output(Bool()) 24509c6f1ddSLingrui98 val is_always_taken_modified = Output(Bool()) 24609c6f1ddSLingrui98 val is_br_full = Output(Bool()) 24709c6f1ddSLingrui98 }) 24809c6f1ddSLingrui98 24909c6f1ddSLingrui98 // no mispredictions detected at predecode 25009c6f1ddSLingrui98 val hit = io.hit 25109c6f1ddSLingrui98 val pd = io.pd 25209c6f1ddSLingrui98 25309c6f1ddSLingrui98 val init_entry = WireInit(0.U.asTypeOf(new FTBEntry)) 25409c6f1ddSLingrui98 25509c6f1ddSLingrui98 25609c6f1ddSLingrui98 val cfi_is_br = pd.brMask(io.cfiIndex.bits) && io.cfiIndex.valid 25709c6f1ddSLingrui98 val entry_has_jmp = pd.jmpInfo.valid 25809c6f1ddSLingrui98 val new_jmp_is_jal = entry_has_jmp && !pd.jmpInfo.bits(0) && io.cfiIndex.valid 25909c6f1ddSLingrui98 val new_jmp_is_jalr = entry_has_jmp && pd.jmpInfo.bits(0) && io.cfiIndex.valid 26009c6f1ddSLingrui98 val new_jmp_is_call = entry_has_jmp && pd.jmpInfo.bits(1) && io.cfiIndex.valid 26109c6f1ddSLingrui98 val new_jmp_is_ret = entry_has_jmp && pd.jmpInfo.bits(2) && io.cfiIndex.valid 26209c6f1ddSLingrui98 val last_jmp_rvi = entry_has_jmp && pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask.last 263a60a2901SLingrui98 // val last_br_rvi = cfi_is_br && io.cfiIndex.bits === (PredictWidth-1).U && !pd.rvcMask.last 26409c6f1ddSLingrui98 26509c6f1ddSLingrui98 val cfi_is_jal = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jal 26609c6f1ddSLingrui98 val cfi_is_jalr = io.cfiIndex.bits === pd.jmpOffset && new_jmp_is_jalr 26709c6f1ddSLingrui98 268a60a2901SLingrui98 def carryPos = log2Ceil(PredictWidth)+instOffsetBits 26909c6f1ddSLingrui98 def getLower(pc: UInt) = pc(carryPos-1, instOffsetBits) 27009c6f1ddSLingrui98 // if not hit, establish a new entry 27109c6f1ddSLingrui98 init_entry.valid := true.B 27209c6f1ddSLingrui98 // tag is left for ftb to assign 273eeb5ff92SLingrui98 274eeb5ff92SLingrui98 // case br 275eeb5ff92SLingrui98 val init_br_slot = init_entry.getSlotForBr(0) 276eeb5ff92SLingrui98 when (cfi_is_br) { 277eeb5ff92SLingrui98 init_br_slot.valid := true.B 278eeb5ff92SLingrui98 init_br_slot.offset := io.cfiIndex.bits 279b37e4b45SLingrui98 init_br_slot.setLowerStatByTarget(io.start_addr, io.target, numBr == 1) 280eeb5ff92SLingrui98 init_entry.always_taken(0) := true.B // set to always taken on init 281eeb5ff92SLingrui98 } 282eeb5ff92SLingrui98 283eeb5ff92SLingrui98 // case jmp 284eeb5ff92SLingrui98 when (entry_has_jmp) { 285eeb5ff92SLingrui98 init_entry.tailSlot.offset := pd.jmpOffset 286eeb5ff92SLingrui98 init_entry.tailSlot.valid := new_jmp_is_jal || new_jmp_is_jalr 287eeb5ff92SLingrui98 init_entry.tailSlot.setLowerStatByTarget(io.start_addr, Mux(cfi_is_jalr, io.target, pd.jalTarget), isShare=false) 288eeb5ff92SLingrui98 } 289eeb5ff92SLingrui98 29009c6f1ddSLingrui98 val jmpPft = getLower(io.start_addr) +& pd.jmpOffset +& Mux(pd.rvcMask(pd.jmpOffset), 1.U, 2.U) 291a60a2901SLingrui98 init_entry.pftAddr := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft, getLower(io.start_addr)) 292a60a2901SLingrui98 init_entry.carry := Mux(entry_has_jmp && !last_jmp_rvi, jmpPft(carryPos-instOffsetBits), true.B) 29309c6f1ddSLingrui98 init_entry.isJalr := new_jmp_is_jalr 29409c6f1ddSLingrui98 init_entry.isCall := new_jmp_is_call 29509c6f1ddSLingrui98 init_entry.isRet := new_jmp_is_ret 296f4ebc4b2SLingrui98 // that means fall thru points to the middle of an inst 297ae409b75SSteve Gou init_entry.last_may_be_rvi_call := pd.jmpOffset === (PredictWidth-1).U && !pd.rvcMask(pd.jmpOffset) 29809c6f1ddSLingrui98 29909c6f1ddSLingrui98 // if hit, check whether a new cfi(only br is possible) is detected 30009c6f1ddSLingrui98 val oe = io.old_entry 301eeb5ff92SLingrui98 val br_recorded_vec = oe.getBrRecordedVec(io.cfiIndex.bits) 30209c6f1ddSLingrui98 val br_recorded = br_recorded_vec.asUInt.orR 30309c6f1ddSLingrui98 val is_new_br = cfi_is_br && !br_recorded 30409c6f1ddSLingrui98 val new_br_offset = io.cfiIndex.bits 30509c6f1ddSLingrui98 // vec(i) means new br will be inserted BEFORE old br(i) 306eeb5ff92SLingrui98 val allBrSlotsVec = oe.allSlotsForBr 30709c6f1ddSLingrui98 val new_br_insert_onehot = VecInit((0 until numBr).map{ 30809c6f1ddSLingrui98 i => i match { 309eeb5ff92SLingrui98 case 0 => 310eeb5ff92SLingrui98 !allBrSlotsVec(0).valid || new_br_offset < allBrSlotsVec(0).offset 311eeb5ff92SLingrui98 case idx => 312eeb5ff92SLingrui98 allBrSlotsVec(idx-1).valid && new_br_offset > allBrSlotsVec(idx-1).offset && 313eeb5ff92SLingrui98 (!allBrSlotsVec(idx).valid || new_br_offset < allBrSlotsVec(idx).offset) 31409c6f1ddSLingrui98 } 31509c6f1ddSLingrui98 }) 31609c6f1ddSLingrui98 31709c6f1ddSLingrui98 val old_entry_modified = WireInit(io.old_entry) 31809c6f1ddSLingrui98 for (i <- 0 until numBr) { 319eeb5ff92SLingrui98 val slot = old_entry_modified.allSlotsForBr(i) 320eeb5ff92SLingrui98 when (new_br_insert_onehot(i)) { 321eeb5ff92SLingrui98 slot.valid := true.B 322eeb5ff92SLingrui98 slot.offset := new_br_offset 323b37e4b45SLingrui98 slot.setLowerStatByTarget(io.start_addr, io.target, i == numBr-1) 324eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := true.B 325eeb5ff92SLingrui98 }.elsewhen (new_br_offset > oe.allSlotsForBr(i).offset) { 326eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := false.B 327eeb5ff92SLingrui98 // all other fields remain unchanged 328eeb5ff92SLingrui98 }.otherwise { 329eeb5ff92SLingrui98 // case i == 0, remain unchanged 330eeb5ff92SLingrui98 if (i != 0) { 331b37e4b45SLingrui98 val noNeedToMoveFromFormerSlot = (i == numBr-1).B && !oe.brSlots.last.valid 332eeb5ff92SLingrui98 when (!noNeedToMoveFromFormerSlot) { 333eeb5ff92SLingrui98 slot.fromAnotherSlot(oe.allSlotsForBr(i-1)) 334eeb5ff92SLingrui98 old_entry_modified.always_taken(i) := oe.always_taken(i) 33509c6f1ddSLingrui98 } 336eeb5ff92SLingrui98 } 337eeb5ff92SLingrui98 } 338eeb5ff92SLingrui98 } 33909c6f1ddSLingrui98 340eeb5ff92SLingrui98 // two circumstances: 341eeb5ff92SLingrui98 // 1. oe: | br | j |, new br should be in front of j, thus addr of j should be new pft 342eeb5ff92SLingrui98 // 2. oe: | br | br |, new br could be anywhere between, thus new pft is the addr of either 343eeb5ff92SLingrui98 // the previous last br or the new br 344eeb5ff92SLingrui98 val may_have_to_replace = oe.noEmptySlotForNewBr 345eeb5ff92SLingrui98 val pft_need_to_change = is_new_br && may_have_to_replace 34609c6f1ddSLingrui98 // it should either be the given last br or the new br 34709c6f1ddSLingrui98 when (pft_need_to_change) { 348eeb5ff92SLingrui98 val new_pft_offset = 349710a8720SLingrui98 Mux(!new_br_insert_onehot.asUInt.orR, 350710a8720SLingrui98 new_br_offset, oe.allSlotsForBr.last.offset) 351eeb5ff92SLingrui98 352710a8720SLingrui98 // set jmp to invalid 35309c6f1ddSLingrui98 old_entry_modified.pftAddr := getLower(io.start_addr) + new_pft_offset 35409c6f1ddSLingrui98 old_entry_modified.carry := (getLower(io.start_addr) +& new_pft_offset).head(1).asBool 355f4ebc4b2SLingrui98 old_entry_modified.last_may_be_rvi_call := false.B 35609c6f1ddSLingrui98 old_entry_modified.isCall := false.B 35709c6f1ddSLingrui98 old_entry_modified.isRet := false.B 358eeb5ff92SLingrui98 old_entry_modified.isJalr := false.B 35909c6f1ddSLingrui98 } 36009c6f1ddSLingrui98 36109c6f1ddSLingrui98 val old_entry_jmp_target_modified = WireInit(oe) 362710a8720SLingrui98 val old_target = oe.tailSlot.getTarget(io.start_addr) // may be wrong because we store only 20 lowest bits 363b37e4b45SLingrui98 val old_tail_is_jmp = !oe.tailSlot.sharing 364eeb5ff92SLingrui98 val jalr_target_modified = cfi_is_jalr && (old_target =/= io.target) && old_tail_is_jmp // TODO: pass full jalr target 3653bcae573SLingrui98 when (jalr_target_modified) { 36609c6f1ddSLingrui98 old_entry_jmp_target_modified.setByJmpTarget(io.start_addr, io.target) 36709c6f1ddSLingrui98 old_entry_jmp_target_modified.always_taken := 0.U.asTypeOf(Vec(numBr, Bool())) 36809c6f1ddSLingrui98 } 36909c6f1ddSLingrui98 37009c6f1ddSLingrui98 val old_entry_always_taken = WireInit(oe) 37109c6f1ddSLingrui98 val always_taken_modified_vec = Wire(Vec(numBr, Bool())) // whether modified or not 37209c6f1ddSLingrui98 for (i <- 0 until numBr) { 37309c6f1ddSLingrui98 old_entry_always_taken.always_taken(i) := 37409c6f1ddSLingrui98 oe.always_taken(i) && io.cfiIndex.valid && oe.brValids(i) && io.cfiIndex.bits === oe.brOffset(i) 375710a8720SLingrui98 always_taken_modified_vec(i) := oe.always_taken(i) && !old_entry_always_taken.always_taken(i) 37609c6f1ddSLingrui98 } 37709c6f1ddSLingrui98 val always_taken_modified = always_taken_modified_vec.reduce(_||_) 37809c6f1ddSLingrui98 37909c6f1ddSLingrui98 38009c6f1ddSLingrui98 38109c6f1ddSLingrui98 val derived_from_old_entry = 38209c6f1ddSLingrui98 Mux(is_new_br, old_entry_modified, 3833bcae573SLingrui98 Mux(jalr_target_modified, old_entry_jmp_target_modified, old_entry_always_taken)) 38409c6f1ddSLingrui98 38509c6f1ddSLingrui98 38609c6f1ddSLingrui98 io.new_entry := Mux(!hit, init_entry, derived_from_old_entry) 38709c6f1ddSLingrui98 38809c6f1ddSLingrui98 io.new_br_insert_pos := new_br_insert_onehot 38909c6f1ddSLingrui98 io.taken_mask := VecInit((io.new_entry.brOffset zip io.new_entry.brValids).map{ 39009c6f1ddSLingrui98 case (off, v) => io.cfiIndex.bits === off && io.cfiIndex.valid && v 39109c6f1ddSLingrui98 }) 392803124a6SLingrui98 io.jmp_taken := io.new_entry.jmpValid && io.new_entry.tailSlot.offset === io.cfiIndex.bits 39309c6f1ddSLingrui98 for (i <- 0 until numBr) { 39409c6f1ddSLingrui98 io.mispred_mask(i) := io.new_entry.brValids(i) && io.mispredict_vec(io.new_entry.brOffset(i)) 39509c6f1ddSLingrui98 } 39609c6f1ddSLingrui98 io.mispred_mask.last := io.new_entry.jmpValid && io.mispredict_vec(pd.jmpOffset) 39709c6f1ddSLingrui98 39809c6f1ddSLingrui98 // for perf counters 39909c6f1ddSLingrui98 io.is_init_entry := !hit 4003bcae573SLingrui98 io.is_old_entry := hit && !is_new_br && !jalr_target_modified && !always_taken_modified 40109c6f1ddSLingrui98 io.is_new_br := hit && is_new_br 4023bcae573SLingrui98 io.is_jalr_target_modified := hit && jalr_target_modified 40309c6f1ddSLingrui98 io.is_always_taken_modified := hit && always_taken_modified 404eeb5ff92SLingrui98 io.is_br_full := hit && is_new_br && may_have_to_replace 40509c6f1ddSLingrui98} 40609c6f1ddSLingrui98 407c5c5edaeSJeniusclass FtqPcMemWrapper(numOtherReads: Int)(implicit p: Parameters) extends XSModule with HasBackendRedirectInfo { 408c5c5edaeSJenius val io = IO(new Bundle { 409c5c5edaeSJenius val ifuPtr_w = Input(new FtqPtr) 410c5c5edaeSJenius val ifuPtrPlus1_w = Input(new FtqPtr) 4116bf9b30dSLingrui98 val ifuPtrPlus2_w = Input(new FtqPtr) 412c5c5edaeSJenius val commPtr_w = Input(new FtqPtr) 4136bf9b30dSLingrui98 val commPtrPlus1_w = Input(new FtqPtr) 414c5c5edaeSJenius val ifuPtr_rdata = Output(new Ftq_RF_Components) 415c5c5edaeSJenius val ifuPtrPlus1_rdata = Output(new Ftq_RF_Components) 4166bf9b30dSLingrui98 val ifuPtrPlus2_rdata = Output(new Ftq_RF_Components) 417c5c5edaeSJenius val commPtr_rdata = Output(new Ftq_RF_Components) 4186bf9b30dSLingrui98 val commPtrPlus1_rdata = Output(new Ftq_RF_Components) 419c5c5edaeSJenius 420c5c5edaeSJenius val other_raddrs = Input(Vec(numOtherReads, UInt(log2Ceil(FtqSize).W))) 421c5c5edaeSJenius val other_rdatas = Output(Vec(numOtherReads, new Ftq_RF_Components)) 422c5c5edaeSJenius 423c5c5edaeSJenius val wen = Input(Bool()) 424c5c5edaeSJenius val waddr = Input(UInt(log2Ceil(FtqSize).W)) 425c5c5edaeSJenius val wdata = Input(new Ftq_RF_Components) 426c5c5edaeSJenius }) 427c5c5edaeSJenius 4286bf9b30dSLingrui98 val num_pc_read = numOtherReads + 5 429c5c5edaeSJenius val mem = Module(new SyncDataModuleTemplate(new Ftq_RF_Components, FtqSize, 43028f2cf58SLingrui98 num_pc_read, 1, "FtqPC")) 431c5c5edaeSJenius mem.io.wen(0) := io.wen 432c5c5edaeSJenius mem.io.waddr(0) := io.waddr 433c5c5edaeSJenius mem.io.wdata(0) := io.wdata 434c5c5edaeSJenius 4356bf9b30dSLingrui98 // read one cycle ahead for ftq local reads 436c5c5edaeSJenius val raddr_vec = VecInit(io.other_raddrs ++ 43788bc4f90SLingrui98 Seq(io.ifuPtr_w.value, io.ifuPtrPlus1_w.value, io.ifuPtrPlus2_w.value, io.commPtrPlus1_w.value, io.commPtr_w.value)) 438c5c5edaeSJenius 439c5c5edaeSJenius mem.io.raddr := raddr_vec 440c5c5edaeSJenius 4416bf9b30dSLingrui98 io.other_rdatas := mem.io.rdata.dropRight(5) 4426bf9b30dSLingrui98 io.ifuPtr_rdata := mem.io.rdata.dropRight(4).last 4436bf9b30dSLingrui98 io.ifuPtrPlus1_rdata := mem.io.rdata.dropRight(3).last 4446bf9b30dSLingrui98 io.ifuPtrPlus2_rdata := mem.io.rdata.dropRight(2).last 4456bf9b30dSLingrui98 io.commPtrPlus1_rdata := mem.io.rdata.dropRight(1).last 446c5c5edaeSJenius io.commPtr_rdata := mem.io.rdata.last 447c5c5edaeSJenius} 448c5c5edaeSJenius 44909c6f1ddSLingrui98class Ftq(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper 450e30430c2SJay with HasBackendRedirectInfo with BPUUtils with HasBPUConst with HasPerfEvents 451e30430c2SJay with HasICacheParameters{ 45209c6f1ddSLingrui98 val io = IO(new Bundle { 45309c6f1ddSLingrui98 val fromBpu = Flipped(new BpuToFtqIO) 45409c6f1ddSLingrui98 val fromIfu = Flipped(new IfuToFtqIO) 45509c6f1ddSLingrui98 val fromBackend = Flipped(new CtrlToFtqIO) 45609c6f1ddSLingrui98 45709c6f1ddSLingrui98 val toBpu = new FtqToBpuIO 45809c6f1ddSLingrui98 val toIfu = new FtqToIfuIO 459c5c5edaeSJenius val toICache = new FtqToICacheIO 46009c6f1ddSLingrui98 val toBackend = new FtqToCtrlIO 46109c6f1ddSLingrui98 4627052722fSJay val toPrefetch = new FtqPrefechBundle 4637052722fSJay 46409c6f1ddSLingrui98 val bpuInfo = new Bundle { 46509c6f1ddSLingrui98 val bpRight = Output(UInt(XLEN.W)) 46609c6f1ddSLingrui98 val bpWrong = Output(UInt(XLEN.W)) 46709c6f1ddSLingrui98 } 4681d1e6d4dSJenius 4691d1e6d4dSJenius val mmioCommitRead = Flipped(new mmioCommitRead) 470d2b20d1aSTang Haojin 471d2b20d1aSTang Haojin // for perf 472d2b20d1aSTang Haojin val ControlBTBMissBubble = Output(Bool()) 473d2b20d1aSTang Haojin val TAGEMissBubble = Output(Bool()) 474d2b20d1aSTang Haojin val SCMissBubble = Output(Bool()) 475d2b20d1aSTang Haojin val ITTAGEMissBubble = Output(Bool()) 476d2b20d1aSTang Haojin val RASMissBubble = Output(Bool()) 47709c6f1ddSLingrui98 }) 47809c6f1ddSLingrui98 io.bpuInfo := DontCare 47909c6f1ddSLingrui98 480d2b20d1aSTang Haojin val topdown_stage = RegInit(0.U.asTypeOf(new FrontendTopDownBundle)) 481d2b20d1aSTang Haojin // only driven by clock, not valid-ready 482d2b20d1aSTang Haojin topdown_stage := io.fromBpu.resp.bits.topdown_info 483d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info := topdown_stage 484d2b20d1aSTang Haojin 485d2b20d1aSTang Haojin val ifuRedirected = RegInit(VecInit(Seq.fill(FtqSize)(false.B))) 486d2b20d1aSTang Haojin 487bace178aSGao-Zeyu 48842dddaceSXuan Hu // io.fromBackend.ftqIdxAhead: bju(BjuCnt) + ldReplay + exception 48942dddaceSXuan Hu val ftqIdxAhead = VecInit(Seq.tabulate(FtqRedirectAheadNum)(i => io.fromBackend.ftqIdxAhead(i))) // only bju 49042dddaceSXuan Hu val ftqIdxSelOH = io.fromBackend.ftqIdxSelOH.bits(FtqRedirectAheadNum - 1, 0) 491bace178aSGao-Zeyu 492bace178aSGao-Zeyu val aheadValid = ftqIdxAhead.map(_.valid).reduce(_|_) && !io.fromBackend.redirect.valid 493bace178aSGao-Zeyu val realAhdValid = io.fromBackend.redirect.valid && (ftqIdxSelOH > 0.U) && RegNext(aheadValid) 494d2b20d1aSTang Haojin val backendRedirect = Wire(Valid(new BranchPredictionRedirect)) 495bace178aSGao-Zeyu val backendRedirectReg = RegNext(backendRedirect) 496bace178aSGao-Zeyu backendRedirectReg.valid := Mux(realAhdValid, 0.B, backendRedirect.valid) 497bace178aSGao-Zeyu val fromBackendRedirect = Wire(Valid(new BranchPredictionRedirect)) 498bace178aSGao-Zeyu fromBackendRedirect := Mux(realAhdValid, backendRedirect, backendRedirectReg) 49909c6f1ddSLingrui98 500df5b4b8eSYinan Xu val stage2Flush = backendRedirect.valid 50109c6f1ddSLingrui98 val backendFlush = stage2Flush || RegNext(stage2Flush) 50209c6f1ddSLingrui98 val ifuFlush = Wire(Bool()) 50309c6f1ddSLingrui98 50409c6f1ddSLingrui98 val flush = stage2Flush || RegNext(stage2Flush) 50509c6f1ddSLingrui98 50609c6f1ddSLingrui98 val allowBpuIn, allowToIfu = WireInit(false.B) 50709c6f1ddSLingrui98 val flushToIfu = !allowToIfu 508bace178aSGao-Zeyu allowBpuIn := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid 509bace178aSGao-Zeyu allowToIfu := !ifuFlush && !backendRedirect.valid && !backendRedirectReg.valid 51009c6f1ddSLingrui98 511f56177cbSJenius def copyNum = 5 51289cc69c1STang Haojin val bpuPtr, ifuPtr, ifuWbPtr, commPtr, robCommPtr = RegInit(FtqPtr(false.B, 0.U)) 513c9bc5480SLingrui98 val ifuPtrPlus1 = RegInit(FtqPtr(false.B, 1.U)) 5146bf9b30dSLingrui98 val ifuPtrPlus2 = RegInit(FtqPtr(false.B, 2.U)) 5156bf9b30dSLingrui98 val commPtrPlus1 = RegInit(FtqPtr(false.B, 1.U)) 516f56177cbSJenius val copied_ifu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U))) 517dc270d3bSJenius val copied_bpu_ptr = Seq.fill(copyNum)(RegInit(FtqPtr(false.B, 0.U))) 5186bf9b30dSLingrui98 require(FtqSize >= 4) 519c5c5edaeSJenius val ifuPtr_write = WireInit(ifuPtr) 520c5c5edaeSJenius val ifuPtrPlus1_write = WireInit(ifuPtrPlus1) 5216bf9b30dSLingrui98 val ifuPtrPlus2_write = WireInit(ifuPtrPlus2) 522c5c5edaeSJenius val ifuWbPtr_write = WireInit(ifuWbPtr) 523c5c5edaeSJenius val commPtr_write = WireInit(commPtr) 5246bf9b30dSLingrui98 val commPtrPlus1_write = WireInit(commPtrPlus1) 52589cc69c1STang Haojin val robCommPtr_write = WireInit(robCommPtr) 526c5c5edaeSJenius ifuPtr := ifuPtr_write 527c5c5edaeSJenius ifuPtrPlus1 := ifuPtrPlus1_write 5286bf9b30dSLingrui98 ifuPtrPlus2 := ifuPtrPlus2_write 529c5c5edaeSJenius ifuWbPtr := ifuWbPtr_write 530c5c5edaeSJenius commPtr := commPtr_write 531f83ef67eSLingrui98 commPtrPlus1 := commPtrPlus1_write 532f56177cbSJenius copied_ifu_ptr.map{ptr => 533f56177cbSJenius ptr := ifuPtr_write 534f56177cbSJenius dontTouch(ptr) 535f56177cbSJenius } 53689cc69c1STang Haojin robCommPtr := robCommPtr_write 53709c6f1ddSLingrui98 val validEntries = distanceBetween(bpuPtr, commPtr) 53843aca6c2SGuokai Chen val canCommit = Wire(Bool()) 53909c6f1ddSLingrui98 54009c6f1ddSLingrui98 // ********************************************************************** 54109c6f1ddSLingrui98 // **************************** enq from bpu **************************** 54209c6f1ddSLingrui98 // ********************************************************************** 54343aca6c2SGuokai Chen val new_entry_ready = validEntries < FtqSize.U || canCommit 54409c6f1ddSLingrui98 io.fromBpu.resp.ready := new_entry_ready 54509c6f1ddSLingrui98 54609c6f1ddSLingrui98 val bpu_s2_resp = io.fromBpu.resp.bits.s2 547cb4f77ceSLingrui98 val bpu_s3_resp = io.fromBpu.resp.bits.s3 548adc0b8dfSGuokai Chen val bpu_s2_redirect = bpu_s2_resp.valid(3) && bpu_s2_resp.hasRedirect(3) 549adc0b8dfSGuokai Chen val bpu_s3_redirect = bpu_s3_resp.valid(3) && bpu_s3_resp.hasRedirect(3) 55009c6f1ddSLingrui98 55109c6f1ddSLingrui98 io.toBpu.enq_ptr := bpuPtr 552935edac4STang Haojin val enq_fire = io.fromBpu.resp.fire && allowBpuIn // from bpu s1 553935edac4STang Haojin val bpu_in_fire = (io.fromBpu.resp.fire || bpu_s2_redirect || bpu_s3_redirect) && allowBpuIn 55409c6f1ddSLingrui98 555b37e4b45SLingrui98 val bpu_in_resp = io.fromBpu.resp.bits.selectedResp 556adc0b8dfSGuokai Chen val bpu_in_stage = io.fromBpu.resp.bits.selectedRespIdxForFtq 55709c6f1ddSLingrui98 val bpu_in_resp_ptr = Mux(bpu_in_stage === BP_S1, bpuPtr, bpu_in_resp.ftq_idx) 55809c6f1ddSLingrui98 val bpu_in_resp_idx = bpu_in_resp_ptr.value 55909c6f1ddSLingrui98 560378f00d9SJenius // read ports: prefetchReq ++ ifuReq1 + ifuReq2 + ifuReq3 + commitUpdate2 + commitUpdate 561378f00d9SJenius val ftq_pc_mem = Module(new FtqPcMemWrapper(1)) 5626bf9b30dSLingrui98 // resp from uBTB 563c5c5edaeSJenius ftq_pc_mem.io.wen := bpu_in_fire 564c5c5edaeSJenius ftq_pc_mem.io.waddr := bpu_in_resp_idx 565c5c5edaeSJenius ftq_pc_mem.io.wdata.fromBranchPrediction(bpu_in_resp) 56609c6f1ddSLingrui98 56709c6f1ddSLingrui98 // ifuRedirect + backendRedirect + commit 568bace178aSGao-Zeyu val ftq_redirect_sram = Module(new FtqNRSRAM(new Ftq_Redirect_SRAMEntry, 1+FtqRedirectAheadNum+1)) 56909c6f1ddSLingrui98 // these info is intended to enq at the last stage of bpu 570adc0b8dfSGuokai Chen ftq_redirect_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid(3) 57109c6f1ddSLingrui98 ftq_redirect_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value 572c2d1ec7dSLingrui98 ftq_redirect_sram.io.wdata := io.fromBpu.resp.bits.last_stage_spec_info 57349cbc998SLingrui98 println(f"ftq redirect SRAM: entry ${ftq_redirect_sram.io.wdata.getWidth} * ${FtqSize} * 3") 57449cbc998SLingrui98 println(f"ftq redirect SRAM: ahead fh ${ftq_redirect_sram.io.wdata.afhob.getWidth} * ${FtqSize} * 3") 57509c6f1ddSLingrui98 57609c6f1ddSLingrui98 val ftq_meta_1r_sram = Module(new FtqNRSRAM(new Ftq_1R_SRAMEntry, 1)) 57709c6f1ddSLingrui98 // these info is intended to enq at the last stage of bpu 578adc0b8dfSGuokai Chen ftq_meta_1r_sram.io.wen := io.fromBpu.resp.bits.lastStage.valid(3) 57909c6f1ddSLingrui98 ftq_meta_1r_sram.io.waddr := io.fromBpu.resp.bits.lastStage.ftq_idx.value 580c2d1ec7dSLingrui98 ftq_meta_1r_sram.io.wdata.meta := io.fromBpu.resp.bits.last_stage_meta 58109c6f1ddSLingrui98 // ifuRedirect + backendRedirect + commit 582bace178aSGao-Zeyu val ftb_entry_mem = Module(new SyncDataModuleTemplate(new FTBEntry, FtqSize, 1+FtqRedirectAheadNum+1, 1)) 583adc0b8dfSGuokai Chen ftb_entry_mem.io.wen(0) := io.fromBpu.resp.bits.lastStage.valid(3) 58409c6f1ddSLingrui98 ftb_entry_mem.io.waddr(0) := io.fromBpu.resp.bits.lastStage.ftq_idx.value 585c2d1ec7dSLingrui98 ftb_entry_mem.io.wdata(0) := io.fromBpu.resp.bits.last_stage_ftb_entry 58609c6f1ddSLingrui98 58709c6f1ddSLingrui98 58809c6f1ddSLingrui98 // multi-write 589b0ed7239SLingrui98 val update_target = Reg(Vec(FtqSize, UInt(VAddrBits.W))) // could be taken target or fallThrough //TODO: remove this 5906bf9b30dSLingrui98 val newest_entry_target = Reg(UInt(VAddrBits.W)) 5916bf9b30dSLingrui98 val newest_entry_ptr = Reg(new FtqPtr) 59209c6f1ddSLingrui98 val cfiIndex_vec = Reg(Vec(FtqSize, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)))) 59309c6f1ddSLingrui98 val mispredict_vec = Reg(Vec(FtqSize, Vec(PredictWidth, Bool()))) 59409c6f1ddSLingrui98 val pred_stage = Reg(Vec(FtqSize, UInt(2.W))) 595209a4cafSSteve Gou val pred_s1_cycle = if (!env.FPGAPlatform) Some(Reg(Vec(FtqSize, UInt(64.W)))) else None 59609c6f1ddSLingrui98 59709c6f1ddSLingrui98 val c_invalid :: c_valid :: c_commited :: Nil = Enum(3) 59809c6f1ddSLingrui98 val commitStateQueue = RegInit(VecInit(Seq.fill(FtqSize) { 59909c6f1ddSLingrui98 VecInit(Seq.fill(PredictWidth)(c_invalid)) 60009c6f1ddSLingrui98 })) 60109c6f1ddSLingrui98 60209c6f1ddSLingrui98 val f_to_send :: f_sent :: Nil = Enum(2) 60309c6f1ddSLingrui98 val entry_fetch_status = RegInit(VecInit(Seq.fill(FtqSize)(f_sent))) 60409c6f1ddSLingrui98 60509c6f1ddSLingrui98 val h_not_hit :: h_false_hit :: h_hit :: Nil = Enum(3) 60609c6f1ddSLingrui98 val entry_hit_status = RegInit(VecInit(Seq.fill(FtqSize)(h_not_hit))) 60709c6f1ddSLingrui98 608f63797a4SLingrui98 // modify registers one cycle later to cut critical path 609f63797a4SLingrui98 val last_cycle_bpu_in = RegNext(bpu_in_fire) 6106bf9b30dSLingrui98 val last_cycle_bpu_in_ptr = RegNext(bpu_in_resp_ptr) 6116bf9b30dSLingrui98 val last_cycle_bpu_in_idx = last_cycle_bpu_in_ptr.value 612adc0b8dfSGuokai Chen val last_cycle_bpu_target = RegNext(bpu_in_resp.getTarget(3)) 613adc0b8dfSGuokai Chen val last_cycle_cfiIndex = RegNext(bpu_in_resp.cfiIndex(3)) 614f63797a4SLingrui98 val last_cycle_bpu_in_stage = RegNext(bpu_in_stage) 615f56177cbSJenius 6167be982afSLingrui98 def extra_copyNum_for_commitStateQueue = 2 6177be982afSLingrui98 val copied_last_cycle_bpu_in = VecInit(Seq.fill(copyNum+extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_fire))) 6187be982afSLingrui98 val copied_last_cycle_bpu_in_ptr_for_ftq = VecInit(Seq.fill(extra_copyNum_for_commitStateQueue)(RegNext(bpu_in_resp_ptr))) 619f56177cbSJenius 620f63797a4SLingrui98 when (last_cycle_bpu_in) { 621f63797a4SLingrui98 entry_fetch_status(last_cycle_bpu_in_idx) := f_to_send 622f63797a4SLingrui98 cfiIndex_vec(last_cycle_bpu_in_idx) := last_cycle_cfiIndex 623f63797a4SLingrui98 pred_stage(last_cycle_bpu_in_idx) := last_cycle_bpu_in_stage 6246bf9b30dSLingrui98 625b0ed7239SLingrui98 update_target(last_cycle_bpu_in_idx) := last_cycle_bpu_target // TODO: remove this 6266bf9b30dSLingrui98 newest_entry_target := last_cycle_bpu_target 6276bf9b30dSLingrui98 newest_entry_ptr := last_cycle_bpu_in_ptr 62809c6f1ddSLingrui98 } 62909c6f1ddSLingrui98 6307be982afSLingrui98 // reduce fanout by delay write for a cycle 6317be982afSLingrui98 when (RegNext(last_cycle_bpu_in)) { 6327be982afSLingrui98 mispredict_vec(RegNext(last_cycle_bpu_in_idx)) := WireInit(VecInit(Seq.fill(PredictWidth)(false.B))) 6337be982afSLingrui98 } 6347be982afSLingrui98 635209a4cafSSteve Gou // record s1 pred cycles 636209a4cafSSteve Gou pred_s1_cycle.map(vec => { 637209a4cafSSteve Gou when (bpu_in_fire && (bpu_in_stage === BP_S1)) { 638209a4cafSSteve Gou vec(bpu_in_resp_ptr.value) := bpu_in_resp.full_pred(0).predCycle.getOrElse(0.U) 639209a4cafSSteve Gou } 640209a4cafSSteve Gou }) 641209a4cafSSteve Gou 6427be982afSLingrui98 // reduce fanout using copied last_cycle_bpu_in and copied last_cycle_bpu_in_ptr 6437be982afSLingrui98 val copied_last_cycle_bpu_in_for_ftq = copied_last_cycle_bpu_in.takeRight(extra_copyNum_for_commitStateQueue) 6447be982afSLingrui98 copied_last_cycle_bpu_in_for_ftq.zip(copied_last_cycle_bpu_in_ptr_for_ftq).zipWithIndex.map { 6457be982afSLingrui98 case ((in, ptr), i) => 6467be982afSLingrui98 when (in) { 6477be982afSLingrui98 val perSetEntries = FtqSize / extra_copyNum_for_commitStateQueue // 32 6487be982afSLingrui98 require(FtqSize % extra_copyNum_for_commitStateQueue == 0) 6497be982afSLingrui98 for (j <- 0 until perSetEntries) { 6509361b0c5SLingrui98 when (ptr.value === (i*perSetEntries+j).U) { 6517be982afSLingrui98 commitStateQueue(i*perSetEntries+j) := VecInit(Seq.fill(PredictWidth)(c_invalid)) 6527be982afSLingrui98 } 6537be982afSLingrui98 } 6547be982afSLingrui98 } 6559361b0c5SLingrui98 } 6567be982afSLingrui98 65709c6f1ddSLingrui98 bpuPtr := bpuPtr + enq_fire 658dc270d3bSJenius copied_bpu_ptr.map(_ := bpuPtr + enq_fire) 659c9bc5480SLingrui98 when (io.toIfu.req.fire && allowToIfu) { 660c5c5edaeSJenius ifuPtr_write := ifuPtrPlus1 6616bf9b30dSLingrui98 ifuPtrPlus1_write := ifuPtrPlus2 6626bf9b30dSLingrui98 ifuPtrPlus2_write := ifuPtrPlus2 + 1.U 663c9bc5480SLingrui98 } 66409c6f1ddSLingrui98 66509c6f1ddSLingrui98 // only use ftb result to assign hit status 666adc0b8dfSGuokai Chen when (bpu_s2_resp.valid(3)) { 667adc0b8dfSGuokai Chen entry_hit_status(bpu_s2_resp.ftq_idx.value) := Mux(bpu_s2_resp.full_pred(3).hit, h_hit, h_not_hit) 66809c6f1ddSLingrui98 } 66909c6f1ddSLingrui98 67009c6f1ddSLingrui98 6712f4a3aa4SLingrui98 io.toIfu.flushFromBpu.s2.valid := bpu_s2_redirect 67209c6f1ddSLingrui98 io.toIfu.flushFromBpu.s2.bits := bpu_s2_resp.ftq_idx 673adc0b8dfSGuokai Chen when (bpu_s2_redirect) { 67409c6f1ddSLingrui98 bpuPtr := bpu_s2_resp.ftq_idx + 1.U 675dc270d3bSJenius copied_bpu_ptr.map(_ := bpu_s2_resp.ftq_idx + 1.U) 67609c6f1ddSLingrui98 // only when ifuPtr runs ahead of bpu s2 resp should we recover it 67709c6f1ddSLingrui98 when (!isBefore(ifuPtr, bpu_s2_resp.ftq_idx)) { 678c5c5edaeSJenius ifuPtr_write := bpu_s2_resp.ftq_idx 679c5c5edaeSJenius ifuPtrPlus1_write := bpu_s2_resp.ftq_idx + 1.U 6806bf9b30dSLingrui98 ifuPtrPlus2_write := bpu_s2_resp.ftq_idx + 2.U 68109c6f1ddSLingrui98 } 68209c6f1ddSLingrui98 } 68309c6f1ddSLingrui98 684cb4f77ceSLingrui98 io.toIfu.flushFromBpu.s3.valid := bpu_s3_redirect 685cb4f77ceSLingrui98 io.toIfu.flushFromBpu.s3.bits := bpu_s3_resp.ftq_idx 686adc0b8dfSGuokai Chen when (bpu_s3_redirect) { 687cb4f77ceSLingrui98 bpuPtr := bpu_s3_resp.ftq_idx + 1.U 688dc270d3bSJenius copied_bpu_ptr.map(_ := bpu_s3_resp.ftq_idx + 1.U) 689cb4f77ceSLingrui98 // only when ifuPtr runs ahead of bpu s2 resp should we recover it 690cb4f77ceSLingrui98 when (!isBefore(ifuPtr, bpu_s3_resp.ftq_idx)) { 691c5c5edaeSJenius ifuPtr_write := bpu_s3_resp.ftq_idx 692c5c5edaeSJenius ifuPtrPlus1_write := bpu_s3_resp.ftq_idx + 1.U 6936bf9b30dSLingrui98 ifuPtrPlus2_write := bpu_s3_resp.ftq_idx + 2.U 694cb4f77ceSLingrui98 } 695cb4f77ceSLingrui98 } 696cb4f77ceSLingrui98 69709c6f1ddSLingrui98 XSError(isBefore(bpuPtr, ifuPtr) && !isFull(bpuPtr, ifuPtr), "\nifuPtr is before bpuPtr!\n") 6982448f137SGuokai Chen XSError(isBefore(ifuWbPtr, commPtr) && !isFull(ifuWbPtr, commPtr), "\ncommPtr is before ifuWbPtr!\n") 69909c6f1ddSLingrui98 700dc270d3bSJenius (0 until copyNum).map{i => 701dc270d3bSJenius XSError(copied_bpu_ptr(i) =/= bpuPtr, "\ncopiedBpuPtr is different from bpuPtr!\n") 702dc270d3bSJenius } 703dc270d3bSJenius 70409c6f1ddSLingrui98 // **************************************************************** 70509c6f1ddSLingrui98 // **************************** to ifu **************************** 70609c6f1ddSLingrui98 // **************************************************************** 707f22cf846SJenius // 0 for ifu, and 1-4 for ICache 708935edac4STang Haojin val bpu_in_bypass_buf = RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire) 709935edac4STang Haojin val copied_bpu_in_bypass_buf = VecInit(Seq.fill(copyNum)(RegEnable(ftq_pc_mem.io.wdata, bpu_in_fire))) 710f56177cbSJenius val bpu_in_bypass_buf_for_ifu = bpu_in_bypass_buf 71109c6f1ddSLingrui98 val bpu_in_bypass_ptr = RegNext(bpu_in_resp_ptr) 71209c6f1ddSLingrui98 val last_cycle_to_ifu_fire = RegNext(io.toIfu.req.fire) 71309c6f1ddSLingrui98 714f56177cbSJenius val copied_bpu_in_bypass_ptr = VecInit(Seq.fill(copyNum)(RegNext(bpu_in_resp_ptr))) 715f56177cbSJenius val copied_last_cycle_to_ifu_fire = VecInit(Seq.fill(copyNum)(RegNext(io.toIfu.req.fire))) 71688bc4f90SLingrui98 71709c6f1ddSLingrui98 // read pc and target 7186bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtr_w := ifuPtr_write 7196bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtrPlus1_w := ifuPtrPlus1_write 7206bf9b30dSLingrui98 ftq_pc_mem.io.ifuPtrPlus2_w := ifuPtrPlus2_write 7216bf9b30dSLingrui98 ftq_pc_mem.io.commPtr_w := commPtr_write 7226bf9b30dSLingrui98 ftq_pc_mem.io.commPtrPlus1_w := commPtrPlus1_write 723c5c5edaeSJenius 72409c6f1ddSLingrui98 7255ff19bd8SLingrui98 io.toIfu.req.bits.ftqIdx := ifuPtr 726f63797a4SLingrui98 727f56177cbSJenius val toICachePcBundle = Wire(Vec(copyNum,new Ftq_RF_Components)) 728dc270d3bSJenius val toICacheEntryToSend = Wire(Vec(copyNum,Bool())) 729b37e4b45SLingrui98 val toIfuPcBundle = Wire(new Ftq_RF_Components) 730f63797a4SLingrui98 val entry_is_to_send = WireInit(entry_fetch_status(ifuPtr.value) === f_to_send) 731f63797a4SLingrui98 val entry_ftq_offset = WireInit(cfiIndex_vec(ifuPtr.value)) 7326bf9b30dSLingrui98 val entry_next_addr = Wire(UInt(VAddrBits.W)) 733b004fa13SJenius 734f56177cbSJenius val pc_mem_ifu_ptr_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtr_rdata))) 735f56177cbSJenius val pc_mem_ifu_plus1_rdata = VecInit(Seq.fill(copyNum)(RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata))) 736b0ed7239SLingrui98 val diff_entry_next_addr = WireInit(update_target(ifuPtr.value)) //TODO: remove this 737f63797a4SLingrui98 738dc270d3bSJenius val copied_ifu_plus1_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)))) 739dc270d3bSJenius val copied_ifu_ptr_to_send = VecInit(Seq.fill(copyNum)(RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr))) 740dc270d3bSJenius 741f56177cbSJenius for(i <- 0 until copyNum){ 742f56177cbSJenius when(copied_last_cycle_bpu_in(i) && copied_bpu_in_bypass_ptr(i) === copied_ifu_ptr(i)){ 743f56177cbSJenius toICachePcBundle(i) := copied_bpu_in_bypass_buf(i) 744dc270d3bSJenius toICacheEntryToSend(i) := true.B 745f56177cbSJenius }.elsewhen(copied_last_cycle_to_ifu_fire(i)){ 746f56177cbSJenius toICachePcBundle(i) := pc_mem_ifu_plus1_rdata(i) 747dc270d3bSJenius toICacheEntryToSend(i) := copied_ifu_plus1_to_send(i) 748f56177cbSJenius }.otherwise{ 749f56177cbSJenius toICachePcBundle(i) := pc_mem_ifu_ptr_rdata(i) 750dc270d3bSJenius toICacheEntryToSend(i) := copied_ifu_ptr_to_send(i) 751f56177cbSJenius } 752f56177cbSJenius } 753f56177cbSJenius 754873dc383SLingrui98 // TODO: reconsider target address bypass logic 75509c6f1ddSLingrui98 when (last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) { 75688bc4f90SLingrui98 toIfuPcBundle := bpu_in_bypass_buf_for_ifu 757f678dd91SSteve Gou entry_is_to_send := true.B 7586bf9b30dSLingrui98 entry_next_addr := last_cycle_bpu_target 759f63797a4SLingrui98 entry_ftq_offset := last_cycle_cfiIndex 760b0ed7239SLingrui98 diff_entry_next_addr := last_cycle_bpu_target // TODO: remove this 76109c6f1ddSLingrui98 }.elsewhen (last_cycle_to_ifu_fire) { 762c5c5edaeSJenius toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata) 763c5c5edaeSJenius entry_is_to_send := RegNext(entry_fetch_status(ifuPtrPlus1.value) === f_to_send) || 764c5c5edaeSJenius RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1)) // reduce potential bubbles 765ed434d67SLingrui98 entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1), 76688bc4f90SLingrui98 bpu_in_bypass_buf_for_ifu.startAddr, 767fef810c0SLingrui98 Mux(ifuPtr === newest_entry_ptr, 7686bf9b30dSLingrui98 newest_entry_target, 769f83ef67eSLingrui98 RegNext(ftq_pc_mem.io.ifuPtrPlus2_rdata.startAddr))) // ifuPtr+2 770c5c5edaeSJenius }.otherwise { 771c5c5edaeSJenius toIfuPcBundle := RegNext(ftq_pc_mem.io.ifuPtr_rdata) 77228f2cf58SLingrui98 entry_is_to_send := RegNext(entry_fetch_status(ifuPtr.value) === f_to_send) || 77328f2cf58SLingrui98 RegNext(last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr) // reduce potential bubbles 7746bf9b30dSLingrui98 entry_next_addr := Mux(last_cycle_bpu_in && bpu_in_bypass_ptr === (ifuPtrPlus1), 77588bc4f90SLingrui98 bpu_in_bypass_buf_for_ifu.startAddr, 776fef810c0SLingrui98 Mux(ifuPtr === newest_entry_ptr, 7776bf9b30dSLingrui98 newest_entry_target, 778f83ef67eSLingrui98 RegNext(ftq_pc_mem.io.ifuPtrPlus1_rdata.startAddr))) // ifuPtr+1 77909c6f1ddSLingrui98 } 78009c6f1ddSLingrui98 781f678dd91SSteve Gou io.toIfu.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr 782f63797a4SLingrui98 io.toIfu.req.bits.nextStartAddr := entry_next_addr 783f63797a4SLingrui98 io.toIfu.req.bits.ftqOffset := entry_ftq_offset 784b37e4b45SLingrui98 io.toIfu.req.bits.fromFtqPcBundle(toIfuPcBundle) 785c5c5edaeSJenius 786c5c5edaeSJenius io.toICache.req.valid := entry_is_to_send && ifuPtr =/= bpuPtr 787dc270d3bSJenius io.toICache.req.bits.readValid.zipWithIndex.map{case(copy, i) => copy := toICacheEntryToSend(i) && copied_ifu_ptr(i) =/= copied_bpu_ptr(i)} 788b004fa13SJenius io.toICache.req.bits.pcMemRead.zipWithIndex.map{case(copy,i) => copy.fromFtqPcBundle(toICachePcBundle(i))} 789b004fa13SJenius // io.toICache.req.bits.bypassSelect := last_cycle_bpu_in && bpu_in_bypass_ptr === ifuPtr 790b004fa13SJenius // io.toICache.req.bits.bpuBypassWrite.zipWithIndex.map{case(bypassWrtie, i) => 791b004fa13SJenius // bypassWrtie.startAddr := bpu_in_bypass_buf.tail(i).startAddr 792b004fa13SJenius // bypassWrtie.nextlineStart := bpu_in_bypass_buf.tail(i).nextLineAddr 793b004fa13SJenius // } 794f22cf846SJenius 795b0ed7239SLingrui98 // TODO: remove this 796b0ed7239SLingrui98 XSError(io.toIfu.req.valid && diff_entry_next_addr =/= entry_next_addr, 7975a674179SLingrui98 p"\nifu_req_target wrong! ifuPtr: ${ifuPtr}, entry_next_addr: ${Hexadecimal(entry_next_addr)} diff_entry_next_addr: ${Hexadecimal(diff_entry_next_addr)}\n") 798b0ed7239SLingrui98 79909c6f1ddSLingrui98 // when fall through is smaller in value than start address, there must be a false hit 800b37e4b45SLingrui98 when (toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit) { 80109c6f1ddSLingrui98 when (io.toIfu.req.fire && 802cb4f77ceSLingrui98 !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && 803cb4f77ceSLingrui98 !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr) 80409c6f1ddSLingrui98 ) { 80509c6f1ddSLingrui98 entry_hit_status(ifuPtr.value) := h_false_hit 806352db50aSLingrui98 // XSError(true.B, "FTB false hit by fallThroughError, startAddr: %x, fallTHru: %x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr) 80709c6f1ddSLingrui98 } 808b37e4b45SLingrui98 XSDebug(true.B, "fallThruError! start:%x, fallThru:%x\n", io.toIfu.req.bits.startAddr, io.toIfu.req.bits.nextStartAddr) 80909c6f1ddSLingrui98 } 81009c6f1ddSLingrui98 811a60a2901SLingrui98 XSPerfAccumulate(f"fall_through_error_to_ifu", toIfuPcBundle.fallThruError && entry_hit_status(ifuPtr.value) === h_hit && 812a60a2901SLingrui98 io.toIfu.req.fire && !(bpu_s2_redirect && bpu_s2_resp.ftq_idx === ifuPtr) && !(bpu_s3_redirect && bpu_s3_resp.ftq_idx === ifuPtr)) 813a60a2901SLingrui98 81409c6f1ddSLingrui98 val ifu_req_should_be_flushed = 815cb4f77ceSLingrui98 io.toIfu.flushFromBpu.shouldFlushByStage2(io.toIfu.req.bits.ftqIdx) || 816cb4f77ceSLingrui98 io.toIfu.flushFromBpu.shouldFlushByStage3(io.toIfu.req.bits.ftqIdx) 81709c6f1ddSLingrui98 81809c6f1ddSLingrui98 when (io.toIfu.req.fire && !ifu_req_should_be_flushed) { 81909c6f1ddSLingrui98 entry_fetch_status(ifuPtr.value) := f_sent 82009c6f1ddSLingrui98 } 82109c6f1ddSLingrui98 82209c6f1ddSLingrui98 // ********************************************************************* 82309c6f1ddSLingrui98 // **************************** wb from ifu **************************** 82409c6f1ddSLingrui98 // ********************************************************************* 82509c6f1ddSLingrui98 val pdWb = io.fromIfu.pdWb 82609c6f1ddSLingrui98 val pds = pdWb.bits.pd 82709c6f1ddSLingrui98 val ifu_wb_valid = pdWb.valid 82809c6f1ddSLingrui98 val ifu_wb_idx = pdWb.bits.ftqIdx.value 82909c6f1ddSLingrui98 // read ports: commit update 83009c6f1ddSLingrui98 val ftq_pd_mem = Module(new SyncDataModuleTemplate(new Ftq_pd_Entry, FtqSize, 1, 1)) 83109c6f1ddSLingrui98 ftq_pd_mem.io.wen(0) := ifu_wb_valid 83209c6f1ddSLingrui98 ftq_pd_mem.io.waddr(0) := pdWb.bits.ftqIdx.value 83309c6f1ddSLingrui98 ftq_pd_mem.io.wdata(0).fromPdWb(pdWb.bits) 83409c6f1ddSLingrui98 83509c6f1ddSLingrui98 val hit_pd_valid = entry_hit_status(ifu_wb_idx) === h_hit && ifu_wb_valid 83609c6f1ddSLingrui98 val hit_pd_mispred = hit_pd_valid && pdWb.bits.misOffset.valid 83709c6f1ddSLingrui98 val hit_pd_mispred_reg = RegNext(hit_pd_mispred, init=false.B) 838005e809bSJiuyang Liu val pd_reg = RegEnable(pds, pdWb.valid) 839005e809bSJiuyang Liu val start_pc_reg = RegEnable(pdWb.bits.pc(0), pdWb.valid) 840005e809bSJiuyang Liu val wb_idx_reg = RegEnable(ifu_wb_idx, pdWb.valid) 84109c6f1ddSLingrui98 84209c6f1ddSLingrui98 when (ifu_wb_valid) { 84309c6f1ddSLingrui98 val comm_stq_wen = VecInit(pds.map(_.valid).zip(pdWb.bits.instrRange).map{ 84409c6f1ddSLingrui98 case (v, inRange) => v && inRange 84509c6f1ddSLingrui98 }) 84609c6f1ddSLingrui98 (commitStateQueue(ifu_wb_idx) zip comm_stq_wen).map{ 84709c6f1ddSLingrui98 case (qe, v) => when (v) { qe := c_valid } 84809c6f1ddSLingrui98 } 84909c6f1ddSLingrui98 } 85009c6f1ddSLingrui98 851c5c5edaeSJenius when (ifu_wb_valid) { 852c5c5edaeSJenius ifuWbPtr_write := ifuWbPtr + 1.U 853c5c5edaeSJenius } 85409c6f1ddSLingrui98 855f21bbcb2SGuokai Chen XSError(ifu_wb_valid && isAfter(pdWb.bits.ftqIdx, ifuPtr), "IFU returned a predecode before its req, check IFU") 856f21bbcb2SGuokai Chen 85709c6f1ddSLingrui98 ftb_entry_mem.io.raddr.head := ifu_wb_idx 85809c6f1ddSLingrui98 val has_false_hit = WireInit(false.B) 85909c6f1ddSLingrui98 when (RegNext(hit_pd_valid)) { 86009c6f1ddSLingrui98 // check for false hit 86109c6f1ddSLingrui98 val pred_ftb_entry = ftb_entry_mem.io.rdata.head 862eeb5ff92SLingrui98 val brSlots = pred_ftb_entry.brSlots 863eeb5ff92SLingrui98 val tailSlot = pred_ftb_entry.tailSlot 86409c6f1ddSLingrui98 // we check cfis that bpu predicted 86509c6f1ddSLingrui98 866eeb5ff92SLingrui98 // bpu predicted branches but denied by predecode 867eeb5ff92SLingrui98 val br_false_hit = 868eeb5ff92SLingrui98 brSlots.map{ 869eeb5ff92SLingrui98 s => s.valid && !(pd_reg(s.offset).valid && pd_reg(s.offset).isBr) 870eeb5ff92SLingrui98 }.reduce(_||_) || 871b37e4b45SLingrui98 (tailSlot.valid && pred_ftb_entry.tailSlot.sharing && 872eeb5ff92SLingrui98 !(pd_reg(tailSlot.offset).valid && pd_reg(tailSlot.offset).isBr)) 873eeb5ff92SLingrui98 874eeb5ff92SLingrui98 val jmpOffset = tailSlot.offset 87509c6f1ddSLingrui98 val jmp_pd = pd_reg(jmpOffset) 87609c6f1ddSLingrui98 val jal_false_hit = pred_ftb_entry.jmpValid && 87709c6f1ddSLingrui98 ((pred_ftb_entry.isJal && !(jmp_pd.valid && jmp_pd.isJal)) || 87809c6f1ddSLingrui98 (pred_ftb_entry.isJalr && !(jmp_pd.valid && jmp_pd.isJalr)) || 87909c6f1ddSLingrui98 (pred_ftb_entry.isCall && !(jmp_pd.valid && jmp_pd.isCall)) || 88009c6f1ddSLingrui98 (pred_ftb_entry.isRet && !(jmp_pd.valid && jmp_pd.isRet)) 88109c6f1ddSLingrui98 ) 88209c6f1ddSLingrui98 88309c6f1ddSLingrui98 has_false_hit := br_false_hit || jal_false_hit || hit_pd_mispred_reg 88465fddcf0Szoujr XSDebug(has_false_hit, "FTB false hit by br or jal or hit_pd, startAddr: %x\n", pdWb.bits.pc(0)) 88565fddcf0Szoujr 886352db50aSLingrui98 // assert(!has_false_hit) 88709c6f1ddSLingrui98 } 88809c6f1ddSLingrui98 88909c6f1ddSLingrui98 when (has_false_hit) { 89009c6f1ddSLingrui98 entry_hit_status(wb_idx_reg) := h_false_hit 89109c6f1ddSLingrui98 } 89209c6f1ddSLingrui98 89309c6f1ddSLingrui98 // ******************************************************************************* 89409c6f1ddSLingrui98 // **************************** redirect from backend **************************** 89509c6f1ddSLingrui98 // ******************************************************************************* 89609c6f1ddSLingrui98 89709c6f1ddSLingrui98 // redirect read cfiInfo, couples to redirectGen s2 898bace178aSGao-Zeyu val redirectReadStart = 1 // 0 for ifuRedirect 899bace178aSGao-Zeyu val ftq_redirect_rdata = Wire(Vec(FtqRedirectAheadNum, new Ftq_Redirect_SRAMEntry)) 900bace178aSGao-Zeyu val ftb_redirect_rdata = Wire(Vec(FtqRedirectAheadNum, new FTBEntry)) 901bace178aSGao-Zeyu for (i <- redirectReadStart until FtqRedirectAheadNum) { 902bace178aSGao-Zeyu ftq_redirect_sram.io.ren(i + redirectReadStart) := ftqIdxAhead(i).valid 903bace178aSGao-Zeyu ftq_redirect_sram.io.raddr(i + redirectReadStart) := ftqIdxAhead(i).bits.value 904bace178aSGao-Zeyu ftb_entry_mem.io.raddr(i + redirectReadStart) := ftqIdxAhead(i).bits.value 9059342624fSGao-Zeyu } 906bace178aSGao-Zeyu ftq_redirect_sram.io.ren(redirectReadStart) := Mux(aheadValid, ftqIdxAhead(0).valid, backendRedirect.valid) 907bace178aSGao-Zeyu ftq_redirect_sram.io.raddr(redirectReadStart) := Mux(aheadValid, ftqIdxAhead(0).bits.value, backendRedirect.bits.ftqIdx.value) 908bace178aSGao-Zeyu ftb_entry_mem.io.raddr(redirectReadStart) := Mux(aheadValid, ftqIdxAhead(0).bits.value, backendRedirect.bits.ftqIdx.value) 909bace178aSGao-Zeyu 910bace178aSGao-Zeyu for (i <- 0 until FtqRedirectAheadNum) { 911bace178aSGao-Zeyu ftq_redirect_rdata(i) := ftq_redirect_sram.io.rdata(i + redirectReadStart) 912bace178aSGao-Zeyu ftb_redirect_rdata(i) := ftb_entry_mem.io.rdata(i + redirectReadStart) 913bace178aSGao-Zeyu } 914bace178aSGao-Zeyu val stage3CfiInfo = Mux(realAhdValid, Mux1H(ftqIdxSelOH, ftq_redirect_rdata), ftq_redirect_sram.io.rdata(redirectReadStart)) 91509c6f1ddSLingrui98 val backendRedirectCfi = fromBackendRedirect.bits.cfiUpdate 91609c6f1ddSLingrui98 backendRedirectCfi.fromFtqRedirectSram(stage3CfiInfo) 91709c6f1ddSLingrui98 918d2b20d1aSTang Haojin 919bace178aSGao-Zeyu val r_ftb_entry = Mux(realAhdValid, Mux1H(ftqIdxSelOH, ftb_redirect_rdata), ftb_entry_mem.io.rdata(redirectReadStart)) 92009c6f1ddSLingrui98 val r_ftqOffset = fromBackendRedirect.bits.ftqOffset 92109c6f1ddSLingrui98 922d2b20d1aSTang Haojin backendRedirectCfi.br_hit := r_ftb_entry.brIsSaved(r_ftqOffset) 923d2b20d1aSTang Haojin backendRedirectCfi.jr_hit := r_ftb_entry.isJalr && r_ftb_entry.tailSlot.offset === r_ftqOffset 9243711cf36S小造xu_zh // FIXME: not portable 925abdc3a32Sxu_zh val sc_disagree = stage3CfiInfo.sc_disagree.getOrElse(VecInit(Seq.fill(numBr)(false.B))) 926d2b20d1aSTang Haojin backendRedirectCfi.sc_hit := backendRedirectCfi.br_hit && Mux(r_ftb_entry.brSlots(0).offset === r_ftqOffset, 927abdc3a32Sxu_zh sc_disagree(0), sc_disagree(1)) 928d2b20d1aSTang Haojin 92909c6f1ddSLingrui98 when (entry_hit_status(fromBackendRedirect.bits.ftqIdx.value) === h_hit) { 93009c6f1ddSLingrui98 backendRedirectCfi.shift := PopCount(r_ftb_entry.getBrMaskByOffset(r_ftqOffset)) +& 93109c6f1ddSLingrui98 (backendRedirectCfi.pd.isBr && !r_ftb_entry.brIsSaved(r_ftqOffset) && 932eeb5ff92SLingrui98 !r_ftb_entry.newBrCanNotInsert(r_ftqOffset)) 93309c6f1ddSLingrui98 93409c6f1ddSLingrui98 backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr && (r_ftb_entry.brIsSaved(r_ftqOffset) || 935eeb5ff92SLingrui98 !r_ftb_entry.newBrCanNotInsert(r_ftqOffset)) 93609c6f1ddSLingrui98 }.otherwise { 93709c6f1ddSLingrui98 backendRedirectCfi.shift := (backendRedirectCfi.pd.isBr && backendRedirectCfi.taken).asUInt 93809c6f1ddSLingrui98 backendRedirectCfi.addIntoHist := backendRedirectCfi.pd.isBr.asUInt 93909c6f1ddSLingrui98 } 94009c6f1ddSLingrui98 94109c6f1ddSLingrui98 94209c6f1ddSLingrui98 // *************************************************************************** 94309c6f1ddSLingrui98 // **************************** redirect from ifu **************************** 94409c6f1ddSLingrui98 // *************************************************************************** 945d2b20d1aSTang Haojin val fromIfuRedirect = WireInit(0.U.asTypeOf(Valid(new BranchPredictionRedirect))) 94609c6f1ddSLingrui98 fromIfuRedirect.valid := pdWb.valid && pdWb.bits.misOffset.valid && !backendFlush 94709c6f1ddSLingrui98 fromIfuRedirect.bits.ftqIdx := pdWb.bits.ftqIdx 94809c6f1ddSLingrui98 fromIfuRedirect.bits.ftqOffset := pdWb.bits.misOffset.bits 94909c6f1ddSLingrui98 fromIfuRedirect.bits.level := RedirectLevel.flushAfter 950d2b20d1aSTang Haojin fromIfuRedirect.bits.BTBMissBubble := true.B 951d2b20d1aSTang Haojin fromIfuRedirect.bits.debugIsMemVio := false.B 952d2b20d1aSTang Haojin fromIfuRedirect.bits.debugIsCtrl := false.B 95309c6f1ddSLingrui98 95409c6f1ddSLingrui98 val ifuRedirectCfiUpdate = fromIfuRedirect.bits.cfiUpdate 95509c6f1ddSLingrui98 ifuRedirectCfiUpdate.pc := pdWb.bits.pc(pdWb.bits.misOffset.bits) 95609c6f1ddSLingrui98 ifuRedirectCfiUpdate.pd := pdWb.bits.pd(pdWb.bits.misOffset.bits) 95709c6f1ddSLingrui98 ifuRedirectCfiUpdate.predTaken := cfiIndex_vec(pdWb.bits.ftqIdx.value).valid 95809c6f1ddSLingrui98 ifuRedirectCfiUpdate.target := pdWb.bits.target 95909c6f1ddSLingrui98 ifuRedirectCfiUpdate.taken := pdWb.bits.cfiOffset.valid 96009c6f1ddSLingrui98 ifuRedirectCfiUpdate.isMisPred := pdWb.bits.misOffset.valid 96109c6f1ddSLingrui98 962d2b20d1aSTang Haojin val ifuRedirectReg = RegNext(fromIfuRedirect, init=0.U.asTypeOf(Valid(new BranchPredictionRedirect))) 96309c6f1ddSLingrui98 val ifuRedirectToBpu = WireInit(ifuRedirectReg) 96409c6f1ddSLingrui98 ifuFlush := fromIfuRedirect.valid || ifuRedirectToBpu.valid 96509c6f1ddSLingrui98 96609c6f1ddSLingrui98 ftq_redirect_sram.io.ren.head := fromIfuRedirect.valid 96709c6f1ddSLingrui98 ftq_redirect_sram.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value 96809c6f1ddSLingrui98 96909c6f1ddSLingrui98 ftb_entry_mem.io.raddr.head := fromIfuRedirect.bits.ftqIdx.value 97009c6f1ddSLingrui98 97109c6f1ddSLingrui98 val toBpuCfi = ifuRedirectToBpu.bits.cfiUpdate 97209c6f1ddSLingrui98 toBpuCfi.fromFtqRedirectSram(ftq_redirect_sram.io.rdata.head) 973f1267a13SEaston Man when (ifuRedirectReg.bits.cfiUpdate.pd.isRet && ifuRedirectReg.bits.cfiUpdate.pd.valid) { 974c89b4642SGuokai Chen toBpuCfi.target := toBpuCfi.topAddr 97509c6f1ddSLingrui98 } 97609c6f1ddSLingrui98 977d2b20d1aSTang Haojin when (ifuRedirectReg.valid) { 978d2b20d1aSTang Haojin ifuRedirected(ifuRedirectReg.bits.ftqIdx.value) := true.B 979d2b20d1aSTang Haojin } .elsewhen(RegNext(pdWb.valid)) { 980d2b20d1aSTang Haojin // if pdWb and no redirect, set to false 981d2b20d1aSTang Haojin ifuRedirected(last_cycle_bpu_in_ptr.value) := false.B 982d2b20d1aSTang Haojin } 983d2b20d1aSTang Haojin 9846022c595SsinceforYy // ********************************************************************** 9856022c595SsinceforYy // ***************************** to backend ***************************** 9866022c595SsinceforYy // ********************************************************************** 9876022c595SsinceforYy // to backend pc mem / target 9886022c595SsinceforYy io.toBackend.pc_mem_wen := RegNext(last_cycle_bpu_in) 9896022c595SsinceforYy io.toBackend.pc_mem_waddr := RegEnable(last_cycle_bpu_in_idx, last_cycle_bpu_in) 9906022c595SsinceforYy io.toBackend.pc_mem_wdata := RegEnable(bpu_in_bypass_buf_for_ifu, last_cycle_bpu_in) 9916022c595SsinceforYy 9926022c595SsinceforYy // num cycle is fixed 9936022c595SsinceforYy val newest_entry_en: Bool = RegNext(last_cycle_bpu_in || backendRedirect.valid || ifuRedirectToBpu.valid) 9946022c595SsinceforYy io.toBackend.newest_entry_en := RegNext(newest_entry_en) 9956022c595SsinceforYy io.toBackend.newest_entry_ptr := RegEnable(newest_entry_ptr, newest_entry_en) 9966022c595SsinceforYy io.toBackend.newest_entry_target := RegEnable(newest_entry_target, newest_entry_en) 9976022c595SsinceforYy 99809c6f1ddSLingrui98 // ********************************************************************* 99909c6f1ddSLingrui98 // **************************** wb from exu **************************** 100009c6f1ddSLingrui98 // ********************************************************************* 100109c6f1ddSLingrui98 1002d2b20d1aSTang Haojin backendRedirect.valid := io.fromBackend.redirect.valid 1003d2b20d1aSTang Haojin backendRedirect.bits.connectRedirect(io.fromBackend.redirect.bits) 1004d2b20d1aSTang Haojin backendRedirect.bits.BTBMissBubble := false.B 1005d2b20d1aSTang Haojin 10062e1be6e1SSteve Gou 100709c6f1ddSLingrui98 def extractRedirectInfo(wb: Valid[Redirect]) = { 10086bf9b30dSLingrui98 val ftqPtr = wb.bits.ftqIdx 100909c6f1ddSLingrui98 val ftqOffset = wb.bits.ftqOffset 101009c6f1ddSLingrui98 val taken = wb.bits.cfiUpdate.taken 101109c6f1ddSLingrui98 val mispred = wb.bits.cfiUpdate.isMisPred 10126bf9b30dSLingrui98 (wb.valid, ftqPtr, ftqOffset, taken, mispred) 101309c6f1ddSLingrui98 } 101409c6f1ddSLingrui98 101509c6f1ddSLingrui98 // fix mispredict entry 101609c6f1ddSLingrui98 val lastIsMispredict = RegNext( 1017df5b4b8eSYinan Xu backendRedirect.valid && backendRedirect.bits.level === RedirectLevel.flushAfter, init = false.B 101809c6f1ddSLingrui98 ) 101909c6f1ddSLingrui98 102009c6f1ddSLingrui98 def updateCfiInfo(redirect: Valid[Redirect], isBackend: Boolean = true) = { 10216bf9b30dSLingrui98 val (r_valid, r_ptr, r_offset, r_taken, r_mispred) = extractRedirectInfo(redirect) 10226bf9b30dSLingrui98 val r_idx = r_ptr.value 102309c6f1ddSLingrui98 val cfiIndex_bits_wen = r_valid && r_taken && r_offset < cfiIndex_vec(r_idx).bits 102409c6f1ddSLingrui98 val cfiIndex_valid_wen = r_valid && r_offset === cfiIndex_vec(r_idx).bits 102509c6f1ddSLingrui98 when (cfiIndex_bits_wen || cfiIndex_valid_wen) { 102609c6f1ddSLingrui98 cfiIndex_vec(r_idx).valid := cfiIndex_bits_wen || cfiIndex_valid_wen && r_taken 10273f88c020SGuokai Chen } .elsewhen (r_valid && !r_taken && r_offset =/= cfiIndex_vec(r_idx).bits) { 10283f88c020SGuokai Chen cfiIndex_vec(r_idx).valid :=false.B 102909c6f1ddSLingrui98 } 103009c6f1ddSLingrui98 when (cfiIndex_bits_wen) { 103109c6f1ddSLingrui98 cfiIndex_vec(r_idx).bits := r_offset 103209c6f1ddSLingrui98 } 10336bf9b30dSLingrui98 newest_entry_target := redirect.bits.cfiUpdate.target 1034873dc383SLingrui98 newest_entry_ptr := r_ptr 1035b0ed7239SLingrui98 update_target(r_idx) := redirect.bits.cfiUpdate.target // TODO: remove this 103609c6f1ddSLingrui98 if (isBackend) { 103709c6f1ddSLingrui98 mispredict_vec(r_idx)(r_offset) := r_mispred 103809c6f1ddSLingrui98 } 103909c6f1ddSLingrui98 } 104009c6f1ddSLingrui98 1041bace178aSGao-Zeyu when(fromBackendRedirect.valid) { 1042bace178aSGao-Zeyu updateCfiInfo(fromBackendRedirect) 104309c6f1ddSLingrui98 }.elsewhen (ifuRedirectToBpu.valid) { 104409c6f1ddSLingrui98 updateCfiInfo(ifuRedirectToBpu, isBackend=false) 104509c6f1ddSLingrui98 } 104609c6f1ddSLingrui98 1047bace178aSGao-Zeyu when (fromBackendRedirect.valid) { 1048bace178aSGao-Zeyu when (fromBackendRedirect.bits.ControlRedirectBubble) { 1049d2b20d1aSTang Haojin when (fromBackendRedirect.bits.ControlBTBMissBubble) { 1050d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1051d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1052d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.TAGEMissBubble) { 1053d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.TAGEMissBubble.id) := true.B 1054d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.TAGEMissBubble.id) := true.B 1055d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.SCMissBubble) { 1056d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.SCMissBubble.id) := true.B 1057d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.SCMissBubble.id) := true.B 1058d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.ITTAGEMissBubble) { 1059d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B 1060d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.ITTAGEMissBubble.id) := true.B 1061d2b20d1aSTang Haojin } .elsewhen (fromBackendRedirect.bits.RASMissBubble) { 1062d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.RASMissBubble.id) := true.B 1063d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.RASMissBubble.id) := true.B 1064d2b20d1aSTang Haojin } 1065d2b20d1aSTang Haojin 1066d2b20d1aSTang Haojin 10679342624fSGao-Zeyu } .elsewhen (backendRedirect.bits.MemVioRedirectBubble) { 1068d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B 1069d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.MemVioRedirectBubble.id) := true.B 1070d2b20d1aSTang Haojin } .otherwise { 1071d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B 1072d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.OtherRedirectBubble.id) := true.B 1073d2b20d1aSTang Haojin } 1074d2b20d1aSTang Haojin } .elsewhen (ifuRedirectReg.valid) { 1075d2b20d1aSTang Haojin topdown_stage.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1076d2b20d1aSTang Haojin io.toIfu.req.bits.topdown_info.reasons(TopDownCounters.BTBMissBubble.id) := true.B 1077d2b20d1aSTang Haojin } 1078d2b20d1aSTang Haojin 1079d2b20d1aSTang Haojin io.ControlBTBMissBubble := fromBackendRedirect.bits.ControlBTBMissBubble 1080d2b20d1aSTang Haojin io.TAGEMissBubble := fromBackendRedirect.bits.TAGEMissBubble 1081d2b20d1aSTang Haojin io.SCMissBubble := fromBackendRedirect.bits.SCMissBubble 1082d2b20d1aSTang Haojin io.ITTAGEMissBubble := fromBackendRedirect.bits.ITTAGEMissBubble 1083d2b20d1aSTang Haojin io.RASMissBubble := fromBackendRedirect.bits.RASMissBubble 1084d2b20d1aSTang Haojin 108509c6f1ddSLingrui98 // *********************************************************************************** 108609c6f1ddSLingrui98 // **************************** flush ptr and state queue **************************** 108709c6f1ddSLingrui98 // *********************************************************************************** 108809c6f1ddSLingrui98 1089df5b4b8eSYinan Xu val redirectVec = VecInit(backendRedirect, fromIfuRedirect) 109009c6f1ddSLingrui98 109109c6f1ddSLingrui98 // when redirect, we should reset ptrs and status queues 109209c6f1ddSLingrui98 when(redirectVec.map(r => r.valid).reduce(_||_)){ 10932f4a3aa4SLingrui98 val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits))) 109409c6f1ddSLingrui98 val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_) 10952f4a3aa4SLingrui98 val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level)) 109609c6f1ddSLingrui98 val next = idx + 1.U 109709c6f1ddSLingrui98 bpuPtr := next 1098dc270d3bSJenius copied_bpu_ptr.map(_ := next) 1099c5c5edaeSJenius ifuPtr_write := next 1100c5c5edaeSJenius ifuWbPtr_write := next 1101c5c5edaeSJenius ifuPtrPlus1_write := idx + 2.U 11026bf9b30dSLingrui98 ifuPtrPlus2_write := idx + 3.U 11033f88c020SGuokai Chen 11043f88c020SGuokai Chen } 11053f88c020SGuokai Chen when(RegNext(redirectVec.map(r => r.valid).reduce(_||_))){ 11063f88c020SGuokai Chen val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits))) 11073f88c020SGuokai Chen val notIfu = redirectVec.dropRight(1).map(r => r.valid).reduce(_||_) 11083f88c020SGuokai Chen val (idx, offset, flushItSelf) = (r.ftqIdx, r.ftqOffset, RedirectLevel.flushItself(r.level)) 11093f88c020SGuokai Chen when (RegNext(notIfu)) { 11103f88c020SGuokai Chen commitStateQueue(RegNext(idx.value)).zipWithIndex.foreach({ case (s, i) => 11113f88c020SGuokai Chen when(i.U > RegNext(offset) || i.U === RegNext(offset) && RegNext(flushItSelf)){ 111209c6f1ddSLingrui98 s := c_invalid 111309c6f1ddSLingrui98 } 111409c6f1ddSLingrui98 }) 111509c6f1ddSLingrui98 } 111609c6f1ddSLingrui98 } 111709c6f1ddSLingrui98 11183f88c020SGuokai Chen 111909c6f1ddSLingrui98 // only the valid bit is actually needed 1120df5b4b8eSYinan Xu io.toIfu.redirect.bits := backendRedirect.bits 112109c6f1ddSLingrui98 io.toIfu.redirect.valid := stage2Flush 1122d2b20d1aSTang Haojin io.toIfu.topdown_redirect := fromBackendRedirect 112309c6f1ddSLingrui98 112409c6f1ddSLingrui98 // commit 11259aca92b9SYinan Xu for (c <- io.fromBackend.rob_commits) { 112609c6f1ddSLingrui98 when(c.valid) { 112709c6f1ddSLingrui98 commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset) := c_commited 112888825c5cSYinan Xu // TODO: remove this 112988825c5cSYinan Xu // For instruction fusions, we also update the next instruction 1130c3abb8b6SYinan Xu when (c.bits.commitType === 4.U) { 113188825c5cSYinan Xu commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 1.U) := c_commited 1132c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 5.U) { 113388825c5cSYinan Xu commitStateQueue(c.bits.ftqIdx.value)(c.bits.ftqOffset + 2.U) := c_commited 1134c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 6.U) { 113588825c5cSYinan Xu val index = (c.bits.ftqIdx + 1.U).value 113688825c5cSYinan Xu commitStateQueue(index)(0) := c_commited 1137c3abb8b6SYinan Xu }.elsewhen(c.bits.commitType === 7.U) { 113888825c5cSYinan Xu val index = (c.bits.ftqIdx + 1.U).value 113988825c5cSYinan Xu commitStateQueue(index)(1) := c_commited 114088825c5cSYinan Xu } 114109c6f1ddSLingrui98 } 114209c6f1ddSLingrui98 } 114309c6f1ddSLingrui98 114489cc69c1STang Haojin robCommPtr_write := Mux(io.fromBackend.rob_commits.map(_.valid).reduce(_ | _), ParallelPriorityMux(io.fromBackend.rob_commits.map(_.valid).reverse, io.fromBackend.rob_commits.map(_.bits.ftqIdx).reverse), robCommPtr) 114589cc69c1STang Haojin 114609c6f1ddSLingrui98 // **************************************************************** 114709c6f1ddSLingrui98 // **************************** to bpu **************************** 114809c6f1ddSLingrui98 // **************************************************************** 114909c6f1ddSLingrui98 115051981c77SbugGenerator io.toBpu.redirect := Mux(fromBackendRedirect.valid, fromBackendRedirect, ifuRedirectToBpu) 1151209a4cafSSteve Gou val dummy_s1_pred_cycle_vec = VecInit(List.tabulate(FtqSize)(_=>0.U(64.W))) 1152209a4cafSSteve Gou val redirect_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(io.toBpu.redirect.bits.ftqIdx.value) + 1.U 1153209a4cafSSteve Gou XSPerfHistogram("backend_redirect_latency", redirect_latency, fromBackendRedirect.valid, 0, 60, 1) 1154209a4cafSSteve Gou XSPerfHistogram("ifu_redirect_latency", redirect_latency, !fromBackendRedirect.valid && ifuRedirectToBpu.valid, 0, 60, 1) 115509c6f1ddSLingrui98 1156f21bbcb2SGuokai Chen XSError(io.toBpu.redirect.valid && isBefore(io.toBpu.redirect.bits.ftqIdx, commPtr), "Ftq received a redirect after its commit, check backend or replay") 115709c6f1ddSLingrui98 115802f21c16SLingrui98 val may_have_stall_from_bpu = Wire(Bool()) 115902f21c16SLingrui98 val bpu_ftb_update_stall = RegInit(0.U(2.W)) // 2-cycle stall, so we need 3 states 116002f21c16SLingrui98 may_have_stall_from_bpu := bpu_ftb_update_stall =/= 0.U 116189cc69c1STang Haojin val notInvalidSeq = commitStateQueue(commPtr.value).map(s => s =/= c_invalid).reverse 11624b0d80d8SXuan Hu // Todo: @huxuan check it 11634b0d80d8SXuan Hu // canCommit := commPtr =/= ifuWbPtr && !may_have_stall_from_bpu && 11644b0d80d8SXuan Hu // Cat(commitStateQueue(commPtr.value).map(s => { 11654b0d80d8SXuan Hu // s === c_invalid || s === c_commited 11664b0d80d8SXuan Hu // })).andR 116743aca6c2SGuokai Chen canCommit := commPtr =/= ifuWbPtr && !may_have_stall_from_bpu && 116889cc69c1STang Haojin (isAfter(robCommPtr, commPtr) || PriorityMuxDefault(notInvalidSeq.zip(commitStateQueue(commPtr.value).reverse), c_invalid) === c_commited) 116909c6f1ddSLingrui98 11701d1e6d4dSJenius val mmioReadPtr = io.mmioCommitRead.mmioFtqPtr 11711d1e6d4dSJenius val mmioLastCommit = isBefore(commPtr, mmioReadPtr) && (isAfter(ifuPtr,mmioReadPtr) || mmioReadPtr === ifuPtr) && 1172935edac4STang Haojin Cat(commitStateQueue(mmioReadPtr.value).map(s => { s === c_invalid || s === c_commited})).andR 11731d1e6d4dSJenius io.mmioCommitRead.mmioLastCommit := RegNext(mmioLastCommit) 11741d1e6d4dSJenius 117509c6f1ddSLingrui98 // commit reads 1176c5c5edaeSJenius val commit_pc_bundle = RegNext(ftq_pc_mem.io.commPtr_rdata) 117781101dc4SLingrui98 val commit_target = 117834cf890eSLingrui98 Mux(RegNext(commPtr === newest_entry_ptr), 117934cf890eSLingrui98 RegNext(newest_entry_target), 118081101dc4SLingrui98 RegNext(ftq_pc_mem.io.commPtrPlus1_rdata.startAddr)) 118109c6f1ddSLingrui98 ftq_pd_mem.io.raddr.last := commPtr.value 118209c6f1ddSLingrui98 val commit_pd = ftq_pd_mem.io.rdata.last 118309c6f1ddSLingrui98 ftq_redirect_sram.io.ren.last := canCommit 118409c6f1ddSLingrui98 ftq_redirect_sram.io.raddr.last := commPtr.value 118509c6f1ddSLingrui98 val commit_spec_meta = ftq_redirect_sram.io.rdata.last 118609c6f1ddSLingrui98 ftq_meta_1r_sram.io.ren(0) := canCommit 118709c6f1ddSLingrui98 ftq_meta_1r_sram.io.raddr(0) := commPtr.value 118809c6f1ddSLingrui98 val commit_meta = ftq_meta_1r_sram.io.rdata(0) 118909c6f1ddSLingrui98 ftb_entry_mem.io.raddr.last := commPtr.value 119009c6f1ddSLingrui98 val commit_ftb_entry = ftb_entry_mem.io.rdata.last 119109c6f1ddSLingrui98 119209c6f1ddSLingrui98 // need one cycle to read mem and srams 119309c6f1ddSLingrui98 val do_commit_ptr = RegNext(commPtr) 11945371700eSzoujr val do_commit = RegNext(canCommit, init=false.B) 11956bf9b30dSLingrui98 when (canCommit) { 11966bf9b30dSLingrui98 commPtr_write := commPtrPlus1 11976bf9b30dSLingrui98 commPtrPlus1_write := commPtrPlus1 + 1.U 11986bf9b30dSLingrui98 } 119909c6f1ddSLingrui98 val commit_state = RegNext(commitStateQueue(commPtr.value)) 12005371700eSzoujr val can_commit_cfi = WireInit(cfiIndex_vec(commPtr.value)) 1201d4fcfc3eSGuokai Chen val do_commit_cfi = WireInit(cfiIndex_vec(do_commit_ptr.value)) 12023f88c020SGuokai Chen // 12033f88c020SGuokai Chen //when (commitStateQueue(commPtr.value)(can_commit_cfi.bits) =/= c_commited) { 12043f88c020SGuokai Chen // can_commit_cfi.valid := false.B 12053f88c020SGuokai Chen //} 12065371700eSzoujr val commit_cfi = RegNext(can_commit_cfi) 1207d4fcfc3eSGuokai Chen val debug_cfi = commitStateQueue(do_commit_ptr.value)(do_commit_cfi.bits) =/= c_commited && do_commit_cfi.valid 120809c6f1ddSLingrui98 1209cc2d1573SEaston Man val commit_mispredict : Vec[Bool] = VecInit((RegNext(mispredict_vec(commPtr.value)) zip commit_state).map { 121009c6f1ddSLingrui98 case (mis, state) => mis && state === c_commited 121109c6f1ddSLingrui98 }) 1212cc2d1573SEaston Man val commit_instCommited: Vec[Bool] = VecInit(commit_state.map(_ === c_commited)) // [PredictWidth] 12135371700eSzoujr val can_commit_hit = entry_hit_status(commPtr.value) 12145371700eSzoujr val commit_hit = RegNext(can_commit_hit) 12155fa3df0dSLingrui98 val diff_commit_target = RegNext(update_target(commPtr.value)) // TODO: remove this 1216edc18578SLingrui98 val commit_stage = RegNext(pred_stage(commPtr.value)) 121709c6f1ddSLingrui98 val commit_valid = commit_hit === h_hit || commit_cfi.valid // hit or taken 121809c6f1ddSLingrui98 12195371700eSzoujr val to_bpu_hit = can_commit_hit === h_hit || can_commit_hit === h_false_hit 122002f21c16SLingrui98 switch (bpu_ftb_update_stall) { 122102f21c16SLingrui98 is (0.U) { 122202f21c16SLingrui98 when (can_commit_cfi.valid && !to_bpu_hit && canCommit) { 122302f21c16SLingrui98 bpu_ftb_update_stall := 2.U // 2-cycle stall 122402f21c16SLingrui98 } 122502f21c16SLingrui98 } 122602f21c16SLingrui98 is (2.U) { 122702f21c16SLingrui98 bpu_ftb_update_stall := 1.U 122802f21c16SLingrui98 } 122902f21c16SLingrui98 is (1.U) { 123002f21c16SLingrui98 bpu_ftb_update_stall := 0.U 123102f21c16SLingrui98 } 123202f21c16SLingrui98 is (3.U) { 123302f21c16SLingrui98 XSError(true.B, "bpu_ftb_update_stall should be 0, 1 or 2") 123402f21c16SLingrui98 } 123502f21c16SLingrui98 } 123609c6f1ddSLingrui98 1237b0ed7239SLingrui98 // TODO: remove this 1238b0ed7239SLingrui98 XSError(do_commit && diff_commit_target =/= commit_target, "\ncommit target should be the same as update target\n") 1239b0ed7239SLingrui98 1240b2f6ed0aSSteve Gou // update latency stats 1241b2f6ed0aSSteve Gou val update_latency = GTimer() - pred_s1_cycle.getOrElse(dummy_s1_pred_cycle_vec)(do_commit_ptr.value) + 1.U 1242b2f6ed0aSSteve Gou XSPerfHistogram("bpu_update_latency", update_latency, io.toBpu.update.valid, 0, 64, 2) 1243b2f6ed0aSSteve Gou 124409c6f1ddSLingrui98 io.toBpu.update := DontCare 124509c6f1ddSLingrui98 io.toBpu.update.valid := commit_valid && do_commit 124609c6f1ddSLingrui98 val update = io.toBpu.update.bits 124709c6f1ddSLingrui98 update.false_hit := commit_hit === h_false_hit 124809c6f1ddSLingrui98 update.pc := commit_pc_bundle.startAddr 124909c6f1ddSLingrui98 update.meta := commit_meta.meta 1250803124a6SLingrui98 update.cfi_idx := commit_cfi 12518ffcd86aSLingrui98 update.full_target := commit_target 1252edc18578SLingrui98 update.from_stage := commit_stage 1253c2d1ec7dSLingrui98 update.spec_info := commit_spec_meta 12543f88c020SGuokai Chen XSError(commit_valid && do_commit && debug_cfi, "\ncommit cfi can be non c_commited\n") 125509c6f1ddSLingrui98 125609c6f1ddSLingrui98 val commit_real_hit = commit_hit === h_hit 125709c6f1ddSLingrui98 val update_ftb_entry = update.ftb_entry 125809c6f1ddSLingrui98 125909c6f1ddSLingrui98 val ftbEntryGen = Module(new FTBEntryGen).io 126009c6f1ddSLingrui98 ftbEntryGen.start_addr := commit_pc_bundle.startAddr 126109c6f1ddSLingrui98 ftbEntryGen.old_entry := commit_ftb_entry 126209c6f1ddSLingrui98 ftbEntryGen.pd := commit_pd 126309c6f1ddSLingrui98 ftbEntryGen.cfiIndex := commit_cfi 126409c6f1ddSLingrui98 ftbEntryGen.target := commit_target 126509c6f1ddSLingrui98 ftbEntryGen.hit := commit_real_hit 126609c6f1ddSLingrui98 ftbEntryGen.mispredict_vec := commit_mispredict 126709c6f1ddSLingrui98 126809c6f1ddSLingrui98 update_ftb_entry := ftbEntryGen.new_entry 126909c6f1ddSLingrui98 update.new_br_insert_pos := ftbEntryGen.new_br_insert_pos 127009c6f1ddSLingrui98 update.mispred_mask := ftbEntryGen.mispred_mask 127109c6f1ddSLingrui98 update.old_entry := ftbEntryGen.is_old_entry 1272edc18578SLingrui98 update.pred_hit := commit_hit === h_hit || commit_hit === h_false_hit 1273803124a6SLingrui98 update.br_taken_mask := ftbEntryGen.taken_mask 1274cc2d1573SEaston Man update.br_committed := (ftbEntryGen.new_entry.brValids zip ftbEntryGen.new_entry.brOffset) map { 1275cc2d1573SEaston Man case (valid, offset) => valid && commit_instCommited(offset) 1276cc2d1573SEaston Man } 1277803124a6SLingrui98 update.jmp_taken := ftbEntryGen.jmp_taken 1278b37e4b45SLingrui98 1279803124a6SLingrui98 // update.full_pred.fromFtbEntry(ftbEntryGen.new_entry, update.pc) 1280803124a6SLingrui98 // update.full_pred.jalr_target := commit_target 1281803124a6SLingrui98 // update.full_pred.hit := true.B 1282803124a6SLingrui98 // when (update.full_pred.is_jalr) { 1283803124a6SLingrui98 // update.full_pred.targets.last := commit_target 1284803124a6SLingrui98 // } 128509c6f1ddSLingrui98 1286e30430c2SJay // **************************************************************** 1287e30430c2SJay // *********************** to prefetch **************************** 1288e30430c2SJay // **************************************************************** 1289f9c51548Sssszwic /** 1290f9c51548Sssszwic ****************************************************************************** 1291f9c51548Sssszwic * prefetchPtr control 1292f9c51548Sssszwic * - 1. prefetchPtr plus 1 when toPrefetch fire and keep distance from bpuPtr more than 2 1293f9c51548Sssszwic * - 2. limit range of prefetchPtr is in [ifuPtr + minRange, ifuPtr + maxRange] 1294f9c51548Sssszwic * - 3. flush prefetchPtr when receive redirect from ifu or backend 1295f9c51548Sssszwic ****************************************************************************** 1296f9c51548Sssszwic */ 1297e30430c2SJay val prefetchPtr = RegInit(FtqPtr(false.B, 0.U)) 1298f9c51548Sssszwic val nextPrefetchPtr = WireInit(prefetchPtr) 1299e30430c2SJay 1300f9c51548Sssszwic prefetchPtr := nextPrefetchPtr 1301f9c51548Sssszwic 1302f9c51548Sssszwic // TODO: consider req which cross cacheline 1303f9c51548Sssszwic when(io.toPrefetch.req.fire) { 1304f9c51548Sssszwic when(prefetchPtr < bpuPtr - 2.U) { 1305f9c51548Sssszwic nextPrefetchPtr := prefetchPtr + 1.U 1306a677d2cbSguohongyu } 1307a677d2cbSguohongyu } 1308a677d2cbSguohongyu 1309f9c51548Sssszwic when(prefetchPtr < ifuPtr + minRangeFromIFUptr.U) { 1310f9c51548Sssszwic nextPrefetchPtr := ifuPtr + minRangeFromIFUptr.U 1311f9c51548Sssszwic }.elsewhen(prefetchPtr > ifuPtr + maxRangeFromIFUptr.U) { 1312f9c51548Sssszwic nextPrefetchPtr := ifuPtr + maxRangeFromIFUptr.U 1313e30430c2SJay } 1314e30430c2SJay 1315de7689fcSJay when(redirectVec.map(r => r.valid).reduce(_||_)){ 1316de7689fcSJay val r = PriorityMux(redirectVec.map(r => (r.valid -> r.bits))) 1317f9c51548Sssszwic val next = r.ftqIdx + minRangeFromIFUptr.U 1318f9c51548Sssszwic nextPrefetchPtr := next 1319de7689fcSJay } 1320de7689fcSJay 1321f9c51548Sssszwic // data from ftq_pc_mem has 1 cycle delay 1322f9c51548Sssszwic io.toPrefetch.req.valid := RegNext(entry_fetch_status(nextPrefetchPtr.value) === f_to_send) 1323f9c51548Sssszwic ftq_pc_mem.io.other_raddrs(0) := nextPrefetchPtr.value 1324f9c51548Sssszwic io.toPrefetch.req.bits.target := RegNext(ftq_pc_mem.io.other_rdatas(0).startAddr) 1325378f00d9SJenius 1326f9c51548Sssszwic // record position relationship between ifuPtr, pfPtr and bpuPtr 1327f9c51548Sssszwic val isWritePrefetchPtrTable = WireInit(Constantin.createRecord("isWritePrefetchPtrTable" + p(XSCoreParamsKey).HartId.toString)) 1328f9c51548Sssszwic val prefetchPtrTable = ChiselDB.createTable("PrefetchPtrTable" + p(XSCoreParamsKey).HartId.toString, new PrefetchPtrDB) 1329f9c51548Sssszwic val prefetchPtrDumpData = Wire(new PrefetchPtrDB) 1330f9c51548Sssszwic prefetchPtrDumpData.fromFtqPtr := distanceBetween(bpuPtr, prefetchPtr) 1331f9c51548Sssszwic prefetchPtrDumpData.fromIfuPtr := distanceBetween(prefetchPtr, ifuPtr) 1332378f00d9SJenius 1333f9c51548Sssszwic prefetchPtrTable.log( 1334f9c51548Sssszwic data = prefetchPtrDumpData, 1335f9c51548Sssszwic en = isWritePrefetchPtrTable.orR && io.toPrefetch.req.fire, 1336f9c51548Sssszwic site = "FTQ" + p(XSCoreParamsKey).HartId.toString, 1337f9c51548Sssszwic clock = clock, 1338f9c51548Sssszwic reset = reset 1339f9c51548Sssszwic ) 1340f9c51548Sssszwic 1341de7689fcSJay 134209c6f1ddSLingrui98 // ****************************************************************************** 134309c6f1ddSLingrui98 // **************************** commit perf counters **************************** 134409c6f1ddSLingrui98 // ****************************************************************************** 134509c6f1ddSLingrui98 134609c6f1ddSLingrui98 val commit_inst_mask = VecInit(commit_state.map(c => c === c_commited && do_commit)).asUInt 134709c6f1ddSLingrui98 val commit_mispred_mask = commit_mispredict.asUInt 134809c6f1ddSLingrui98 val commit_not_mispred_mask = ~commit_mispred_mask 134909c6f1ddSLingrui98 135009c6f1ddSLingrui98 val commit_br_mask = commit_pd.brMask.asUInt 135109c6f1ddSLingrui98 val commit_jmp_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.jmpInfo.valid.asTypeOf(UInt(1.W))) 135209c6f1ddSLingrui98 val commit_cfi_mask = (commit_br_mask | commit_jmp_mask) 135309c6f1ddSLingrui98 135409c6f1ddSLingrui98 val mbpInstrs = commit_inst_mask & commit_cfi_mask 135509c6f1ddSLingrui98 135609c6f1ddSLingrui98 val mbpRights = mbpInstrs & commit_not_mispred_mask 135709c6f1ddSLingrui98 val mbpWrongs = mbpInstrs & commit_mispred_mask 135809c6f1ddSLingrui98 135909c6f1ddSLingrui98 io.bpuInfo.bpRight := PopCount(mbpRights) 136009c6f1ddSLingrui98 io.bpuInfo.bpWrong := PopCount(mbpWrongs) 136109c6f1ddSLingrui98 1362da3bf434SMaxpicca-Li val isWriteFTQTable = WireInit(Constantin.createRecord("isWriteFTQTable" + p(XSCoreParamsKey).HartId.toString)) 136351532d8bSGuokai Chen val ftqBranchTraceDB = ChiselDB.createTable("FTQTable" + p(XSCoreParamsKey).HartId.toString, new FtqDebugBundle) 136409c6f1ddSLingrui98 // Cfi Info 136509c6f1ddSLingrui98 for (i <- 0 until PredictWidth) { 136609c6f1ddSLingrui98 val pc = commit_pc_bundle.startAddr + (i * instBytes).U 136709c6f1ddSLingrui98 val v = commit_state(i) === c_commited 136809c6f1ddSLingrui98 val isBr = commit_pd.brMask(i) 136909c6f1ddSLingrui98 val isJmp = commit_pd.jmpInfo.valid && commit_pd.jmpOffset === i.U 137009c6f1ddSLingrui98 val isCfi = isBr || isJmp 137109c6f1ddSLingrui98 val isTaken = commit_cfi.valid && commit_cfi.bits === i.U 137209c6f1ddSLingrui98 val misPred = commit_mispredict(i) 1373c2ad24ebSLingrui98 // val ghist = commit_spec_meta.ghist.predHist 1374c2ad24ebSLingrui98 val histPtr = commit_spec_meta.histPtr 137509c6f1ddSLingrui98 val predCycle = commit_meta.meta(63, 0) 137609c6f1ddSLingrui98 val target = commit_target 137709c6f1ddSLingrui98 137809c6f1ddSLingrui98 val brIdx = OHToUInt(Reverse(Cat(update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}))) 137909c6f1ddSLingrui98 val inFtbEntry = update_ftb_entry.brValids.zip(update_ftb_entry.brOffset).map{case(v, offset) => v && offset === i.U}.reduce(_||_) 138009c6f1ddSLingrui98 val addIntoHist = ((commit_hit === h_hit) && inFtbEntry) || ((!(commit_hit === h_hit) && i.U === commit_cfi.bits && isBr && commit_cfi.valid)) 138109c6f1ddSLingrui98 XSDebug(v && do_commit && isCfi, p"cfi_update: isBr(${isBr}) pc(${Hexadecimal(pc)}) " + 1382c2ad24ebSLingrui98 p"taken(${isTaken}) mispred(${misPred}) cycle($predCycle) hist(${histPtr.value}) " + 138309c6f1ddSLingrui98 p"startAddr(${Hexadecimal(commit_pc_bundle.startAddr)}) AddIntoHist(${addIntoHist}) " + 138409c6f1ddSLingrui98 p"brInEntry(${inFtbEntry}) brIdx(${brIdx}) target(${Hexadecimal(target)})\n") 138551532d8bSGuokai Chen 138651532d8bSGuokai Chen val logbundle = Wire(new FtqDebugBundle) 138751532d8bSGuokai Chen logbundle.pc := pc 138851532d8bSGuokai Chen logbundle.target := target 138951532d8bSGuokai Chen logbundle.isBr := isBr 139051532d8bSGuokai Chen logbundle.isJmp := isJmp 139151532d8bSGuokai Chen logbundle.isCall := isJmp && commit_pd.hasCall 139251532d8bSGuokai Chen logbundle.isRet := isJmp && commit_pd.hasRet 139351532d8bSGuokai Chen logbundle.misPred := misPred 139451532d8bSGuokai Chen logbundle.isTaken := isTaken 139551532d8bSGuokai Chen logbundle.predStage := commit_stage 139651532d8bSGuokai Chen 139751532d8bSGuokai Chen ftqBranchTraceDB.log( 139851532d8bSGuokai Chen data = logbundle /* hardware of type T */, 1399da3bf434SMaxpicca-Li en = isWriteFTQTable.orR && v && do_commit && isCfi, 140051532d8bSGuokai Chen site = "FTQ" + p(XSCoreParamsKey).HartId.toString, 140151532d8bSGuokai Chen clock = clock, 140251532d8bSGuokai Chen reset = reset 140351532d8bSGuokai Chen ) 140409c6f1ddSLingrui98 } 140509c6f1ddSLingrui98 140609c6f1ddSLingrui98 val enq = io.fromBpu.resp 14072e1be6e1SSteve Gou val perf_redirect = backendRedirect 140809c6f1ddSLingrui98 140909c6f1ddSLingrui98 XSPerfAccumulate("entry", validEntries) 141009c6f1ddSLingrui98 XSPerfAccumulate("bpu_to_ftq_stall", enq.valid && !enq.ready) 141109c6f1ddSLingrui98 XSPerfAccumulate("mispredictRedirect", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level) 141209c6f1ddSLingrui98 XSPerfAccumulate("replayRedirect", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level)) 141309c6f1ddSLingrui98 XSPerfAccumulate("predecodeRedirect", fromIfuRedirect.valid) 141409c6f1ddSLingrui98 141509c6f1ddSLingrui98 XSPerfAccumulate("to_ifu_bubble", io.toIfu.req.ready && !io.toIfu.req.valid) 141609c6f1ddSLingrui98 141709c6f1ddSLingrui98 XSPerfAccumulate("to_ifu_stall", io.toIfu.req.valid && !io.toIfu.req.ready) 141809c6f1ddSLingrui98 XSPerfAccumulate("from_bpu_real_bubble", !enq.valid && enq.ready && allowBpuIn) 141912cedb6fSLingrui98 XSPerfAccumulate("bpu_to_ifu_bubble", bpuPtr === ifuPtr) 1420b2f6ed0aSSteve Gou XSPerfAccumulate("bpu_to_ifu_bubble_when_ftq_full", (bpuPtr === ifuPtr) && isFull(bpuPtr, commPtr) && io.toIfu.req.ready) 142109c6f1ddSLingrui98 1422bace178aSGao-Zeyu XSPerfAccumulate("redirectAhead_ValidNum", ftqIdxAhead.map(_.valid).reduce(_|_)) 14239342624fSGao-Zeyu XSPerfAccumulate("fromBackendRedirect_ValidNum", io.fromBackend.redirect.valid) 14249342624fSGao-Zeyu XSPerfAccumulate("toBpuRedirect_ValidNum", io.toBpu.redirect.valid) 14259342624fSGao-Zeyu 142609c6f1ddSLingrui98 val from_bpu = io.fromBpu.resp.bits 142709c6f1ddSLingrui98 val to_ifu = io.toIfu.req.bits 142809c6f1ddSLingrui98 142909c6f1ddSLingrui98 1430209a4cafSSteve Gou XSPerfHistogram("commit_num_inst", PopCount(commit_inst_mask), do_commit, 0, PredictWidth+1, 1) 143109c6f1ddSLingrui98 143209c6f1ddSLingrui98 143309c6f1ddSLingrui98 143409c6f1ddSLingrui98 143509c6f1ddSLingrui98 val commit_jal_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJal.asTypeOf(UInt(1.W))) 143609c6f1ddSLingrui98 val commit_jalr_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasJalr.asTypeOf(UInt(1.W))) 143709c6f1ddSLingrui98 val commit_call_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasCall.asTypeOf(UInt(1.W))) 143809c6f1ddSLingrui98 val commit_ret_mask = UIntToOH(commit_pd.jmpOffset) & Fill(PredictWidth, commit_pd.hasRet.asTypeOf(UInt(1.W))) 143909c6f1ddSLingrui98 144009c6f1ddSLingrui98 144109c6f1ddSLingrui98 val mbpBRights = mbpRights & commit_br_mask 144209c6f1ddSLingrui98 val mbpJRights = mbpRights & commit_jal_mask 144309c6f1ddSLingrui98 val mbpIRights = mbpRights & commit_jalr_mask 144409c6f1ddSLingrui98 val mbpCRights = mbpRights & commit_call_mask 144509c6f1ddSLingrui98 val mbpRRights = mbpRights & commit_ret_mask 144609c6f1ddSLingrui98 144709c6f1ddSLingrui98 val mbpBWrongs = mbpWrongs & commit_br_mask 144809c6f1ddSLingrui98 val mbpJWrongs = mbpWrongs & commit_jal_mask 144909c6f1ddSLingrui98 val mbpIWrongs = mbpWrongs & commit_jalr_mask 145009c6f1ddSLingrui98 val mbpCWrongs = mbpWrongs & commit_call_mask 145109c6f1ddSLingrui98 val mbpRWrongs = mbpWrongs & commit_ret_mask 145209c6f1ddSLingrui98 14531d7e5011SLingrui98 val commit_pred_stage = RegNext(pred_stage(commPtr.value)) 14541d7e5011SLingrui98 14551d7e5011SLingrui98 def pred_stage_map(src: UInt, name: String) = { 14561d7e5011SLingrui98 (0 until numBpStages).map(i => 14571d7e5011SLingrui98 f"${name}_stage_${i+1}" -> PopCount(src.asBools.map(_ && commit_pred_stage === BP_STAGES(i))) 14581d7e5011SLingrui98 ).foldLeft(Map[String, UInt]())(_+_) 14591d7e5011SLingrui98 } 14601d7e5011SLingrui98 14611d7e5011SLingrui98 val mispred_stage_map = pred_stage_map(mbpWrongs, "mispredict") 14621d7e5011SLingrui98 val br_mispred_stage_map = pred_stage_map(mbpBWrongs, "br_mispredict") 14631d7e5011SLingrui98 val jalr_mispred_stage_map = pred_stage_map(mbpIWrongs, "jalr_mispredict") 14641d7e5011SLingrui98 val correct_stage_map = pred_stage_map(mbpRights, "correct") 14651d7e5011SLingrui98 val br_correct_stage_map = pred_stage_map(mbpBRights, "br_correct") 14661d7e5011SLingrui98 val jalr_correct_stage_map = pred_stage_map(mbpIRights, "jalr_correct") 14671d7e5011SLingrui98 146809c6f1ddSLingrui98 val update_valid = io.toBpu.update.valid 146909c6f1ddSLingrui98 def u(cond: Bool) = update_valid && cond 147009c6f1ddSLingrui98 val ftb_false_hit = u(update.false_hit) 147165fddcf0Szoujr // assert(!ftb_false_hit) 147209c6f1ddSLingrui98 val ftb_hit = u(commit_hit === h_hit) 147309c6f1ddSLingrui98 147409c6f1ddSLingrui98 val ftb_new_entry = u(ftbEntryGen.is_init_entry) 1475b37e4b45SLingrui98 val ftb_new_entry_only_br = ftb_new_entry && !update_ftb_entry.jmpValid 1476b37e4b45SLingrui98 val ftb_new_entry_only_jmp = ftb_new_entry && !update_ftb_entry.brValids(0) 1477b37e4b45SLingrui98 val ftb_new_entry_has_br_and_jmp = ftb_new_entry && update_ftb_entry.brValids(0) && update_ftb_entry.jmpValid 147809c6f1ddSLingrui98 147909c6f1ddSLingrui98 val ftb_old_entry = u(ftbEntryGen.is_old_entry) 148009c6f1ddSLingrui98 148109c6f1ddSLingrui98 val ftb_modified_entry = u(ftbEntryGen.is_new_br || ftbEntryGen.is_jalr_target_modified || ftbEntryGen.is_always_taken_modified) 148209c6f1ddSLingrui98 val ftb_modified_entry_new_br = u(ftbEntryGen.is_new_br) 1483d2b20d1aSTang Haojin val ftb_modified_entry_ifu_redirected = u(ifuRedirected(do_commit_ptr.value)) 148409c6f1ddSLingrui98 val ftb_modified_entry_jalr_target_modified = u(ftbEntryGen.is_jalr_target_modified) 148509c6f1ddSLingrui98 val ftb_modified_entry_br_full = ftb_modified_entry && ftbEntryGen.is_br_full 148609c6f1ddSLingrui98 val ftb_modified_entry_always_taken = ftb_modified_entry && ftbEntryGen.is_always_taken_modified 148709c6f1ddSLingrui98 1488209a4cafSSteve Gou def getFtbEntryLen(pc: UInt, entry: FTBEntry) = (entry.getFallThrough(pc) - pc) >> instOffsetBits 1489209a4cafSSteve Gou val gen_ftb_entry_len = getFtbEntryLen(update.pc, ftbEntryGen.new_entry) 1490209a4cafSSteve Gou XSPerfHistogram("ftb_init_entry_len", gen_ftb_entry_len, ftb_new_entry, 0, PredictWidth+1, 1) 1491209a4cafSSteve Gou XSPerfHistogram("ftb_modified_entry_len", gen_ftb_entry_len, ftb_modified_entry, 0, PredictWidth+1, 1) 1492209a4cafSSteve Gou val s3_ftb_entry_len = getFtbEntryLen(from_bpu.s3.pc(0), from_bpu.last_stage_ftb_entry) 1493209a4cafSSteve Gou XSPerfHistogram("s3_ftb_entry_len", s3_ftb_entry_len, from_bpu.s3.valid(0), 0, PredictWidth+1, 1) 149409c6f1ddSLingrui98 1495209a4cafSSteve Gou XSPerfHistogram("ftq_has_entry", validEntries, true.B, 0, FtqSize+1, 1) 149609c6f1ddSLingrui98 149709c6f1ddSLingrui98 val perfCountsMap = Map( 149809c6f1ddSLingrui98 "BpInstr" -> PopCount(mbpInstrs), 149909c6f1ddSLingrui98 "BpBInstr" -> PopCount(mbpBRights | mbpBWrongs), 150009c6f1ddSLingrui98 "BpRight" -> PopCount(mbpRights), 150109c6f1ddSLingrui98 "BpWrong" -> PopCount(mbpWrongs), 150209c6f1ddSLingrui98 "BpBRight" -> PopCount(mbpBRights), 150309c6f1ddSLingrui98 "BpBWrong" -> PopCount(mbpBWrongs), 150409c6f1ddSLingrui98 "BpJRight" -> PopCount(mbpJRights), 150509c6f1ddSLingrui98 "BpJWrong" -> PopCount(mbpJWrongs), 150609c6f1ddSLingrui98 "BpIRight" -> PopCount(mbpIRights), 150709c6f1ddSLingrui98 "BpIWrong" -> PopCount(mbpIWrongs), 150809c6f1ddSLingrui98 "BpCRight" -> PopCount(mbpCRights), 150909c6f1ddSLingrui98 "BpCWrong" -> PopCount(mbpCWrongs), 151009c6f1ddSLingrui98 "BpRRight" -> PopCount(mbpRRights), 151109c6f1ddSLingrui98 "BpRWrong" -> PopCount(mbpRWrongs), 151209c6f1ddSLingrui98 151309c6f1ddSLingrui98 "ftb_false_hit" -> PopCount(ftb_false_hit), 151409c6f1ddSLingrui98 "ftb_hit" -> PopCount(ftb_hit), 151509c6f1ddSLingrui98 "ftb_new_entry" -> PopCount(ftb_new_entry), 151609c6f1ddSLingrui98 "ftb_new_entry_only_br" -> PopCount(ftb_new_entry_only_br), 151709c6f1ddSLingrui98 "ftb_new_entry_only_jmp" -> PopCount(ftb_new_entry_only_jmp), 151809c6f1ddSLingrui98 "ftb_new_entry_has_br_and_jmp" -> PopCount(ftb_new_entry_has_br_and_jmp), 151909c6f1ddSLingrui98 "ftb_old_entry" -> PopCount(ftb_old_entry), 152009c6f1ddSLingrui98 "ftb_modified_entry" -> PopCount(ftb_modified_entry), 152109c6f1ddSLingrui98 "ftb_modified_entry_new_br" -> PopCount(ftb_modified_entry_new_br), 152209c6f1ddSLingrui98 "ftb_jalr_target_modified" -> PopCount(ftb_modified_entry_jalr_target_modified), 152309c6f1ddSLingrui98 "ftb_modified_entry_br_full" -> PopCount(ftb_modified_entry_br_full), 152409c6f1ddSLingrui98 "ftb_modified_entry_always_taken" -> PopCount(ftb_modified_entry_always_taken) 1525209a4cafSSteve Gou ) ++ mispred_stage_map ++ br_mispred_stage_map ++ jalr_mispred_stage_map ++ 15261d7e5011SLingrui98 correct_stage_map ++ br_correct_stage_map ++ jalr_correct_stage_map 152709c6f1ddSLingrui98 152809c6f1ddSLingrui98 for((key, value) <- perfCountsMap) { 152909c6f1ddSLingrui98 XSPerfAccumulate(key, value) 153009c6f1ddSLingrui98 } 153109c6f1ddSLingrui98 153209c6f1ddSLingrui98 // --------------------------- Debug -------------------------------- 153309c6f1ddSLingrui98 // XSDebug(enq_fire, p"enq! " + io.fromBpu.resp.bits.toPrintable) 153409c6f1ddSLingrui98 XSDebug(io.toIfu.req.fire, p"fire to ifu " + io.toIfu.req.bits.toPrintable) 153509c6f1ddSLingrui98 XSDebug(do_commit, p"deq! [ptr] $do_commit_ptr\n") 153609c6f1ddSLingrui98 XSDebug(true.B, p"[bpuPtr] $bpuPtr, [ifuPtr] $ifuPtr, [ifuWbPtr] $ifuWbPtr [commPtr] $commPtr\n") 153709c6f1ddSLingrui98 XSDebug(true.B, p"[in] v:${io.fromBpu.resp.valid} r:${io.fromBpu.resp.ready} " + 153809c6f1ddSLingrui98 p"[out] v:${io.toIfu.req.valid} r:${io.toIfu.req.ready}\n") 153909c6f1ddSLingrui98 XSDebug(do_commit, p"[deq info] cfiIndex: $commit_cfi, $commit_pc_bundle, target: ${Hexadecimal(commit_target)}\n") 154009c6f1ddSLingrui98 154109c6f1ddSLingrui98 // def ubtbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 154209c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 154309c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 154409c6f1ddSLingrui98 // Mux(valid && pd.isBr, 154509c6f1ddSLingrui98 // isWrong ^ Mux(ans.hit.asBool, 154609c6f1ddSLingrui98 // Mux(ans.taken.asBool, taken && ans.target === commitEntry.target, 154709c6f1ddSLingrui98 // !taken), 154809c6f1ddSLingrui98 // !taken), 154909c6f1ddSLingrui98 // false.B) 155009c6f1ddSLingrui98 // } 155109c6f1ddSLingrui98 // } 155209c6f1ddSLingrui98 155309c6f1ddSLingrui98 // def btbCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 155409c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 155509c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 155609c6f1ddSLingrui98 // Mux(valid && pd.isBr, 155709c6f1ddSLingrui98 // isWrong ^ Mux(ans.hit.asBool, 155809c6f1ddSLingrui98 // Mux(ans.taken.asBool, taken && ans.target === commitEntry.target, 155909c6f1ddSLingrui98 // !taken), 156009c6f1ddSLingrui98 // !taken), 156109c6f1ddSLingrui98 // false.B) 156209c6f1ddSLingrui98 // } 156309c6f1ddSLingrui98 // } 156409c6f1ddSLingrui98 156509c6f1ddSLingrui98 // def tageCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 156609c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 156709c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 156809c6f1ddSLingrui98 // Mux(valid && pd.isBr, 156909c6f1ddSLingrui98 // isWrong ^ (ans.taken.asBool === taken), 157009c6f1ddSLingrui98 // false.B) 157109c6f1ddSLingrui98 // } 157209c6f1ddSLingrui98 // } 157309c6f1ddSLingrui98 157409c6f1ddSLingrui98 // def loopCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 157509c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 157609c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 157709c6f1ddSLingrui98 // Mux(valid && (pd.isBr) && ans.hit.asBool, 157809c6f1ddSLingrui98 // isWrong ^ (!taken), 157909c6f1ddSLingrui98 // false.B) 158009c6f1ddSLingrui98 // } 158109c6f1ddSLingrui98 // } 158209c6f1ddSLingrui98 158309c6f1ddSLingrui98 // def rasCheck(commit: FtqEntry, predAns: Seq[PredictorAnswer], isWrong: Bool) = { 158409c6f1ddSLingrui98 // commit.valids.zip(commit.pd).zip(predAns).zip(commit.takens).map { 158509c6f1ddSLingrui98 // case (((valid, pd), ans), taken) => 158609c6f1ddSLingrui98 // Mux(valid && pd.isRet.asBool /*&& taken*/ && ans.hit.asBool, 158709c6f1ddSLingrui98 // isWrong ^ (ans.target === commitEntry.target), 158809c6f1ddSLingrui98 // false.B) 158909c6f1ddSLingrui98 // } 159009c6f1ddSLingrui98 // } 159109c6f1ddSLingrui98 159209c6f1ddSLingrui98 // val ubtbRights = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), false.B) 159309c6f1ddSLingrui98 // val ubtbWrongs = ubtbCheck(commitEntry, commitEntry.metas.map(_.ubtbAns), true.B) 159409c6f1ddSLingrui98 // // btb and ubtb pred jal and jalr as well 159509c6f1ddSLingrui98 // val btbRights = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), false.B) 159609c6f1ddSLingrui98 // val btbWrongs = btbCheck(commitEntry, commitEntry.metas.map(_.btbAns), true.B) 159709c6f1ddSLingrui98 // val tageRights = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), false.B) 159809c6f1ddSLingrui98 // val tageWrongs = tageCheck(commitEntry, commitEntry.metas.map(_.tageAns), true.B) 159909c6f1ddSLingrui98 160009c6f1ddSLingrui98 // val loopRights = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), false.B) 160109c6f1ddSLingrui98 // val loopWrongs = loopCheck(commitEntry, commitEntry.metas.map(_.loopAns), true.B) 160209c6f1ddSLingrui98 160309c6f1ddSLingrui98 // val rasRights = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), false.B) 160409c6f1ddSLingrui98 // val rasWrongs = rasCheck(commitEntry, commitEntry.metas.map(_.rasAns), true.B) 16051ca0e4f3SYinan Xu 1606cd365d4cSrvcoresjw val perfEvents = Seq( 1607cd365d4cSrvcoresjw ("bpu_s2_redirect ", bpu_s2_redirect ), 1608cb4f77ceSLingrui98 ("bpu_s3_redirect ", bpu_s3_redirect ), 1609cd365d4cSrvcoresjw ("bpu_to_ftq_stall ", enq.valid && ~enq.ready ), 1610cd365d4cSrvcoresjw ("mispredictRedirect ", perf_redirect.valid && RedirectLevel.flushAfter === perf_redirect.bits.level), 1611cd365d4cSrvcoresjw ("replayRedirect ", perf_redirect.valid && RedirectLevel.flushItself(perf_redirect.bits.level) ), 1612cd365d4cSrvcoresjw ("predecodeRedirect ", fromIfuRedirect.valid ), 1613cd365d4cSrvcoresjw ("to_ifu_bubble ", io.toIfu.req.ready && !io.toIfu.req.valid ), 1614cd365d4cSrvcoresjw ("from_bpu_real_bubble ", !enq.valid && enq.ready && allowBpuIn ), 1615cd365d4cSrvcoresjw ("BpInstr ", PopCount(mbpInstrs) ), 1616cd365d4cSrvcoresjw ("BpBInstr ", PopCount(mbpBRights | mbpBWrongs) ), 1617cd365d4cSrvcoresjw ("BpRight ", PopCount(mbpRights) ), 1618cd365d4cSrvcoresjw ("BpWrong ", PopCount(mbpWrongs) ), 1619cd365d4cSrvcoresjw ("BpBRight ", PopCount(mbpBRights) ), 1620cd365d4cSrvcoresjw ("BpBWrong ", PopCount(mbpBWrongs) ), 1621cd365d4cSrvcoresjw ("BpJRight ", PopCount(mbpJRights) ), 1622cd365d4cSrvcoresjw ("BpJWrong ", PopCount(mbpJWrongs) ), 1623cd365d4cSrvcoresjw ("BpIRight ", PopCount(mbpIRights) ), 1624cd365d4cSrvcoresjw ("BpIWrong ", PopCount(mbpIWrongs) ), 1625cd365d4cSrvcoresjw ("BpCRight ", PopCount(mbpCRights) ), 1626cd365d4cSrvcoresjw ("BpCWrong ", PopCount(mbpCWrongs) ), 1627cd365d4cSrvcoresjw ("BpRRight ", PopCount(mbpRRights) ), 1628cd365d4cSrvcoresjw ("BpRWrong ", PopCount(mbpRWrongs) ), 1629cd365d4cSrvcoresjw ("ftb_false_hit ", PopCount(ftb_false_hit) ), 1630cd365d4cSrvcoresjw ("ftb_hit ", PopCount(ftb_hit) ), 1631cd365d4cSrvcoresjw ) 16321ca0e4f3SYinan Xu generatePerfEvent() 163309c6f1ddSLingrui98} 1634