/***************************************************************************************
* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
* Copyright (c) 2020-2021 Peng Cheng Laboratory
*
* XiangShan is licensed under Mulan PSL v2.
* You can use this software according to the terms and conditions of the Mulan PSL v2.
* You may obtain a copy of Mulan PSL v2 at:
*          http://license.coscl.org.cn/MulanPSL2
*
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
*
* See the Mulan PSL v2 for more details.
***************************************************************************************/

package xiangshan.frontend

import chipsalliance.rocketchip.config.Parameters
import chisel3._
import chisel3.stage.{ChiselGeneratorAnnotation, ChiselStage}
import chisel3.util._
import xiangshan._
import utils._
import chisel3.experimental.chiselName

import scala.math.min


/** Static sizing and encoding constants shared by all FTB structures. */
trait FTBParams extends HasXSParameter with HasBPUConst {
  val numEntries = 4096
  val numWays    = 4
  val numSets    = numEntries/numWays // 1024
  val tagSize    = 20

  // Width and encodings of the "target status" field stored next to the low
  // target bits. It tells getTarget how to rebuild the high target bits from
  // the high bits of the pc: unchanged (FIT), plus one (OVF) or minus one (UDF).
  val TAR_STAT_SZ = 2
  def TAR_FIT = 0.U(TAR_STAT_SZ.W)
  def TAR_OVF = 1.U(TAR_STAT_SZ.W)
  def TAR_UDF = 2.U(TAR_STAT_SZ.W)

  // Number of low target bits stored verbatim for branches / jumps.
  def BR_OFFSET_LEN = 13
  def JMP_OFFSET_LEN = 21
}

/** One FTB entry: up to `numBr` branch slots, one jump slot and a partial
  * fall-through address, plus helpers to encode/decode the compressed targets.
  */
class FTBEntry(implicit p: Parameters) extends XSBundle with FTBParams with BPUUtils {
  val valid       = Bool()

  val brOffset    = Vec(numBr, UInt(log2Up(FetchWidth*2).W))
  val brLowers    = Vec(numBr, UInt(BR_OFFSET_LEN.W))
  val brTarStats  = Vec(numBr, UInt(TAR_STAT_SZ.W))
  val brValids    = Vec(numBr, Bool())

  val jmpOffset   = UInt(log2Ceil(PredictWidth).W)
  val jmpLower    = UInt(JMP_OFFSET_LEN.W)
  val jmpTarStat  = UInt(TAR_STAT_SZ.W)
  val jmpValid    = Bool()

  // Partial Fall-Through Address
  val pftAddr     = UInt((log2Up(PredictWidth)+1).W)
  val carry       = Bool()

  val isCall      = Bool()
  val isRet       = Bool()
  val isJalr      = Bool()

  val oversize    = Bool()

  val last_is_rvc = Bool()

  val always_taken = Vec(numBr, Bool())

  /** Rebuilds a full target address from its compressed form.
    *
    * @param offsetLen number of low target bits that were stored verbatim
    * @param pc        address supplying the high bits
    * @param lower     stored low `offsetLen` bits of the target
    * @param stat      TAR_FIT / TAR_OVF / TAR_UDF selector for the high bits
    * @return          Cat(adjusted high bits of pc, lower)
    */
  def getTarget(offsetLen: Int)(pc: UInt, lower: UInt, stat: UInt) = {
    val higher = pc(VAddrBits-1, offsetLen)
    Cat(
      Mux(stat === TAR_OVF, higher+1.U,
        Mux(stat === TAR_UDF, higher-1.U, higher)),
      lower
    )
  }
  val getBrTarget = getTarget(BR_OFFSET_LEN)(_, _, _)

  /** Full targets of all branch slots, decoded relative to `pc`. */
  def getBrTargets(pc: UInt) = {
    VecInit((brLowers zip brTarStats).map{
      case (lower, stat) => getBrTarget(pc, lower, stat)
    })
  }

  /** Full target of the jump slot, decoded relative to `pc`. */
  def getJmpTarget(pc: UInt) = getTarget(JMP_OFFSET_LEN)(pc, jmpLower, jmpTarStat)

  /** Compresses `target` into (low bits, status) relative to `pc`.
    *
    * NOTE(review): the status only records whether the high bits of the target
    * are greater or smaller than those of the pc, while getTarget adds or
    * subtracts exactly one. This presumably relies on targets never being
    * further away than one `offsetLen`-sized region - confirm with callers.
    */
  def getLowerStatByTarget(offsetLen: Int)(pc: UInt, target: UInt) = {
    val pc_higher = pc(VAddrBits-1, offsetLen)
    val target_higher = target(VAddrBits-1, offsetLen)
    val stat = WireInit(Mux(target_higher > pc_higher, TAR_OVF,
      Mux(target_higher < pc_higher, TAR_UDF, TAR_FIT)))
    val lower = WireInit(target(offsetLen-1, 0))
    (lower, stat)
  }
  def getBrLowerStatByTarget(pc: UInt, target: UInt) = getLowerStatByTarget(BR_OFFSET_LEN)(pc, target)
  def getJmpLowerStatByTarget(pc: UInt, target: UInt) = getLowerStatByTarget(JMP_OFFSET_LEN)(pc, target)

  /** Writes the compressed form of `target` into branch slot `brIdx`. */
  def setByBrTarget(brIdx: Int, pc: UInt, target: UInt) = {
    val (lower, stat) = getBrLowerStatByTarget(pc, target)
    this.brLowers(brIdx) := lower
    this.brTarStats(brIdx) := stat
  }

  /** Writes the compressed form of `target` into the jump slot. */
  def setByJmpTarget(pc: UInt, target: UInt) = {
    val (lower, stat) = getJmpLowerStatByTarget(pc, target)
    this.jmpLower := lower
    this.jmpTarStat := stat
  }


  def getOffsetVec = VecInit(brOffset :+ jmpOffset)
  def isJal = !isJalr
  def getFallThrough(pc: UInt) = getFallThroughAddr(pc, carry, pftAddr)

  /** True when any valid branch slot sits at or before `offset`. */
  def hasBr(offset: UInt) = (brValids zip brOffset).map{
    case (v, off) => v && off <= offset
  }.reduce(_||_)

  /** Per-slot version of hasBr: one Bool per branch slot. */
  def getBrMaskByOffset(offset: UInt) = (brValids zip brOffset).map{
    case (v, off) => v && off <= offset
  }

  /** True when a valid branch slot is recorded exactly at `offset`. */
  def brIsSaved(offset: UInt) = (brValids zip brOffset).map{
    case (v, off) => v && off === offset
  }.reduce(_||_)

  /** Debug-prints the entry whenever `cond` holds. */
  def display(cond: Bool): Unit = {
    XSDebug(cond, p"-----------FTB entry----------- \n")
    XSDebug(cond, p"v=${valid}\n")
    for(i <- 0 until numBr) {
      XSDebug(cond, p"[br$i]: v=${brValids(i)}, offset=${brOffset(i)}, lower=${Hexadecimal(brLowers(i))}\n")
    }
    XSDebug(cond, p"[jmp]: v=${jmpValid}, offset=${jmpOffset}, lower=${Hexadecimal(jmpLower)}\n")
    XSDebug(cond, p"pftAddr=${Hexadecimal(pftAddr)}, carry=$carry\n")
    XSDebug(cond, p"isCall=$isCall, isRet=$isRet, isjalr=$isJalr\n")
    XSDebug(cond, p"oversize=$oversize, last_is_rvc=$last_is_rvc\n")
    XSDebug(cond, p"------------------------------- \n")
  }

}

/** An FTBEntry together with the tag it is stored under; this is the SRAM word. */
class FTBEntryWithTag(implicit p: Parameters) extends XSBundle with FTBParams with BPUUtils {
  val entry = new FTBEntry
  val tag = UInt(tagSize.W)

  /** Debug-prints the entry and its tag whenever `cond` holds. */
  def display(cond: Bool): Unit = {
    XSDebug(cond, p"-----------FTB entry----------- \n")
    XSDebug(cond, p"v=${entry.valid}, tag=${Hexadecimal(tag)}\n")
    for(i <- 0 until numBr) {
      XSDebug(cond, p"[br$i]: v=${entry.brValids(i)}, offset=${entry.brOffset(i)}, lower=${Hexadecimal(entry.brLowers(i))}\n")
    }
    XSDebug(cond, p"[jmp]: v=${entry.jmpValid}, offset=${entry.jmpOffset}, lower=${Hexadecimal(entry.jmpLower)}\n")
    XSDebug(cond, p"pftAddr=${Hexadecimal(entry.pftAddr)}, carry=${entry.carry}\n")
    XSDebug(cond, p"isCall=${entry.isCall}, isRet=${entry.isRet}, isjalr=${entry.isJalr}\n")
    XSDebug(cond, p"oversize=${entry.oversize}, last_is_rvc=${entry.last_is_rvc}\n")
    XSDebug(cond, p"------------------------------- \n")
  }
}

/** Prediction-time metadata that travels with a prediction and comes back on update. */
class FTBMeta(implicit p: Parameters) extends XSBundle with FTBParams {
  val writeWay = UInt(log2Ceil(numWays).W)
  val hit = Bool()
  val pred_cycle = UInt(64.W) // TODO: Use Option
}

object FTBMeta {
  /** Builds an FTBMeta wire driven by the given fields. */
  def apply(writeWay: UInt, hit: Bool, pred_cycle: UInt)(implicit p: Parameters): FTBMeta = {
    val e = Wire(new FTBMeta)
    e.writeWay := writeWay
    e.hit := hit
    e.pred_cycle := pred_cycle
    e
  }
}

// class UpdateQueueEntry(implicit p: Parameters) extends XSBundle with FTBParams {
//   val pc = UInt(VAddrBits.W)
//   val ftb_entry = new FTBEntry
//   val hit = Bool()
//   val hit_way = UInt(log2Ceil(numWays).W)
// }
//
// object UpdateQueueEntry {
//   def apply(pc: UInt, fe: FTBEntry, hit: Bool, hit_way: UInt)(implicit p: Parameters): UpdateQueueEntry = {
//     val e = Wire(new UpdateQueueEntry)
//     e.pc := pc
//     e.ftb_entry := fe
//     e.hit := hit
//     e.hit_way := hit_way
//     e
//   }
// }

/** FTB predictor: a set-associative table of FTBEntry indexed by fetch pc.
  *
  * The read is issued with s0_pc when io.s0_fire is set; the selected entry is
  * registered on io.s1_fire and drives the s2 response. Updates that carry a
  * meta hit are written directly; updates without a meta hit first re-read the
  * set and are written one cycle later.
  */
class FTB(implicit p: Parameters) extends BasePredictor with FTBParams with BPUUtils with HasCircularQueuePtrHelper {
  override val meta_size = WireInit(0.U.asTypeOf(new FTBMeta)).getWidth

  val ftbAddr = new TableAddr(log2Up(numSets), 1)

  /** Single-port SRAM bank shared by the prediction read, the update read and
    * the update write.
    *
    * NOTE(review): `nWays` is not referenced in the body; all way-dependent
    * widths use the enclosing FTB's `numWays`. The only visible instantiation
    * passes `numWays` for it, so both agree there.
    */
  class FTBBank(val numSets: Int, val nWays: Int) extends XSModule with BPUUtils {
    val io = IO(new Bundle {
      val s1_fire = Input(Bool())

      // when ftb hit, read_hits.valid is true, and read_hits.bits is OH of hit way
      // when ftb not hit, read_hits.valid is false, and read_hits is OH of allocWay
      // val read_hits = Valid(Vec(numWays, Bool()))
      // NOTE(review): as implemented below, read_hits.bits is the binary index
      // produced by PriorityEncoder(total_hits), not a one-hot vector.
      val req_pc = Flipped(DecoupledIO(UInt(VAddrBits.W)))
      val read_resp = Output(new FTBEntry)
      val read_hits = Valid(UInt(log2Ceil(numWays).W))

      val u_req_pc = Flipped(DecoupledIO(UInt(VAddrBits.W)))
      val update_hits = Valid(UInt(log2Ceil(numWays).W))
      val update_access = Input(Bool())

      val update_pc = Input(UInt(VAddrBits.W))
      val update_write_data = Flipped(Valid(new FTBEntryWithTag))
      val update_write_way = Input(UInt(log2Ceil(numWays).W))
      val update_write_alloc = Input(Bool())
    })

    // Extract holdRead logic to fix bug that update read override predict read result
    val ftb = Module(new SRAMTemplate(new FTBEntryWithTag, set = numSets, way = numWays, shouldReset = true, holdRead = false, singlePort = true))

    // Prediction read data: captured only in the cycle after a prediction read
    // that was not displaced by an update access, and held otherwise.
    val pred_rdata = HoldUnless(ftb.io.r.resp.data, RegNext(io.req_pc.valid && !io.update_access))
    ftb.io.r.req.valid := io.req_pc.valid || io.u_req_pc.valid // io.s0_fire
    ftb.io.r.req.bits.setIdx := Mux(io.u_req_pc.valid, ftbAddr.getIdx(io.u_req_pc.bits), ftbAddr.getIdx(io.req_pc.bits)) // s0_idx

    // The single read port cannot serve a prediction read and an update read together.
    assert(!(io.req_pc.valid && io.u_req_pc.valid))

    io.req_pc.ready := ftb.io.r.req.ready
    io.u_req_pc.ready := ftb.io.r.req.ready

    val req_tag = RegEnable(ftbAddr.getTag(io.req_pc.bits)(tagSize-1, 0), io.req_pc.valid)
    val req_idx = RegEnable(ftbAddr.getIdx(io.req_pc.bits), io.req_pc.valid)

    val u_req_tag = RegEnable(ftbAddr.getTag(io.u_req_pc.bits)(tagSize-1, 0), io.u_req_pc.valid)

    val read_entries = pred_rdata.map(_.entry)
    val read_tags    = pred_rdata.map(_.tag)

    // Prediction hit detection, qualified by s1_fire.
    val total_hits = VecInit((0 until numWays).map(b => read_tags(b) === req_tag && read_entries(b).valid && io.s1_fire))
    val hit = total_hits.reduce(_||_)
    // val hit_way_1h = VecInit(PriorityEncoderOH(total_hits))
    val hit_way = PriorityEncoder(total_hits)

    // Update hit detection works on the raw SRAM output in the cycle after the
    // update read (RegNext(io.update_access)), not on the held prediction data.
    val u_total_hits = VecInit((0 until numWays).map(b =>
        ftb.io.r.resp.data(b).tag === u_req_tag && ftb.io.r.resp.data(b).entry.valid && RegNext(io.update_access)))
    val u_hit = u_total_hits.reduce(_||_)
    // val hit_way_1h = VecInit(PriorityEncoderOH(total_hits))
    val u_hit_way = PriorityEncoder(u_total_hits)

    // A tag may match in at most one way.
    assert(PopCount(total_hits) === 1.U || PopCount(total_hits) === 0.U)
    assert(PopCount(u_total_hits) === 1.U || PopCount(u_total_hits) === 0.U)

    val replacer = ReplacementPolicy.fromString(Some("setplru"), numWays, numSets)
    // val allocWriteWay = replacer.way(req_idx)

    val touch_set = Seq.fill(1)(Wire(UInt(log2Ceil(numSets).W)))
    val touch_way = Seq.fill(1)(Wire(Valid(UInt(log2Ceil(numWays).W))))

    // Only prediction hits touch the replacement state.
    touch_set(0) := req_idx

    touch_way(0).valid := hit
    touch_way(0).bits := hit_way

    replacer.access(touch_set, touch_way)

    // def allocWay(valids: UInt, meta_tags: UInt, req_tag: UInt) = {
    //   val randomAlloc = false
    //   if (numWays > 1) {
    //     val w = Wire(UInt(log2Up(numWays).W))
    //     val valid = WireInit(valids.andR)
    //     val tags = Cat(meta_tags, req_tag)
    //     val l = log2Up(numWays)
    //     val nChunks = (tags.getWidth + l - 1) / l
    //     val chunks = (0 until nChunks).map( i =>
    //       tags(min((i+1)*l, tags.getWidth)-1, i*l)
    //     )
    //     w := Mux(valid, if (randomAlloc) {LFSR64()(log2Up(numWays)-1,0)} else {chunks.reduce(_^_)}, PriorityEncoder(~valids))
    //     w
    //   } else {
    //     val w = WireInit(0.U)
    //     w
    //   }
    // }

    // val allocWriteWay = allocWay(
    //   VecInit(read_entries.map(_.valid)).asUInt,
    //   VecInit(read_tags).asUInt,
    //   req_tag
    // )

    /** Picks the way to allocate in set `idx`.
      *
      * @param valids per-way valid bits of that set
      * @param idx    set index handed to the replacer
      * @return       lowest invalid way if one exists, else the replacer's victim
      */
    def allocWay(valids: UInt, idx: UInt) = {
      if (numWays > 1) {
        val w = Wire(UInt(log2Up(numWays).W))
        val valid = WireInit(valids.andR)
        w := Mux(valid, replacer.way(idx), PriorityEncoder(~valids))
        w
      }else {
        val w = WireInit(0.U)
        w
      }
    }

    io.read_resp := PriorityMux(total_hits, read_entries) // Mux1H
    io.read_hits.valid := hit
    // io.read_hits.bits := Mux(hit, hit_way_1h, VecInit(UIntToOH(allocWriteWay).asBools()))
    io.read_hits.bits := hit_way

    io.update_hits.valid := u_hit
    io.update_hits.bits := u_hit_way

    // XSDebug(!hit, "FTB not hit, alloc a way: %d\n", allocWriteWay)

    // Update logic
    val u_valid = io.update_write_data.valid
    val u_data = io.update_write_data.bits
    val u_idx = ftbAddr.getIdx(io.update_pc)
    // Valid bits of the set fetched by the update read. Allocation must look at
    // this data rather than at pred_rdata: pred_rdata is deliberately NOT
    // refreshed by an update read, so in the write cycle it still holds an
    // earlier prediction read of an unrelated set, and searching it for an
    // empty way would pick the way from the wrong set's occupancy.
    val u_read_valids = VecInit(ftb.io.r.resp.data.map(_.entry.valid)).asUInt
    val allocWriteWay = allocWay(u_read_valids, u_idx)
    val u_mask = UIntToOH(Mux(io.update_write_alloc, allocWriteWay, io.update_write_way))

    for (i <- 0 until numWays) {
      XSPerfAccumulate(f"ftb_replace_way$i", u_valid && io.update_write_alloc && OHToUInt(u_mask) === i.U)
      XSPerfAccumulate(f"ftb_replace_way${i}_has_empty", u_valid && io.update_write_alloc && !u_read_valids.andR && OHToUInt(u_mask) === i.U)
      XSPerfAccumulate(f"ftb_hit_way$i", hit && !io.update_access && hit_way === i.U)
    }

    ftb.io.w.apply(u_valid, u_data, u_idx, u_mask)
  } // FTBBank

  val ftbBank = Module(new FTBBank(numSets, numWays))

  ftbBank.io.req_pc.valid := io.s0_fire
  ftbBank.io.req_pc.bits := s0_pc

  val ftb_entry = RegEnable(ftbBank.io.read_resp, io.s1_fire)
  val s1_hit = ftbBank.io.read_hits.valid
  val s2_hit = RegEnable(s1_hit, io.s1_fire)
  val writeWay = ftbBank.io.read_hits.bits

  val fallThruAddr = getFallThroughAddr(s2_pc, ftb_entry.carry, ftb_entry.pftAddr)

  // io.out.bits.resp := RegEnable(io.in.bits.resp_in(0), 0.U.asTypeOf(new BranchPredictionResp), io.s1_fire)
  io.out.resp := io.in.bits.resp_in(0)

  val s1_latch_call_is_rvc   = DontCare // TODO: modify when add RAS

  io.out.resp.s2.preds.taken_mask    := io.in.bits.resp_in(0).s2.preds.taken_mask
  // NOTE(review): this loop forces taken for always_taken slots without
  // checking s2_hit, which makes the s2_hit-guarded loop further down
  // redundant. Confirm whether the unguarded form is intended.
  for (i <- 0 until numBr) {
    when (ftb_entry.always_taken(i)) {
      io.out.resp.s2.preds.taken_mask(i) := true.B
    }
  }

  io.out.resp.s2.preds.hit           := s2_hit
  io.out.resp.s2.pc                  := s2_pc
  io.out.resp.s2.ftb_entry           := ftb_entry
  io.out.resp.s2.preds.fromFtbEntry(ftb_entry, s2_pc)

  // Meta is captured at s1 and delayed to s3 through two enable registers.
  io.out.s3_meta                     := RegEnable(RegEnable(FTBMeta(writeWay, s1_hit, GTimer()).asUInt(), io.s1_fire), io.s2_fire)

  when(s2_hit) {
    io.out.resp.s2.ftb_entry.pftAddr := ftb_entry.pftAddr
    io.out.resp.s2.ftb_entry.carry := ftb_entry.carry
  }.otherwise {
    // On a miss, synthesize the fall-through fields from s2_pc instead of the entry.
    io.out.resp.s2.ftb_entry.pftAddr := s2_pc(instOffsetBits + log2Ceil(PredictWidth), instOffsetBits) ^ (1 << log2Ceil(PredictWidth)).U
    io.out.resp.s2.ftb_entry.carry := s2_pc(instOffsetBits + log2Ceil(PredictWidth)).asBool
    io.out.resp.s2.ftb_entry.oversize := false.B
  }

  // always taken logic
  when (s2_hit) {
    for (i <- 0 until numBr) {
      when (ftb_entry.always_taken(i)) {
        io.out.resp.s2.preds.taken_mask(i) := true.B
      }
    }
  }

  // Update logic
  val update = RegNext(io.update.bits)

  // val update_queue = Mem(64, new UpdateQueueEntry)
  // val head, tail = RegInit(UpdateQueuePtr(false.B, 0.U))
  // val u_queue = Module(new Queue(new UpdateQueueEntry, entries = 64, flow = true))
  // assert(u_queue.io.count < 64.U)

  val u_meta = update.meta.asTypeOf(new FTBMeta)
  val u_valid = RegNext(io.update.valid && !io.update.bits.old_entry)

  // io.s1_ready := ftbBank.io.req_pc.ready && u_queue.io.count === 0.U && !u_valid
  // Not ready in the cycle an update without meta hit issues its read.
  io.s1_ready := ftbBank.io.req_pc.ready && !(u_valid && !u_meta.hit)

  // val update_now = u_queue.io.deq.fire && u_queue.io.deq.bits.hit
  // With a meta hit the way is already known, so the write happens immediately.
  val update_now = u_valid && u_meta.hit

  // Without a meta hit, re-read the set first to look for the tag / a free way.
  ftbBank.io.u_req_pc.valid := u_valid && !u_meta.hit
  ftbBank.io.u_req_pc.bits := update.pc

  // assert(!(u_valid && RegNext(u_valid) && update.pc === RegNext(update.pc)))
  // assert(!(u_valid && RegNext(u_valid)))

  // val u_way = u_queue.io.deq.bits.hit_way

  val ftb_write = Wire(new FTBEntryWithTag)
  // ftb_write.entry := Mux(update_now, u_queue.io.deq.bits.ftb_entry, RegNext(u_queue.io.deq.bits.ftb_entry))
  // ftb_write.tag   := ftbAddr.getTag(Mux(update_now, u_queue.io.deq.bits.pc, RegNext(u_queue.io.deq.bits.pc)))(tagSize-1, 0)
  // The delayed (no meta hit) path writes the values from the previous cycle.
  ftb_write.entry := Mux(update_now, update.ftb_entry, RegNext(update.ftb_entry))
  ftb_write.tag   := ftbAddr.getTag(Mux(update_now, update.pc, RegNext(update.pc)))(tagSize-1, 0)

  // val write_valid = update_now || RegNext(u_queue.io.deq.fire && !u_queue.io.deq.bits.hit)
  val write_valid = update_now || RegNext(u_valid && !u_meta.hit)

  // u_queue.io.enq.valid := u_valid
  // u_queue.io.enq.bits := UpdateQueueEntry(update.pc, update.ftb_entry, u_meta.hit, u_meta.writeWay)
  // u_queue.io.deq.ready := RegNext(!u_queue.io.deq.fire || update_now)

  ftbBank.io.update_write_data.valid := write_valid
  ftbBank.io.update_write_data.bits := ftb_write
  // ftbBank.io.update_pc := Mux(update_now, u_queue.io.deq.bits.pc, RegNext(u_queue.io.deq.bits.pc))
  ftbBank.io.update_pc          := Mux(update_now, update.pc,       RegNext(update.pc))
  ftbBank.io.update_write_way   := Mux(update_now, u_meta.writeWay, ftbBank.io.update_hits.bits)
  // ftbBank.io.update_write_alloc := Mux(update_now, !u_queue.io.deq.bits.hit, !ftbBank.io.update_hits.valid)
  // Allocation is only possible on the delayed path, when the re-read missed.
  ftbBank.io.update_write_alloc := Mux(update_now, false.B,         !ftbBank.io.update_hits.valid)
  ftbBank.io.update_access := u_valid && !u_meta.hit
  ftbBank.io.s1_fire := io.s1_fire

  XSDebug("req_v=%b, req_pc=%x, ready=%b (resp at next cycle)\n", io.s0_fire, s0_pc, ftbBank.io.req_pc.ready)
  XSDebug("s2_hit=%b, hit_way=%b\n", s2_hit, writeWay.asUInt)
  XSDebug("s2_taken_mask=%b, s2_real_taken_mask=%b\n",
    io.in.bits.resp_in(0).s2.preds.taken_mask.asUInt, io.out.resp.s2.real_taken_mask().asUInt)
  XSDebug("s2_target=%x\n", io.out.resp.s2.target)

  ftb_entry.display(true.B)

  // XSDebug(u_valid, "Update from ftq\n")
  // XSDebug(u_valid, "update_pc=%x, tag=%x, pred_cycle=%d\n",
  //   update.pc, ftbAddr.getTag(update.pc), u_meta.pred_cycle)
  // XSDebug(RegNext(u_valid), "Write into FTB\n")
  // XSDebug(RegNext(u_valid), "hit=%d, update_write_way=%d\n",
  //   ftbBank.io.update_hits.valid, u_meta.writeWay)





  XSPerfAccumulate("ftb_read_hits", RegNext(io.s0_fire) && s1_hit)
  XSPerfAccumulate("ftb_read_misses", RegNext(io.s0_fire) && !s1_hit)

  XSPerfAccumulate("ftb_commit_hits", io.update.valid && io.update.bits.preds.hit)
  XSPerfAccumulate("ftb_commit_misses", io.update.valid && !io.update.bits.preds.hit)

  XSPerfAccumulate("ftb_update_req", io.update.valid)
  XSPerfAccumulate("ftb_update_ignored", io.update.valid && io.update.bits.old_entry)
  XSPerfAccumulate("ftb_updated", u_valid)
}