/***************************************************************************************
* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
* Copyright (c) 2020-2021 Peng Cheng Laboratory
*
* XiangShan is licensed under Mulan PSL v2.
* You can use this software according to the terms and conditions of the Mulan PSL v2.
* You may obtain a copy of Mulan PSL v2 at:
*          http://license.coscl.org.cn/MulanPSL2
*
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
*
* See the Mulan PSL v2 for more details.
***************************************************************************************/
package xiangshan.frontend

import chipsalliance.rocketchip.config.Parameters
import chisel3._
import chisel3.util._
import chisel3.experimental.chiselName
import xiangshan._
import utils._
import scala.math._

/** Fetch request bundle: start / fall-through / target addresses plus the FTQ
  * pointer and the offset of the control-flow instruction inside the block.
  */
@chiselName
class FetchRequestBundle(implicit p: Parameters) extends XSBundle {
  val startAddr     = UInt(VAddrBits.W)
  val fallThruAddr  = UInt(VAddrBits.W)
  val fallThruError = Bool()
  val ftqIdx        = new FtqPtr
  val ftqOffset     = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
  val target        = UInt(VAddrBits.W)
  val oversize      = Bool()

  /** Drives `startAddr`, `fallThruError`, `fallThruAddr` and `oversize` from `b`.
    * When `b.fallThroughError()` is asserted, `b.nextRangeAddr` is used as the
    * fall-through address instead of `b.getFallThrough()`.
    * The remaining fields are not assigned here.
    *
    * @return this bundle, to allow chaining
    */
  def fromFtqPcBundle(b: Ftq_RF_Components) = {
    val ftError = b.fallThroughError()
    this.startAddr := b.startAddr
    this.fallThruError := ftError
    this.fallThruAddr := Mux(ftError, b.nextRangeAddr, b.getFallThrough())
    this.oversize := b.oversize
    this
  }

  /** Drives `startAddr`, `target`, `ftqOffset`, `fallThruAddr` and `oversize`
    * from a BPU response.
    *
    * @return this bundle, to allow chaining
    */
  def fromBpuResp(resp: BranchPredictionBundle) = {
    // only used for bypassing, so the other fields are left unassigned here
    this.startAddr := resp.pc
    this.target := resp.target
    this.ftqOffset := resp.genCfiIndex
    this.fallThruAddr := resp.fallThroughAddr
    this.oversize := resp.ftb_entry.oversize
    this
  }

  override def toPrintable: Printable = {
    // each fragment after the first starts with a space so that the fields
    // do not run together in the printed line
    p"[start] ${Hexadecimal(startAddr)} [pft] ${Hexadecimal(fallThruAddr)}" +
      p" [tgt] ${Hexadecimal(target)} [ftqIdx] $ftqIdx [jmp] v:${ftqOffset.valid}" +
      p" offset: ${ftqOffset.bits}\n"
  }
}

/** Pre-decode write-back bundle: per-instruction PCs and pre-decode info for one
  * fetch block, together with the FTQ pointer, offsets and targets.
  */
class PredecodeWritebackBundle(implicit p:Parameters) extends XSBundle {
  val pc           = Vec(PredictWidth, UInt(VAddrBits.W))
  val pd           = Vec(PredictWidth, new PreDecodeInfo) // TODO: redefine Predecode
  val ftqIdx       = new FtqPtr
  val ftqOffset    = UInt(log2Ceil(PredictWidth).W)
  val misOffset    = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
  val cfiOffset    = ValidUndirectioned(UInt(log2Ceil(PredictWidth).W))
  val target       = UInt(VAddrBits.W)
  val jalTarget    = UInt(VAddrBits.W)
  val instrRange   = Vec(PredictWidth, Bool())
}

/** Request sent from the FTQ to the prefetcher: a single target address. */
class PrefetchRequest(implicit p:Parameters) extends XSBundle {
  val target          = UInt(VAddrBits.W)
}

/** Decoupled (ready/valid) channel carrying [[PrefetchRequest]]s. */
class FtqPrefechBundle(implicit p:Parameters) extends XSBundle {
  val req = DecoupledIO(new PrefetchRequest)
}

/** Bundle of per-slot instruction data; every `Vec` field has `PredictWidth` entries. */
class FetchToIBuffer(implicit p: Parameters) extends XSBundle {
  val instrs    = Vec(PredictWidth, UInt(32.W))
  val valid     = UInt(PredictWidth.W)
  val enqEnable = UInt(PredictWidth.W)
  val pd        = Vec(PredictWidth, new PreDecodeInfo)
  val pc        = Vec(PredictWidth, UInt(VAddrBits.W))
  val foldpc    = Vec(PredictWidth, UInt(MemPredPCWidth.W))
  val ftqPtr       = new FtqPtr
  val ftqOffset    = Vec(PredictWidth, ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)))
  val ipf          = Vec(PredictWidth, Bool())
  val acf          = Vec(PredictWidth, Bool())
  val crossPageIPFFix = Vec(PredictWidth, Bool())
  val triggered    = Vec(PredictWidth, new TriggerCf)
}

// class BitWiseUInt(val width: Int, val init: UInt) extends Module {
//   val io = IO(new Bundle {
//     val set
//   })
// }
// Moved from BPU
/** Common interface of the global-history representations in this file. */
abstract class GlobalHistory(implicit p: Parameters) extends XSBundle with HasBPUConst {
  def update(br_valids: Vec[Bool], real_taken_mask: Vec[Bool]): GlobalHistory
}

/** Global history stored as a plain shift register of `HistoryLength` bits. */
class ShiftingGlobalHistory(implicit p: Parameters) extends GlobalHistory {
  val predHist = UInt(HistoryLength.W)

  /** Builds a new history wire holding `(hist << shift) | taken`.
    *
    * @param shift number of positions to shift the history left
    * @param taken bit OR-ed into the least significant position
    * @param hist  history to start from (defaults to this bundle's `predHist`)
    */
  def update(shift: UInt, taken: Bool, hist: UInt = this.predHist): ShiftingGlobalHistory = {
    val g = Wire(new ShiftingGlobalHistory)
    g.predHist := (hist << shift) | taken
    g
  }

  /** Updates the history from per-branch valid and taken masks (both of length `numBr`).
    *
    * The shift amount is the smaller of
    *  - the 1-based position of the last valid branch (0 if none is valid), and
    *  - the `PriorityEncoder` result over the taken mask with a leading `false`,
    *    i.e. the 1-based position of the first taken branch when there is one.
    * The bit shifted in is the OR of the taken mask.
    */
  def update(br_valids: Vec[Bool], real_taken_mask: Vec[Bool]): ShiftingGlobalHistory = {
    require(br_valids.length == numBr)
    require(real_taken_mask.length == numBr)
    val last_valid_idx = PriorityMux(
      br_valids.reverse :+ true.B,
      (numBr to 0 by -1).map(_.U(log2Ceil(numBr+1).W))
    )
    val first_taken_idx = PriorityEncoder(false.B +: real_taken_mask)
    val smaller = Mux(last_valid_idx < first_taken_idx,
      last_valid_idx,
      first_taken_idx
    )
    val shift = smaller
    val taken = real_taken_mask.reduce(_||_)
    update(shift, taken, this.predHist)
  }

  /** Static read of history bit `n` (index fixed at elaboration time). */
  def read(n: Int): Bool = predHist.asBools()(n)

  final def === (that: ShiftingGlobalHistory): Bool = {
    predHist === that.predHist
  }

  final def =/= (that: ShiftingGlobalHistory): Bool = !(this === that)
}

/** Circular global history pointer; the queue size is `HistoryLength`. */
class CGHPtr(implicit p: Parameters) extends CircularQueuePtr[CGHPtr](
  p => p(XSCoreParamsKey).HistoryLength
){
  override def cloneType = (new CGHPtr).asInstanceOf[this.type]
}

/** Global history stored as a buffer of `HistoryLength` single-bit entries. */
class CircularGlobalHistory(implicit p: Parameters) extends GlobalHistory {
  val buffer = Vec(HistoryLength, Bool())
  type HistPtr = UInt

  /** Currently a no-op: returns this bundle unchanged. */
  def update(br_valids: Vec[Bool], real_taken_mask: Vec[Bool]): CircularGlobalHistory = {
    this
  }
}

/** A `len`-bit history folded into `compLen` bits.
  *
  * @param len            length of the unfolded history (must be > 0)
  * @param compLen        width of the folded history (must be >= 1 and >= `max_update_num`)
  * @param max_update_num maximum number of history bits handled by one update
  */
class FoldedHistory(val len: Int, val compLen: Int, val max_update_num: Int)(implicit p: Parameters)
  extends XSBundle with HasBPUConst {
  require(compLen >= 1)
  require(len > 0)
  // require(folded_len <= len)
  require(compLen >= max_update_num)
  val folded_hist = UInt(compLen.W)

  def info = (len, compLen)
  /** Indices `len-1, len-2, ...` (`max_update_num` of them) of the oldest history bits. */
  def oldest_bit_to_get_from_ghr = (0 until max_update_num).map(len - _ - 1)
  /** Position inside the folded history of each of the oldest bits (index modulo `compLen`). */
  def oldest_bit_pos_in_folded = oldest_bit_to_get_from_ghr map (_ % compLen)
  /** Whether each of the oldest bits has an index of at least `compLen`, i.e. has wrapped around. */
  def oldest_bit_wrap_around = oldest_bit_to_get_from_ghr map (_ / compLen > 0)
  def oldest_bit_start = oldest_bit_pos_in_folded.head

  /** Reads the oldest bits out of the circular history `ghr`, addressed relative to `histPtr`. */
  def get_oldest_bits_from_ghr(ghr: Vec[Bool], histPtr: CGHPtr) = {
    // TODO: wrap inc for histPtr value
    oldest_bit_to_get_from_ghr.map(i => ghr((histPtr + (i+1).U).value))
  }

  /** Rotates `src` left by the constant `shamt` within its own width, by slicing
    * the concatenation `src ## src`.
    */
  def circular_shift_left(src: UInt, shamt: Int) = {
    val srcLen = src.getWidth
    val src_doubled = Cat(src, src)
    val shifted = src_doubled(srcLen*2-1-shamt, srcLen-shamt)
    shifted
  }


  /** Computes the folded history after `num` new bits enter the history.
    *
    * If `len <= compLen` the folded history is simply shifted left by `num` with
    * `taken` OR-ed in and truncated to `compLen` bits. Otherwise the (masked)
    * current bits, the oldest bits leaving the history and the newest bits are
    * XOR-ed position by position, and the result is rotated left by `num`.
    *
    * @param ghr     circular global history buffer
    * @param histPtr pointer into `ghr`
    * @param num     number of history bits added by this update (elaboration-time constant)
    * @param taken   taken bit of this update
    * @return a wire initialised from this bundle with `folded_hist` replaced
    */
  def update(ghr: Vec[Bool], histPtr: CGHPtr, num: Int, taken: Bool): FoldedHistory = {
    // XOR together, per bit position, all the bits that the given bitsets place there
    def bitsets_xor(len: Int, bitsets: Seq[Seq[Tuple2[Int, Bool]]]) = {
      val res = Wire(Vec(len, Bool()))
      // println(f"num bitsets: ${bitsets.length}")
      // println(f"bitsets $bitsets")
      val resArr = Array.fill(len)(List[Bool]())
      for (bs <- bitsets) {
        for ((n, b) <- bs) {
          resArr(n) = b :: resArr(n)
        }
      }
      // println(f"${resArr.mkString}")
      // println(f"histLen: ${this.len}, foldedLen: $folded_len")
      for (i <- 0 until len) {
        // println(f"bit[$i], ${resArr(i).mkString}")
        if (resArr(i).length > 2) {
          println(f"[warning] update logic of foldest history has two or more levels of xor gates! " +
            f"histlen:${this.len}, compLen:$compLen")
        }
        if (resArr(i).length == 0) {
          println(f"[error] bits $i is not assigned in folded hist update logic! histlen:${this.len}, compLen:$compLen")
        }
        res(i) := resArr(i).foldLeft(false.B)(_^_)
      }
      res.asUInt
    }
    val oldest_bits = get_oldest_bits_from_ghr(ghr, histPtr)

    // mask off bits that do not update
    val oldest_bits_masked = oldest_bits.zipWithIndex.map{
      case (ob, i) => ob && (i < num).B
    }
    // if a bit does not wrap around, it should not be xored when it exits
    val oldest_bits_set = (0 until max_update_num).filter(oldest_bit_wrap_around).map(i => (oldest_bit_pos_in_folded(i), oldest_bits_masked(i)))

    // println(f"old bits pos ${oldest_bits_set.map(_._1)}")

    // only the last bit could be 1, as we have at most one taken branch at a time
    val newest_bits_masked = VecInit((0 until max_update_num).map(i => taken && ((i+1) == num).B)).asUInt
    // if a bit does not wrap around, newest bits should not be xored onto it either
    val newest_bits_set = (0 until max_update_num).map(i => (compLen-1-i, newest_bits_masked(i)))

    // println(f"new bits set ${newest_bits_set.map(_._1)}")
    //
    val original_bits_masked = VecInit(folded_hist.asBools.zipWithIndex.map{
      case (fb, i) => fb && !(num >= (len-i)).B
    })
    val original_bits_set = (0 until compLen).map(i => (i, original_bits_masked(i)))


    val new_folded_hist =
      if (len <= compLen) {
        // histLen too short to wrap around
        ((folded_hist << num) | taken)(compLen-1,0)
        // circular_shift_left(max_update_num)(Cat(Reverse(newest_bits_masked), folded_hist(compLen-max_update_num-1,0)), num)
      } else {
        // do xor then shift
        val xored = bitsets_xor(compLen, Seq(original_bits_set, oldest_bits_set, newest_bits_set))
        circular_shift_left(xored, num)
      }
    val fh = WireInit(this)
    fh.folded_hist := new_folded_hist
    fh
  }

  // def update(ghr: Vec[Bool], histPtr: CGHPtr, valids: Vec[Bool], takens: Vec[Bool]): FoldedHistory = {
  //   val fh = WireInit(this)
  //   require(valids.length == max_update_num)
  //   require(takens.length == max_update_num)
  //   val last_valid_idx = PriorityMux(
  //     valids.reverse :+ true.B,
  //     (max_update_num to 0 by -1).map(_.U(log2Ceil(max_update_num+1).W))
  //   )
  //   val first_taken_idx = PriorityEncoder(false.B +: takens)
  //   val smaller = Mux(last_valid_idx < first_taken_idx,
  //     last_valid_idx,
  //     first_taken_idx
  //   )
  //   // update folded_hist
  //   fh.update(ghr, histPtr, smaller, takens.reduce(_||_))
  // }
  // println(f"folded hist original length: ${len}, folded len: ${folded_len} " +
  //   f"oldest bits' pos in folded: ${oldest_bit_pos_in_folded}")


}

/** Splits a `VAddrBits`-wide address into `tag | idx | offset` fields.
  *
  * @param idxBits width of the index field
  * @param banks   number of banks; when greater than 1 the low `log2Up(banks)`
  *                bits of the index select the bank
  */
class TableAddr(val idxBits: Int, val banks: Int)(implicit p: Parameters) extends XSBundle{
  def tagBits = VAddrBits - idxBits - instOffsetBits

  val tag = UInt(tagBits.W)
  val idx = UInt(idxBits.W)
  val offset = UInt(instOffsetBits.W)

  /** Reinterprets `x`, converted to `VAddrBits` bits, as this bundle. */
  def fromUInt(x: UInt) = x.asTypeOf(UInt(VAddrBits.W)).asTypeOf(this)
  def getTag(x: UInt) = fromUInt(x).tag
  def getIdx(x: UInt) = fromUInt(x).idx
  /** Bank select bits of `x`, or constant 0 when there is a single bank. */
  def getBank(x: UInt) = if (banks > 1) getIdx(x)(log2Up(banks) - 1, 0) else 0.U
  /** Index of `x` inside its bank (the index with the bank select bits removed). */
  def getBankIdx(x: UInt) = if (banks > 1) getIdx(x)(idxBits - 1, log2Up(banks)) else getIdx(x)
}

/** Branch prediction bundle: per-branch taken mask, per-slot valid bits and
  * targets, tail-slot jump-type flags and a hit flag.
  */
@chiselName
class BranchPrediction(implicit p: Parameters) extends XSBundle with HasBPUConst {
  val br_taken_mask = Vec(numBr, Bool())

  val slot_valids = Vec(totalSlot, Bool())

  val targets = Vec(totalSlot, UInt(VAddrBits.W))

  val is_jal = Bool()
  val is_jalr = Bool()
  val is_call = Bool()
  val is_ret = Bool()
  val is_br_sharing = Bool()

  // val call_is_rvc = Bool()
  val hit = Bool()

  /** Valid bits of every slot except the last one. */
  def br_slot_valids = slot_valids.init
  /** Valid bit of the last (tail) slot. */
  def tail_slot_valid = slot_valids.last

  /** Valid bits of the conditional branches. With `shareTailSlot`, the tail
    * slot counts as a branch when it is valid and `is_br_sharing` is set.
    */
  def br_valids = {
    VecInit(
      if (shareTailSlot)
        br_slot_valids :+ (tail_slot_valid && is_br_sharing)
      else
        br_slot_valids
    )
  }

  /** Per-slot taken mask. A branch slot is taken when it is valid and its
    * `br_taken_mask` bit is set. The tail slot is taken whenever it is valid,
    * except that with `shareTailSlot` and `is_br_sharing` it additionally
    * requires the last `br_taken_mask` bit.
    */
  def taken_mask_on_slot = {
    VecInit(
      if (shareTailSlot)
        (br_slot_valids zip br_taken_mask.init).map{ case (t, v) => t && v } :+ (
          (br_taken_mask.last && tail_slot_valid && is_br_sharing) ||
          tail_slot_valid && !is_br_sharing
        )
      else
        (br_slot_valids zip br_taken_mask).map{ case (v, t) => v && t } :+
        tail_slot_valid
    )
  }

  def taken = br_taken_mask.reduce(_||_) || slot_valids.last // || (is_jal || is_jalr)

  /** Drives slot valids, targets and the tail-slot flags from an FTB entry.
    * `br_taken_mask` and `hit` are not assigned here.
    */
  def fromFtbEntry(entry: FTBEntry, pc: UInt) = {
    slot_valids := entry.brSlots.map(_.valid) :+ entry.tailSlot.valid
    targets := entry.getTargetVec(pc)
    is_jal := entry.tailSlot.valid && entry.isJal
    is_jalr := entry.tailSlot.valid && entry.isJalr
    is_call := entry.tailSlot.valid && entry.isCall
    is_ret := entry.tailSlot.valid && entry.isRet
    is_br_sharing := entry.tailSlot.valid && entry.tailSlot.sharing
  }
  // override def toPrintable: Printable = {
  //   p"-----------BranchPrediction----------- " +
  //     p"[taken_mask] ${Binary(taken_mask.asUInt)} " +
  //     p"[is_br] ${Binary(is_br.asUInt)}, [is_jal] ${Binary(is_jal.asUInt)} " +
  //     p"[is_jalr] ${Binary(is_jalr.asUInt)}, [is_call] ${Binary(is_call.asUInt)}, [is_ret] ${Binary(is_ret.asUInt)} " +
  //     p"[target] ${Hexadecimal(target)}}, [hit] $hit "
  // }

  def display(cond: Bool): Unit = {
    XSDebug(cond, p"[taken_mask] ${Binary(br_taken_mask.asUInt)} [hit] $hit\n")
  }
}

/** Prediction bundle for one fetch block: the prediction itself, the history
  * and RAS state fields, and the FTB entry.
  */
@chiselName
class BranchPredictionBundle(implicit p: Parameters) extends XSBundle with HasBPUConst with BPUUtils{
  val pc = UInt(VAddrBits.W)

  val valid = Bool()

  val hasRedirect = Bool()
  val ftq_idx = new FtqPtr
  // val hit = Bool()
  val preds = new BranchPrediction

  val folded_hist = new AllFoldedHistories(foldedGHistInfos)
  val histPtr = new CGHPtr
  val phist = UInt(PathHistoryLength.W)
  val rasSp = UInt(log2Ceil(RasSize).W)
  val rasTop = new RASEntry
  val specCnt = Vec(numBr, UInt(10.W))
  // val meta = UInt(MaxMetaLength.W)

  val ftb_entry = new FTBEntry() // TODO: Send this entry to ftq

  /** Per-slot taken mask gated by `preds.hit`. */
  def real_slot_taken_mask(): Vec[Bool] = {
    VecInit(preds.taken_mask_on_slot.map(_ && preds.hit))
  }

  /** Per-branch taken mask gated by `preds.hit`. With `shareTailSlot` the
    * last entry is the tail slot taken as a shared branch.
    */
  // len numBr
  def real_br_taken_mask(): Vec[Bool] = {
    if (shareTailSlot)
      VecInit(
        preds.taken_mask_on_slot.map(_ && preds.hit).init :+
        (preds.br_taken_mask.last && preds.tail_slot_valid && preds.is_br_sharing && preds.hit)
      )
    else
      VecInit(real_slot_taken_mask().init)
  }

  // the vec indicating if ghr should shift on each branch:
  // a branch shifts the history when it is valid and no earlier branch is taken
  def shouldShiftVec =
    VecInit(preds.br_valids.zipWithIndex.map{ case (v, i) =>
      v && !real_br_taken_mask().take(i).reduceOption(_||_).getOrElse(false.B)})

  /** Sequence of `numBr + 1` flags. Element 0 is set on a miss or when the
    * entry holds no valid branch. Element `i + 1` is set when, on a hit,
    * branch `i` is valid, no earlier branch is taken, and branch `i` is either
    * taken or not followed by another valid branch.
    */
  def lastBrPosOH =
    (!preds.hit || !preds.br_valids.reduce(_||_)) +: // not hit or no brs in entry
    VecInit((0 until numBr).map(i =>
      preds.br_valids(i) &&
      !real_br_taken_mask().take(i).reduceOption(_||_).getOrElse(false.B) && // no brs taken in front of it
      (real_br_taken_mask()(i) || !preds.br_valids.drop(i+1).reduceOption(_||_).getOrElse(false.B)) && // taken, or no brs behind it
      preds.hit
    ))

  /** The smaller of the 1-based position of the last valid branch (0 if none)
    * and the `PriorityEncoder` result over `false +: real_br_taken_mask()`.
    */
  def br_count(): UInt = {
    val last_valid_idx = PriorityMux(
      preds.br_valids.reverse :+ true.B,
      (numBr to 0 by -1).map(_.U(log2Ceil(numBr+1).W))
    )
    val first_taken_idx = PriorityEncoder(false.B +: real_br_taken_mask())
    Mux(last_valid_idx < first_taken_idx,
      last_valid_idx,
      first_taken_idx
    )
  }

  /** Set when no slot before the tail is taken and the tail slot is taken as a
    * jump (i.e. not as a shared branch).
    */
  def hit_taken_on_jmp =
    // reduceOption (as used by the neighbouring methods) keeps elaboration from
    // throwing if there are no slots in front of the tail slot
    !real_slot_taken_mask().init.reduceOption(_||_).getOrElse(false.B) &&
    real_slot_taken_mask().last && !preds.is_br_sharing
  def hit_taken_on_call = hit_taken_on_jmp && preds.is_call
  def hit_taken_on_ret  = hit_taken_on_jmp && preds.is_ret
  def hit_taken_on_jalr = hit_taken_on_jmp && preds.is_jalr

  def fallThroughAddr = getFallThroughAddr(pc, ftb_entry.carry, ftb_entry.pftAddr)

  /** Predicted next address, chosen by priority: the target of the first taken
    * slot; else the fall-through address on a hit with no taken slot; else
    * `pc + FetchWidth * 4`.
    */
  def target(): UInt = {
    val targetVec = preds.targets :+ fallThroughAddr :+ (pc + (FetchWidth*4).U)
    val selVec = real_slot_taken_mask() :+ (preds.hit && !real_slot_taken_mask().asUInt.orR) :+ true.B
    PriorityMux(selVec zip targetVec)
  }

  /** Builds the control-flow index: valid when any slot is taken, with `bits`
    * being the offset of the first taken slot.
    */
  def genCfiIndex = {
    val cfiIndex = Wire(ValidUndirectioned(UInt(log2Ceil(PredictWidth).W)))
    cfiIndex.valid := real_slot_taken_mask().asUInt.orR
    // when no slot is taken, set cfiIndex to PredictWidth-1 (all ones)
    cfiIndex.bits :=
      ParallelPriorityMux(real_slot_taken_mask(), ftb_entry.getOffsetVec) |
      Fill(log2Ceil(PredictWidth), (!real_slot_taken_mask().asUInt.orR).asUInt)
    cfiIndex
  }

  def display(cond: Bool): Unit = {
    XSDebug(cond, p"[pc] ${Hexadecimal(pc)}\n")
    folded_hist.display(cond)
    preds.display(cond)
    ftb_entry.display(cond)
  }
}

/** Bundle of three prediction results, `s1`, `s2` and `s3`. */
@chiselName
class BranchPredictionResp(implicit p: Parameters) extends XSBundle with HasBPUConst {
  // val valids = Vec(3, Bool())
  val s1 = new BranchPredictionBundle()
  val s2 = new BranchPredictionBundle()
  val s3 = new BranchPredictionBundle()

  /** The response to use: `s3` or `s2` when valid with a redirect (`s3` first), otherwise `s1`. */
  def selectedResp =
    PriorityMux(Seq(
      ((s3.valid && s3.hasRedirect) -> s3),
      ((s2.valid && s2.hasRedirect) -> s2),
      (s1.valid -> s1)
    ))
  /** Stage identifier matching [[selectedResp]]. */
  def selectedRespIdx =
    PriorityMux(Seq(
      ((s3.valid && s3.hasRedirect) -> BP_S3),
      ((s2.valid && s2.hasRedirect) -> BP_S2),
      (s1.valid -> BP_S1)
    ))
  def lastStage = s3
}

/** [[BranchPredictionResp]] extended with a `meta` field of `MaxMetaLength` bits. */
class BpuToFtqBundle(implicit p: Parameters) extends BranchPredictionResp with HasBPUConst {
  val meta = UInt(MaxMetaLength.W)
}

object BpuToFtqBundle {
  /** Wraps `resp` into a [[BpuToFtqBundle]] wire; `meta` is left as `DontCare`. */
  def apply(resp: BranchPredictionResp)(implicit p: Parameters): BpuToFtqBundle = {
    val e = Wire(new BpuToFtqBundle())
    e.s1 := resp.s1
    e.s2 := resp.s2
    e.s3 := resp.s3

    e.meta := DontCare
    e
  }
}

/** [[BranchPredictionBundle]] extended with misprediction and update fields. */
class BranchPredictionUpdate(implicit p: Parameters) extends BranchPredictionBundle with HasBPUConst {
  val mispred_mask = Vec(numBr+1, Bool())
  val false_hit = Bool()
  val new_br_insert_pos = Vec(numBr, Bool())
  val old_entry = Bool()
  val meta = UInt(MaxMetaLength.W)
  val full_target = UInt(VAddrBits.W)

  /** Drives the history and RAS fields from an FTQ redirect SRAM entry.
    *
    * @return this bundle, to allow chaining
    */
  def fromFtqRedirectSram(entry: Ftq_Redirect_SRAMEntry) = {
    folded_hist := entry.folded_hist
    histPtr := entry.histPtr
    phist := entry.phist
    rasSp := entry.rasSp
    rasTop := entry.rasEntry
    specCnt := entry.specCnt
    this
  }

  override def display(cond: Bool) = {
    XSDebug(cond, p"-----------BranchPredictionUpdate-----------\n")
    XSDebug(cond, p"[mispred_mask] ${Binary(mispred_mask.asUInt)} [false_hit] $false_hit\n")
    XSDebug(cond, p"[new_br_insert_pos] ${Binary(new_br_insert_pos.asUInt)}\n")
    super.display(cond)
    XSDebug(cond, p"--------------------------------------------\n")
  }
}

/** [[Redirect]] extended with a debug `display` helper. */
class BranchPredictionRedirect(implicit p: Parameters) extends Redirect with HasBPUConst {
  // override def toPrintable: Printable = {
  //   p"-----------BranchPredictionRedirect----------- " +
  //     p"-----------cfiUpdate----------- " +
  //     p"[pc] ${Hexadecimal(cfiUpdate.pc)} " +
  //     p"[predTaken] ${cfiUpdate.predTaken}, [taken] ${cfiUpdate.taken}, [isMisPred] ${cfiUpdate.isMisPred} " +
  //     p"[target] ${Hexadecimal(cfiUpdate.target)} " +
  //     p"------------------------------- " +
  //     p"[robPtr] f=${robIdx.flag} v=${robIdx.value} " +
  //     p"[ftqPtr] f=${ftqIdx.flag} v=${ftqIdx.value} " +
  //     p"[ftqOffset] ${ftqOffset} " +
  //     p"[level] ${level}, [interrupt] ${interrupt} " +
  //     p"[stFtqIdx] f=${stFtqIdx.flag} v=${stFtqIdx.value} " +
  //     p"[stFtqOffset] ${stFtqOffset} " +
  //     p"\n"

  // }

  /** Prints the redirect fields through `XSDebug` when `cond` holds. */
  def display(cond: Bool): Unit = {
    XSDebug(cond, p"-----------BranchPredictionRedirect----------- \n")
    XSDebug(cond, p"-----------cfiUpdate----------- \n")
    XSDebug(cond, p"[pc] ${Hexadecimal(cfiUpdate.pc)}\n")
    // XSDebug(cond, p"[hist] ${Binary(cfiUpdate.hist.predHist)}\n")
    XSDebug(cond, p"[br_hit] ${cfiUpdate.br_hit} [isMisPred] ${cfiUpdate.isMisPred}\n")
    XSDebug(cond, p"[pred_taken] ${cfiUpdate.predTaken} [taken] ${cfiUpdate.taken} [isMisPred] ${cfiUpdate.isMisPred}\n")
    XSDebug(cond, p"[target] ${Hexadecimal(cfiUpdate.target)} \n")
    XSDebug(cond, p"[shift] ${cfiUpdate.shift}\n")
    XSDebug(cond, p"------------------------------- \n")
    XSDebug(cond, p"[robPtr] f=${robIdx.flag} v=${robIdx.value}\n")
    XSDebug(cond, p"[ftqPtr] f=${ftqIdx.flag} v=${ftqIdx.value} \n")
    XSDebug(cond, p"[ftqOffset] ${ftqOffset} \n")
    XSDebug(cond, p"[stFtqIdx] f=${stFtqIdx.flag} v=${stFtqIdx.value}\n")
    XSDebug(cond, p"[stFtqOffset] ${stFtqOffset}\n")
    XSDebug(cond, p"---------------------------------------------- \n")
  }
}