1package xiangshan.frontend 2 3import chisel3._ 4import chisel3.util._ 5import device.RAMHelper 6import xiangshan._ 7import utils._ 8 9trait HasIFUConst { this: XSModule => 10 val resetVector = 0x80000000L//TODO: set reset vec 11 val groupAlign = log2Up(FetchWidth * 4 * 2) 12 def groupPC(pc: UInt): UInt = Cat(pc(VAddrBits-1, groupAlign), 0.U(groupAlign.W)) 13 // each 1 bit in mask stands for 2 Bytes 14 def mask(pc: UInt): UInt = (Fill(PredictWidth * 2, 1.U(1.W)) >> pc(groupAlign - 1, 1))(PredictWidth - 1, 0) 15 def snpc(pc: UInt): UInt = pc + (PopCount(mask(pc)) << 1) 16} 17 18class IFUIO extends XSBundle 19{ 20 val fetchPacket = DecoupledIO(new FetchPacket) 21 val redirect = Flipped(ValidIO(new Redirect)) 22 val outOfOrderBrInfo = Flipped(ValidIO(new BranchUpdateInfo)) 23 val inOrderBrInfo = Flipped(ValidIO(new BranchUpdateInfo)) 24 val icacheReq = DecoupledIO(new FakeIcacheReq) 25 val icacheResp = Flipped(DecoupledIO(new FakeIcacheResp)) 26 val icacheFlush = Output(UInt(2.W)) 27} 28 29 30class IFU extends XSModule with HasIFUConst 31{ 32 val io = IO(new IFUIO) 33 val bpu = if (EnableBPU) Module(new BPU) else Module(new FakeBPU) 34 val pd = Module(new PreDecode) 35 36 val if2_redirect, if3_redirect, if4_redirect = WireInit(false.B) 37 val if1_flush, if2_flush, if3_flush, if4_flush = WireInit(false.B) 38 39 if4_flush := io.redirect.valid 40 if3_flush := if4_flush || if4_redirect 41 if2_flush := if3_flush || if3_redirect 42 if1_flush := if2_flush || if2_redirect 43 44 //********************** IF1 ****************************// 45 val if1_valid = !reset.asBool 46 val if1_npc = WireInit(0.U(VAddrBits.W)) 47 val if2_ready = WireInit(false.B) 48 val if1_fire = if1_valid && (if2_ready || if1_flush) && io.icacheReq.ready 49 50 // val extHist = VecInit(Fill(ExtHistoryLength, RegInit(0.U(1.W)))) 51 val extHist = RegInit(VecInit(Seq.fill(ExtHistoryLength)(0.U(1.W)))) 52 val headPtr = RegInit(0.U(log2Up(ExtHistoryLength).W)) 53 val shiftPtr = WireInit(false.B) 54 val newPtr = Wire(UInt(log2Up(ExtHistoryLength).W)) 55 val ptr = Mux(shiftPtr, newPtr, headPtr) 56 when (shiftPtr) { headPtr := newPtr } 57 val hist = Wire(Vec(HistoryLength, UInt(1.W))) 58 for (i <- 0 until HistoryLength) { 59 hist(i) := extHist(ptr + i.U) 60 } 61 62 newPtr := headPtr 63 shiftPtr := false.B 64 65 //********************** IF2 ****************************// 66 val if2_valid = RegEnable(next = if1_valid, init = false.B, enable = if1_fire) 67 val if3_ready = WireInit(false.B) 68 val if2_fire = if2_valid && if3_ready 69 val if2_pc = RegEnable(next = if1_npc, init = resetVector.U, enable = if1_fire) 70 val if2_snpc = snpc(if2_pc) 71 val if2_histPtr = RegEnable(ptr, if1_fire) 72 if2_ready := if2_fire || !if2_valid 73 when (if2_flush) { if2_valid := if1_fire } 74 75 when (RegNext(reset.asBool) && !reset.asBool) { 76 if1_npc := resetVector.U(VAddrBits.W) 77 }.elsewhen (if2_fire) { 78 if1_npc := if2_snpc 79 }.otherwise { 80 if1_npc := RegNext(if1_npc) 81 } 82 83 val if2_bp = bpu.io.out(0).bits 84 if2_redirect := if2_fire && bpu.io.out(0).valid && if2_bp.redirect && !if2_bp.saveHalfRVI 85 when (if2_redirect) { 86 if1_npc := if2_bp.target 87 } 88 89 when (if2_fire && (if2_bp.taken || if2_bp.hasNotTakenBrs)) { 90 shiftPtr := true.B 91 newPtr := headPtr - 1.U 92 hist(0) := if2_bp.taken.asUInt 93 extHist(newPtr) := if2_bp.taken.asUInt 94 } 95 96 //********************** IF3 ****************************// 97 val if3_valid = RegEnable(next = if2_valid, init = false.B, enable = if2_fire) 98 val if4_ready = WireInit(false.B) 99 val if3_fire = if3_valid && if4_ready && io.icacheResp.valid 100 val if3_pc = RegEnable(if2_pc, if2_fire) 101 val if3_histPtr = RegEnable(if2_histPtr, if2_fire) 102 if3_ready := if3_fire || !if3_valid 103 when (if3_flush) { if3_valid := false.B } 104 105 val if3_bp = bpu.io.out(1).bits 106 val prev_half_valid = RegInit(false.B) 107 val prev_half_redirect = RegInit(false.B) 108 val prev_half_fetchpc = Reg(UInt(VAddrBits.W)) 109 val prev_half_idx = Reg(UInt(log2Up(PredictWidth).W)) 110 val prev_half_tgt = Reg(UInt(VAddrBits.W)) 111 val prev_half_taken = RegInit(false.B) 112 val prev_half_instr = Reg(UInt(16.W)) 113 when (if3_flush) { 114 prev_half_valid := false.B 115 prev_half_redirect := false.B 116 }.elsewhen (if3_fire && if3_bp.saveHalfRVI) { 117 prev_half_valid := true.B 118 prev_half_redirect := if3_bp.redirect && bpu.io.out(1).valid 119 prev_half_fetchpc := if3_pc 120 val idx = Mux(if3_bp.redirect && bpu.io.out(1).valid, if3_bp.jmpIdx, PopCount(mask(if3_pc)) - 1.U) 121 prev_half_idx := idx 122 prev_half_tgt := if3_bp.target 123 prev_half_taken := if3_bp.taken 124 prev_half_instr := pd.io.out.instrs(idx)(15, 0) 125 }.elsewhen (if3_fire) { 126 prev_half_valid := false.B 127 prev_half_redirect := false.B 128 } 129 130 // if3_redirect := if3_fire && (prev_half_valid && prev_half_taken || bpu.io.out(1).valid && if3_bp.redirect && !if3_bp.saveHalfRVI) 131 // when (if3_redirect) { 132 // if1_npc := Mux(prev_half_valid && prev_half_redirect, prev_half_tgt, if3_bp.target) 133 // } 134 135 when (bpu.io.out(1).valid && if3_fire) { 136 when (prev_half_valid && prev_half_taken) { 137 if3_redirect := true.B 138 if1_npc := prev_half_tgt 139 shiftPtr := true.B 140 newPtr := if3_histPtr - 1.U 141 hist(0) := 1.U 142 extHist(newPtr) := 1.U 143 }.elsewhen (if3_bp.redirect && !if3_bp.saveHalfRVI) { 144 if3_redirect := true.B 145 if1_npc := if3_bp.target 146 shiftPtr := true.B 147 newPtr := Mux(if3_bp.taken || if3_bp.hasNotTakenBrs, if3_histPtr - 1.U, if3_histPtr) 148 hist(0) := Mux(if3_bp.taken || if3_bp.hasNotTakenBrs, if3_bp.taken.asUInt, extHist(if3_histPtr)) 149 extHist(newPtr) := Mux(if3_bp.taken || if3_bp.hasNotTakenBrs, if3_bp.taken.asUInt, extHist(if3_histPtr)) 150 }.elsewhen (if3_bp.saveHalfRVI) { 151 if3_redirect := true.B 152 if1_npc := snpc(if3_pc) 153 shiftPtr := true.B 154 newPtr := Mux(if3_bp.hasNotTakenBrs, if3_histPtr - 1.U, if3_histPtr) 155 hist(0) := Mux(if3_bp.hasNotTakenBrs, 0.U, extHist(if3_histPtr)) 156 extHist(newPtr) := Mux(if3_bp.hasNotTakenBrs, 0.U, extHist(if3_histPtr)) 157 }.otherwise { 158 if3_redirect := false.B 159 } 160 }.otherwise { 161 if3_redirect := false.B 162 } 163 164 165 //********************** IF4 ****************************// 166 val if4_pd = RegEnable(pd.io.out, if3_fire) 167 // val if4_icacheResp = RegEnable(io.icacheResp.bits, if3_fire) 168 val if4_valid = RegEnable(next = if3_valid, init = false.B, enable = if3_fire) 169 val if4_fire = if4_valid && io.fetchPacket.ready 170 val if4_pc = RegEnable(if3_pc, if3_fire) 171 val if4_histPtr = RegEnable(if3_histPtr, if3_fire) 172 if4_ready := (if4_fire || !if4_valid) && GTimer() > 500.U 173 when (if4_flush) { if4_valid := false.B } 174 175 val if4_bp = bpu.io.out(2).bits 176 177 when (bpu.io.out(2).valid && if4_fire && if4_bp.redirect) { 178 when (!if4_bp.saveHalfRVI) { 179 if4_redirect := true.B 180 if1_npc := if4_bp.target 181 182 shiftPtr := true.B 183 newPtr := Mux(if4_bp.taken || if4_bp.hasNotTakenBrs, if4_histPtr - 1.U, if4_histPtr) 184 hist(0) := Mux(if4_bp.taken || if4_bp.hasNotTakenBrs, if4_bp.taken.asUInt, extHist(if4_histPtr)) 185 extHist(newPtr) := Mux(if4_bp.taken || if4_bp.hasNotTakenBrs, if4_bp.taken.asUInt, extHist(if4_histPtr)) 186 187 }.otherwise { 188 if4_redirect := true.B 189 if1_npc := snpc(if4_pc) 190 191 prev_half_valid := true.B 192 prev_half_redirect := true.B 193 prev_half_fetchpc := if4_pc 194 val idx = PopCount(mask(if4_pc)) - 1.U 195 prev_half_idx := idx 196 prev_half_tgt := if4_bp.target 197 prev_half_taken := if4_bp.taken 198 prev_half_instr := if4_pd.instrs(idx)(15, 0) 199 200 shiftPtr := true.B 201 newPtr := Mux(if4_bp.hasNotTakenBrs, if4_histPtr - 1.U, if4_histPtr) 202 hist(0) := Mux(if4_bp.hasNotTakenBrs, 0.U, extHist(if4_histPtr)) 203 extHist(newPtr) := Mux(if4_bp.hasNotTakenBrs, 0.U, extHist(if4_histPtr)) 204 } 205 }.otherwise { 206 if4_redirect := false.B 207 } 208 209 when (io.outOfOrderBrInfo.valid) { 210 shiftPtr := true.B 211 newPtr := io.outOfOrderBrInfo.bits.brInfo.histPtr - 1.U 212 hist(0) := io.outOfOrderBrInfo.bits.taken 213 extHist(newPtr) := io.outOfOrderBrInfo.bits.taken 214 } 215 216 when (io.redirect.valid) { 217 if1_npc := io.redirect.bits.target 218 } 219 220 io.icacheReq.valid := if1_valid && if2_ready 221 io.icacheReq.bits.addr := if1_npc 222 io.icacheResp.ready := if3_valid && if4_ready && GTimer() > 500.U 223 io.icacheFlush := Cat(if3_flush, if2_flush) 224 225 val inOrderBrHist = Wire(Vec(HistoryLength, UInt(1.W))) 226 (0 until HistoryLength).foreach(i => inOrderBrHist(i) := extHist(i.U + io.inOrderBrInfo.bits.brInfo.histPtr)) 227 bpu.io.inOrderBrInfo.valid := io.inOrderBrInfo.valid 228 bpu.io.inOrderBrInfo.bits := Cat(inOrderBrHist.asUInt, io.inOrderBrInfo.bits.asUInt).asTypeOf(new BranchUpdateInfoWithHist) 229 // bpu.io.flush := Cat(if4_flush, if3_flush, if2_flush) 230 bpu.io.flush := VecInit(if2_flush, if3_flush, if4_flush) 231 bpu.io.in.valid := if1_fire 232 bpu.io.in.bits.pc := if1_npc 233 bpu.io.in.bits.hist := hist.asUInt 234 bpu.io.in.bits.inMask := mask(if1_npc) 235 bpu.io.out(0).ready := if2_fire 236 bpu.io.out(1).ready := if3_fire 237 bpu.io.out(2).ready := if4_fire 238 bpu.io.predecode.valid := if4_valid 239 bpu.io.predecode.bits.mask := if4_pd.mask 240 bpu.io.predecode.bits.pd := if4_pd.pd 241 bpu.io.branchInfo.ready := if4_fire 242 243 pd.io.in := io.icacheResp.bits 244 pd.io.prev.valid := prev_half_valid 245 pd.io.prev.bits := prev_half_instr 246 247 io.fetchPacket.valid := if4_valid && !io.redirect.valid 248 io.fetchPacket.bits.instrs := if4_pd.instrs 249 io.fetchPacket.bits.mask := if4_pd.mask & (Fill(PredictWidth, !if4_bp.taken) | (Fill(PredictWidth, 1.U(1.W)) >> (~if4_bp.jmpIdx))) 250 io.fetchPacket.bits.pc := if4_pd.pc 251 (0 until PredictWidth).foreach(i => io.fetchPacket.bits.pnpc(i) := if4_pd.pc(i) + Mux(if4_pd.pd(i).isRVC, 2.U, 4.U)) 252 when (if4_bp.taken) { 253 io.fetchPacket.bits.pnpc(if4_bp.jmpIdx) := if4_bp.target 254 } 255 io.fetchPacket.bits.brInfo := bpu.io.branchInfo.bits 256 (0 until PredictWidth).foreach(i => io.fetchPacket.bits.brInfo(i).histPtr := if4_histPtr) 257 io.fetchPacket.bits.pd := if4_pd.pd 258 259 // debug info 260 XSDebug(RegNext(reset.asBool) && !reset.asBool, "Reseting...\n") 261 XSDebug(io.icacheFlush(0).asBool, "Flush icache stage2...\n") 262 XSDebug(io.icacheFlush(1).asBool, "Flush icache stage3...\n") 263 XSDebug(io.redirect.valid, "Rediret from backend! isExcp=%d isMisPred=%d isReplay=%d pc=%x\n", 264 io.redirect.bits.isException, io.redirect.bits.isMisPred, io.redirect.bits.isReplay, io.redirect.bits.pc) 265 XSDebug(io.redirect.valid, p"Rediret from backend! target=${Hexadecimal(io.redirect.bits.target)} brTag=${io.redirect.bits.brTag}\n") 266 267 XSDebug("[IF1] v=%d fire=%d flush=%d pc=%x ptr=%d mask=%b\n", if1_valid, if1_fire, if1_flush, if1_npc, ptr, mask(if1_npc)) 268 XSDebug("[IF2] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x ptr=%d snpc=%x\n", if2_valid, if2_ready, if2_fire, if2_redirect, if2_flush, if2_pc, if2_histPtr, if2_snpc) 269 XSDebug("[IF3] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x ptr=%d\n", if3_valid, if3_ready, if3_fire, if3_redirect, if3_flush, if3_pc, if3_histPtr) 270 XSDebug("[IF4] v=%d r=%d fire=%d redirect=%d flush=%d pc=%x ptr=%d\n", if4_valid, if4_ready, if4_fire, if4_redirect, if4_flush, if4_pc, if4_histPtr) 271 272 XSDebug("[IF1][icacheReq] v=%d r=%d addr=%x\n", io.icacheReq.valid, io.icacheReq.ready, io.icacheReq.bits.addr) 273 XSDebug("[IF1][ghr] headPtr=%d shiftPtr=%d newPtr=%d ptr=%d\n", headPtr, shiftPtr, newPtr, ptr) 274 XSDebug("[IF1][ghr] hist=%b\n", hist.asUInt) 275 XSDebug("[IF1][ghr] extHist=%b\n\n", extHist.asUInt) 276 277 XSDebug("[IF2][bp] redirect=%d taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n\n", if2_bp.redirect, if2_bp.taken, if2_bp.jmpIdx, if2_bp.hasNotTakenBrs, if2_bp.target, if2_bp.saveHalfRVI) 278 279 XSDebug("[IF3][icacheResp] v=%d r=%d pc=%x mask=%b\n", io.icacheResp.valid, io.icacheResp.ready, io.icacheResp.bits.pc, io.icacheResp.bits.mask) 280 XSDebug("[IF3][bp] redirect=%d taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if3_bp.redirect, if3_bp.taken, if3_bp.jmpIdx, if3_bp.hasNotTakenBrs, if3_bp.target, if3_bp.saveHalfRVI) 281 XSDebug("[IF3][prevHalfInstr] v=%d redirect=%d fetchpc=%x idx=%d tgt=%x taken=%d instr=%x\n\n", 282 prev_half_valid, prev_half_redirect, prev_half_fetchpc, prev_half_idx, prev_half_tgt, prev_half_taken, prev_half_instr) 283 284 XSDebug("[IF4][predecode] mask=%b\n", if4_pd.mask) 285 XSDebug("[IF4][bp] redirect=%d taken=%d jmpIdx=%d hasNTBrs=%d target=%x saveHalfRVI=%d\n", if4_bp.redirect, if4_bp.taken, if4_bp.jmpIdx, if4_bp.hasNotTakenBrs, if4_bp.target, if4_bp.saveHalfRVI) 286 XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] v=%d r=%d mask=%b\n", io.fetchPacket.valid, io.fetchPacket.ready, io.fetchPacket.bits.mask) 287 for (i <- 0 until PredictWidth) { 288 XSDebug(io.fetchPacket.fire(), "[IF4][fetchPacket] %b %x pc=%x pnpc=%x pd: rvc=%d brType=%b call=%d ret=%d\n", 289 io.fetchPacket.bits.mask(i), 290 io.fetchPacket.bits.instrs(i), 291 io.fetchPacket.bits.pc(i), 292 io.fetchPacket.bits.pnpc(i), 293 io.fetchPacket.bits.pd(i).isRVC, 294 io.fetchPacket.bits.pd(i).brType, 295 io.fetchPacket.bits.pd(i).isCall, 296 io.fetchPacket.bits.pd(i).isRet 297 ) 298 } 299}