17052722fSJay/*************************************************************************************** 27052722fSJay * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 37052722fSJay * Copyright (c) 2020-2021 Peng Cheng Laboratory 47052722fSJay * 57052722fSJay * XiangShan is licensed under Mulan PSL v2. 67052722fSJay * You can use this software according to the terms and conditions of the Mulan PSL v2. 77052722fSJay * You may obtain a copy of Mulan PSL v2 at: 87052722fSJay * http://license.coscl.org.cn/MulanPSL2 97052722fSJay * 107052722fSJay * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 117052722fSJay * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 127052722fSJay * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 137052722fSJay * 147052722fSJay * See the Mulan PSL v2 for more details. 157052722fSJay ***************************************************************************************/ 167052722fSJay 177052722fSJaypackage xiangshan.frontend.icache 187052722fSJay 197052722fSJayimport chipsalliance.rocketchip.config.Parameters 207052722fSJayimport chisel3._ 217052722fSJayimport chisel3.util._ 227052722fSJayimport freechips.rocketchip.tilelink._ 237052722fSJayimport utils._ 247052722fSJayimport xiangshan.cache.mmu._ 257052722fSJayimport xiangshan.frontend._ 267052722fSJayimport xiangshan.backend.fu.{PMPReqBundle, PMPRespBundle} 27de7689fcSJayimport huancun.{PreferCacheKey} 287052722fSJay 297052722fSJay 307052722fSJayabstract class IPrefetchBundle(implicit p: Parameters) extends ICacheBundle 317052722fSJayabstract class IPrefetchModule(implicit p: Parameters) extends ICacheModule 327052722fSJay 337052722fSJayclass PIQReq(implicit p: Parameters) extends IPrefetchBundle { 347052722fSJay val paddr = UInt(PAddrBits.W) 357052722fSJay} 367052722fSJay 377052722fSJay 387052722fSJayclass IPrefetchToMissUnit(implicit p: Parameters) extends IPrefetchBundle{ 397052722fSJay val enqReq = DecoupledIO(new PIQReq) 407052722fSJay} 417052722fSJay 427052722fSJayclass IPredfetchIO(implicit p: Parameters) extends IPrefetchBundle { 437052722fSJay val fromFtq = Flipped(new FtqPrefechBundle) 44*f1fe8698SLemover val iTLBInter = new TlbRequestIO 4561e1db30SJay val pmp = new ICachePMPBundle 467052722fSJay val toIMeta = Decoupled(new ICacheReadBundle) 477052722fSJay val fromIMeta = Input(new ICacheMetaRespBundle) 487052722fSJay val toMissUnit = new IPrefetchToMissUnit 4900240ba6SJay val fromMSHR = Flipped(Vec(PortNumber,ValidIO(UInt(PAddrBits.W)))) 50a108d429SJay 51a108d429SJay val prefetchEnable = Input(Bool()) 52a108d429SJay val prefetchDisable = Input(Bool()) 537052722fSJay} 547052722fSJay 557052722fSJayclass IPrefetchPipe(implicit p: Parameters) extends IPrefetchModule 567052722fSJay{ 577052722fSJay val io = IO(new IPredfetchIO) 587052722fSJay 59a108d429SJay val enableBit = RegInit(false.B) 60a108d429SJay val maxPrefetchCoutner = RegInit(0.U(log2Ceil(nPrefetchEntries + 1).W)) 61a108d429SJay 62a108d429SJay val reachMaxSize = maxPrefetchCoutner === nPrefetchEntries.U 63a108d429SJay 64a108d429SJay when(io.prefetchEnable){ 65a108d429SJay enableBit := true.B 66a108d429SJay }.elsewhen((enableBit && io.prefetchDisable) || (enableBit && reachMaxSize)){ 67a108d429SJay enableBit := false.B 68a108d429SJay } 69a108d429SJay 70a108d429SJay class PrefetchDir(implicit p: Parameters) extends IPrefetchBundle 71a108d429SJay { 72a108d429SJay val valid = Bool() 73a108d429SJay val paddr = UInt(PAddrBits.W) 74a108d429SJay } 75a108d429SJay 76a108d429SJay val prefetch_dir = RegInit(VecInit(Seq.fill(nPrefetchEntries)(0.U.asTypeOf(new PrefetchDir)))) 77a108d429SJay 787052722fSJay val fromFtq = io.fromFtq 797052722fSJay val (toITLB, fromITLB) = (io.iTLBInter.req, io.iTLBInter.resp) 807052722fSJay val (toIMeta, fromIMeta) = (io.toIMeta, io.fromIMeta.metaData(0)) 817052722fSJay val (toPMP, fromPMP) = (io.pmp.req, io.pmp.resp) 827052722fSJay val toMissUnit = io.toMissUnit 837052722fSJay 847052722fSJay val p0_fire, p1_fire, p2_fire, p3_fire = WireInit(false.B) 857052722fSJay val p1_discard, p2_discard, p3_discard = WireInit(false.B) 867052722fSJay val p0_ready, p1_ready, p2_ready, p3_ready = WireInit(false.B) 877052722fSJay 887052722fSJay /** Prefetch Stage 0: req from Ftq */ 897052722fSJay val p0_valid = fromFtq.req.valid 90d6b06a99SJay val p0_vaddr = addrAlign(fromFtq.req.bits.target, blockBytes, VAddrBits) 91a108d429SJay p0_fire := p0_valid && p1_ready && toITLB.fire() && !fromITLB.bits.miss && toIMeta.ready && enableBit 92e8747464SJenius //discard req when source not ready 93e8747464SJenius // p0_discard := p0_valid && ((toITLB.fire() && fromITLB.bits.miss) || !toIMeta.ready || !enableBit) 947052722fSJay 957052722fSJay toIMeta.valid := p0_valid 967052722fSJay toIMeta.bits.vSetIdx(0) := get_idx(p0_vaddr) 977052722fSJay 987052722fSJay toIMeta.bits.vSetIdx(1) := DontCare 997052722fSJay toIMeta.bits.isDoubleLine := false.B 1007052722fSJay 1017052722fSJay toITLB.valid := p0_valid 1027052722fSJay toITLB.bits.size := 3.U // TODO: fix the size 1037052722fSJay toITLB.bits.vaddr := p0_vaddr 1047052722fSJay toITLB.bits.debug.pc := p0_vaddr 1057052722fSJay 106*f1fe8698SLemover toITLB.bits.kill := DontCare 1077052722fSJay toITLB.bits.cmd := TlbCmd.exec 108*f1fe8698SLemover toITLB.bits.debug.robIdx := DontCare 1097052722fSJay toITLB.bits.debug.isFirstIssue := DontCare 1107052722fSJay 1117052722fSJay 1127052722fSJay fromITLB.ready := true.B 1137052722fSJay 114e8747464SJenius fromFtq.req.ready := true.B //(!enableBit || (enableBit && p3_ready)) && toIMeta.ready //&& GTimer() > 500.U 1157052722fSJay 1167052722fSJay /** Prefetch Stage 1: cache probe filter */ 1177052722fSJay val p1_valid = generatePipeControl(lastFire = p0_fire, thisFire = p1_fire || p1_discard, thisFlush = false.B, lastFlush = false.B) 1187052722fSJay 119005e809bSJiuyang Liu val p1_vaddr = RegEnable(p0_vaddr, p0_fire) 1207052722fSJay 1217052722fSJay //tlb resp 122de7689fcSJay val tlb_resp_valid = RegInit(false.B) 123de7689fcSJay when(p0_fire) {tlb_resp_valid := true.B} 124de7689fcSJay .elsewhen(tlb_resp_valid && (p1_fire || p1_discard)) {tlb_resp_valid := false.B} 1257052722fSJay 126de7689fcSJay val tlb_resp_paddr = ResultHoldBypass(valid = RegNext(p0_fire), data = fromITLB.bits.paddr) 127de7689fcSJay val tlb_resp_pf = ResultHoldBypass(valid = RegNext(p0_fire), data = fromITLB.bits.excp.pf.instr && tlb_resp_valid) 128de7689fcSJay val tlb_resp_af = ResultHoldBypass(valid = RegNext(p0_fire), data = fromITLB.bits.excp.af.instr && tlb_resp_valid) 1297052722fSJay 1307052722fSJay val p1_exception = VecInit(Seq(tlb_resp_pf, tlb_resp_af)) 1317052722fSJay val p1_has_except = p1_exception.reduce(_ || _) 1327052722fSJay 1337052722fSJay val p1_ptag = get_phy_tag(tlb_resp_paddr) 1347052722fSJay 1357052722fSJay val p1_meta_ptags = ResultHoldBypass(data = VecInit(fromIMeta.map(way => way.tag)),valid = RegNext(p0_fire)) 1367052722fSJay val p1_meta_cohs = ResultHoldBypass(data = VecInit(fromIMeta.map(way => way.coh)),valid = RegNext(p0_fire)) 1377052722fSJay 1387052722fSJay val p1_tag_eq_vec = VecInit(p1_meta_ptags.map(_ === p1_ptag )) 1397052722fSJay val p1_tag_match_vec = VecInit(p1_tag_eq_vec.zipWithIndex.map{ case(way_tag_eq, w) => way_tag_eq && p1_meta_cohs(w).isValid()}) 1407052722fSJay val p1_tag_match = ParallelOR(p1_tag_match_vec) 1417052722fSJay val (p1_hit, p1_miss) = (p1_valid && p1_tag_match && !p1_has_except, p1_valid && !p1_tag_match && !p1_has_except) 1427052722fSJay 1437052722fSJay //overriding the invalid req 1447052722fSJay val p1_req_cancle = (p1_hit || (tlb_resp_valid && p1_exception.reduce(_ || _))) && p1_valid 1457052722fSJay val p1_req_accept = p1_valid && tlb_resp_valid && p1_miss 1467052722fSJay 1477052722fSJay p1_ready := p1_fire || p1_req_cancle || !p1_valid 148a108d429SJay p1_fire := p1_valid && p1_req_accept && p2_ready && enableBit 1497052722fSJay p1_discard := p1_valid && p1_req_cancle 1507052722fSJay 1517052722fSJay /** Prefetch Stage 2: filtered req PIQ enqueue */ 1527052722fSJay val p2_valid = generatePipeControl(lastFire = p1_fire, thisFire = p2_fire || p2_discard, thisFlush = false.B, lastFlush = false.B) 15361e1db30SJay val p2_pmp_fire = p2_valid 1547052722fSJay val pmpExcpAF = fromPMP.instr 1557052722fSJay 156005e809bSJiuyang Liu val p2_paddr = RegEnable(tlb_resp_paddr, p1_fire) 157005e809bSJiuyang Liu val p2_except_pf = RegEnable(tlb_resp_pf, p1_fire) 158005e809bSJiuyang Liu val p2_except_af = DataHoldBypass(pmpExcpAF, p2_pmp_fire) || RegEnable(tlb_resp_af, p1_fire) 1597052722fSJay val p2_mmio = DataHoldBypass(io.pmp.resp.mmio && !p2_except_af && !p2_except_pf, p2_pmp_fire) 1607052722fSJay 16100240ba6SJay /*when a prefetch req meet with a miss req in MSHR cancle the prefetch req */ 16200240ba6SJay val p2_check_in_mshr = VecInit(io.fromMSHR.map(mshr => mshr.valid && mshr.bits === addrAlign(p2_paddr, blockBytes, PAddrBits))).reduce(_||_) 16300240ba6SJay 1647052722fSJay //TODO wait PMP logic 1657052722fSJay val p2_exception = VecInit(Seq(pmpExcpAF, p2_mmio)).reduce(_||_) 1667052722fSJay 1677052722fSJay io.pmp.req.valid := p2_pmp_fire 1687052722fSJay io.pmp.req.bits.addr := p2_paddr 1697052722fSJay io.pmp.req.bits.size := 3.U 1707052722fSJay io.pmp.req.bits.cmd := TlbCmd.exec 1717052722fSJay 1727052722fSJay p2_ready := p2_fire || p2_discard || !p2_valid 1737052722fSJay p2_fire := p2_valid && !p2_exception && p3_ready && p2_pmp_fire 17461e1db30SJay p2_discard := p2_valid && (p2_exception && p2_pmp_fire) 1757052722fSJay 1767052722fSJay /** Prefetch Stage 2: filtered req PIQ enqueue */ 177a108d429SJay val p3_valid = generatePipeControl(lastFire = p2_fire, thisFire = p3_fire || p3_discard, thisFlush = false.B, lastFlush = false.B) 1787052722fSJay 179005e809bSJiuyang Liu val p3_paddr = RegEnable(p2_paddr, p2_fire) 180005e809bSJiuyang Liu val p3_check_in_mshr = RegEnable(p2_check_in_mshr, p2_fire) 1817052722fSJay 182a108d429SJay val p3_hit_dir = VecInit((0 until nPrefetchEntries).map(i => prefetch_dir(i).valid && prefetch_dir(i).paddr === p3_paddr )).reduce(_||_) 183a108d429SJay 184e8747464SJenius p3_discard := p3_hit_dir || p3_check_in_mshr || (p3_valid && enableBit && !toMissUnit.enqReq.ready) 185a108d429SJay 186a108d429SJay toMissUnit.enqReq.valid := p3_valid && enableBit && !p3_discard 1877052722fSJay toMissUnit.enqReq.bits.paddr := p3_paddr 1887052722fSJay 189a108d429SJay when(reachMaxSize){ 190a108d429SJay maxPrefetchCoutner := 0.U 191a108d429SJay 192a108d429SJay prefetch_dir.foreach(_.valid := false.B) 193a108d429SJay }.elsewhen(toMissUnit.enqReq.fire()){ 194a108d429SJay maxPrefetchCoutner := maxPrefetchCoutner + 1.U 195a108d429SJay 196a108d429SJay prefetch_dir(maxPrefetchCoutner).valid := true.B 197a108d429SJay prefetch_dir(maxPrefetchCoutner).paddr := p3_paddr 198a108d429SJay } 199a108d429SJay 200a108d429SJay p3_ready := toMissUnit.enqReq.ready || !enableBit 2017052722fSJay p3_fire := toMissUnit.enqReq.fire() 2027052722fSJay 2037052722fSJay} 2047052722fSJay 2057052722fSJayclass IPrefetchEntry(edge: TLEdgeOut, id: Int)(implicit p: Parameters) extends ICacheMissUnitModule 2067052722fSJay{ 2077052722fSJay val io = IO(new Bundle { 2085e649ad5SJay val id = Input(UInt(log2Ceil(PortNumber + nPrefetchEntries).W)) 2097052722fSJay 2107052722fSJay val req = Flipped(DecoupledIO(new PIQReq)) 2117052722fSJay 2127052722fSJay //tilelink channel 2137052722fSJay val mem_hint = DecoupledIO(new TLBundleA(edge.bundle)) 2147052722fSJay val mem_hint_ack = Flipped(DecoupledIO(new TLBundleD(edge.bundle))) 2157052722fSJay 2167052722fSJay }) 2177052722fSJay 2187052722fSJay /** default value for control signals */ 2197052722fSJay io.mem_hint.bits := DontCare 2207052722fSJay io.mem_hint_ack.ready := true.B 2217052722fSJay 2227052722fSJay 2237052722fSJay val s_idle :: s_send_hint :: s_wait_hint_ack :: Nil = Enum(3) 2247052722fSJay val state = RegInit(s_idle) 2257052722fSJay /** control logic transformation */ 2267052722fSJay //request register 2277052722fSJay val req = Reg(new PIQReq) 2287052722fSJay //initial 2297052722fSJay io.mem_hint.bits := DontCare 2307052722fSJay io.mem_hint_ack.ready := true.B 2317052722fSJay 2327052722fSJay io.req.ready := (state === s_idle) 2337052722fSJay io.mem_hint.valid := (state === s_send_hint) 2347052722fSJay 2357052722fSJay //state change 2367052722fSJay switch(state) { 2377052722fSJay is(s_idle) { 2387052722fSJay when(io.req.fire()) { 2397052722fSJay state := s_send_hint 2407052722fSJay req := io.req.bits 2417052722fSJay } 2427052722fSJay } 2437052722fSJay 2447052722fSJay // memory request 2457052722fSJay is(s_send_hint) { 2467052722fSJay when(io.mem_hint.fire()) { 2477052722fSJay state := s_idle 2487052722fSJay } 2497052722fSJay } 2507052722fSJay } 2517052722fSJay 2527052722fSJay /** refill write and meta write */ 2537052722fSJay val hint = edge.Hint( 2547052722fSJay fromSource = io.id, 2557052722fSJay toAddress = addrAlign(req.paddr, blockBytes, PAddrBits) + blockBytes.U, 2567052722fSJay lgSize = (log2Up(cacheParams.blockBytes)).U, 2577052722fSJay param = TLHints.PREFETCH_READ 2587052722fSJay )._2 2597052722fSJay io.mem_hint.bits := hint 260de7689fcSJay io.mem_hint.bits.user.lift(PreferCacheKey).foreach(_ := true.B) 2617052722fSJay 2627052722fSJay 2637052722fSJay XSPerfAccumulate("PrefetchEntryReq" + Integer.toString(id, 10), io.req.fire()) 2647052722fSJay 2657052722fSJay} 266