11d8f4dcbSJay/*************************************************************************************** 21d8f4dcbSJay* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 31d8f4dcbSJay* Copyright (c) 2020-2021 Peng Cheng Laboratory 41d8f4dcbSJay* 51d8f4dcbSJay* XiangShan is licensed under Mulan PSL v2. 61d8f4dcbSJay* You can use this software according to the terms and conditions of the Mulan PSL v2. 71d8f4dcbSJay* You may obtain a copy of Mulan PSL v2 at: 81d8f4dcbSJay* http://license.coscl.org.cn/MulanPSL2 91d8f4dcbSJay* 101d8f4dcbSJay* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 111d8f4dcbSJay* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 121d8f4dcbSJay* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 131d8f4dcbSJay* 141d8f4dcbSJay* See the Mulan PSL v2 for more details. 151d8f4dcbSJay***************************************************************************************/ 161d8f4dcbSJay 171d8f4dcbSJaypackage xiangshan.frontend.icache 181d8f4dcbSJay 191d8f4dcbSJayimport chipsalliance.rocketchip.config.Parameters 201d8f4dcbSJayimport chisel3._ 211d8f4dcbSJayimport chisel3.util._ 221d8f4dcbSJayimport freechips.rocketchip.diplomacy.IdRange 231d8f4dcbSJayimport freechips.rocketchip.tilelink.ClientStates._ 241d8f4dcbSJayimport freechips.rocketchip.tilelink.TLPermissions._ 251d8f4dcbSJayimport freechips.rocketchip.tilelink._ 261d8f4dcbSJayimport xiangshan._ 271d8f4dcbSJayimport huancun.{AliasKey, DirtyKey} 281d8f4dcbSJayimport xiangshan.cache._ 291d8f4dcbSJayimport utils._ 30*41cb8b61SJeniusimport difftest._ 311d8f4dcbSJay 321d8f4dcbSJay 331d8f4dcbSJayabstract class ICacheMissUnitModule(implicit p: Parameters) extends XSModule 341d8f4dcbSJay with HasICacheParameters 351d8f4dcbSJay 361d8f4dcbSJayabstract class ICacheMissUnitBundle(implicit p: Parameters) extends XSBundle 371d8f4dcbSJay with HasICacheParameters 381d8f4dcbSJay 391d8f4dcbSJayclass ICacheMissReq(implicit p: Parameters) extends ICacheBundle 401d8f4dcbSJay{ 411d8f4dcbSJay val paddr = UInt(PAddrBits.W) 421d8f4dcbSJay val vaddr = UInt(VAddrBits.W) 431d8f4dcbSJay val waymask = UInt(nWays.W) 441d8f4dcbSJay val coh = new ClientMetadata 451d8f4dcbSJay 461d8f4dcbSJay def getVirSetIdx = get_idx(vaddr) 471d8f4dcbSJay def getPhyTag = get_phy_tag(paddr) 481d8f4dcbSJay} 491d8f4dcbSJay 501d8f4dcbSJay 511d8f4dcbSJayclass ICacheMissResp(implicit p: Parameters) extends ICacheBundle 521d8f4dcbSJay{ 531d8f4dcbSJay val data = UInt(blockBits.W) 5458dbdfc2SJay val corrupt = Bool() 551d8f4dcbSJay} 561d8f4dcbSJay 571d8f4dcbSJayclass ICacheMissBundle(implicit p: Parameters) extends ICacheBundle{ 581d8f4dcbSJay val req = Vec(2, Flipped(DecoupledIO(new ICacheMissReq))) 591d8f4dcbSJay val resp = Vec(2,ValidIO(new ICacheMissResp)) 601d8f4dcbSJay val flush = Input(Bool()) 611d8f4dcbSJay} 621d8f4dcbSJay 631d8f4dcbSJay 641d8f4dcbSJayclass ICacheMissEntry(edge: TLEdgeOut, id: Int)(implicit p: Parameters) extends ICacheMissUnitModule 651d8f4dcbSJay with MemoryOpConstants 661d8f4dcbSJay{ 671d8f4dcbSJay val io = IO(new Bundle { 687052722fSJay val id = Input(UInt(log2Ceil(PortNumber).W)) 691d8f4dcbSJay 701d8f4dcbSJay val req = Flipped(DecoupledIO(new ICacheMissReq)) 711d8f4dcbSJay val resp = ValidIO(new ICacheMissResp) 721d8f4dcbSJay 731d8f4dcbSJay //tilelink channel 741d8f4dcbSJay val mem_acquire = DecoupledIO(new TLBundleA(edge.bundle)) 751d8f4dcbSJay val mem_grant = Flipped(DecoupledIO(new TLBundleD(edge.bundle))) 761d8f4dcbSJay val mem_finish = DecoupledIO(new TLBundleE(edge.bundle)) 771d8f4dcbSJay 781d8f4dcbSJay val meta_write = DecoupledIO(new ICacheMetaWriteBundle) 791d8f4dcbSJay val data_write = DecoupledIO(new ICacheDataWriteBundle) 801d8f4dcbSJay 812a25dbb4SJay val release_req = DecoupledIO(new ReplacePipeReq) 822a25dbb4SJay val release_resp = Flipped(ValidIO(UInt(ReplaceIdWid.W))) 832a25dbb4SJay val victimInfor = Output(new ICacheVictimInfor()) 847052722fSJay 8500240ba6SJay val toPrefetch = ValidIO(UInt(PAddrBits.W)) 8600240ba6SJay 871d8f4dcbSJay }) 881d8f4dcbSJay 891d8f4dcbSJay /** default value for control signals */ 901d8f4dcbSJay io.resp := DontCare 911d8f4dcbSJay io.mem_acquire.bits := DontCare 921d8f4dcbSJay io.mem_grant.ready := true.B 931d8f4dcbSJay io.meta_write.bits := DontCare 941d8f4dcbSJay io.data_write.bits := DontCare 951d8f4dcbSJay 962a25dbb4SJay val s_idle :: s_send_mem_aquire :: s_wait_mem_grant :: s_write_back :: s_send_grant_ack :: s_send_replace :: s_wait_replace :: s_wait_resp :: Nil = Enum(8) 971d8f4dcbSJay val state = RegInit(s_idle) 981d8f4dcbSJay /** control logic transformation */ 991d8f4dcbSJay //request register 1001d8f4dcbSJay val req = Reg(new ICacheMissReq) 1011d8f4dcbSJay val req_idx = req.getVirSetIdx //virtual index 1021d8f4dcbSJay val req_tag = req.getPhyTag //physical tag 1031d8f4dcbSJay val req_waymask = req.waymask 1047052722fSJay val release_id = Cat(MainPipeKey.U, id.U) 10558dbdfc2SJay val req_corrupt = RegInit(false.B) 1061d8f4dcbSJay 1072a25dbb4SJay io.victimInfor.valid := state === s_send_replace || state === s_wait_replace || state === s_wait_resp 1082a25dbb4SJay io.victimInfor.vidx := req_idx 1091d8f4dcbSJay 1101d8f4dcbSJay val (_, _, refill_done, refill_address_inc) = edge.addr_inc(io.mem_grant) 1111d8f4dcbSJay 1121d8f4dcbSJay //cacheline register 1131d8f4dcbSJay val readBeatCnt = Reg(UInt(log2Up(refillCycles).W)) 1141d8f4dcbSJay val respDataReg = Reg(Vec(refillCycles, UInt(beatBits.W))) 1151d8f4dcbSJay 1161d8f4dcbSJay //initial 1171d8f4dcbSJay io.resp.bits := DontCare 1181d8f4dcbSJay io.mem_acquire.bits := DontCare 1191d8f4dcbSJay io.mem_grant.ready := true.B 1201d8f4dcbSJay io.meta_write.bits := DontCare 1211d8f4dcbSJay io.data_write.bits := DontCare 1221d8f4dcbSJay 1232a25dbb4SJay io.release_req.bits.paddr := req.paddr 1242a25dbb4SJay io.release_req.bits.vaddr := req.vaddr 1252a25dbb4SJay io.release_req.bits.voluntary := true.B 1262a25dbb4SJay io.release_req.bits.waymask := req.waymask 1270bebd829SJay io.release_req.bits.needData := false.B 1282a25dbb4SJay io.release_req.bits.id := release_id 1292a25dbb4SJay io.release_req.bits.param := DontCare //release will not care tilelink param 1301d8f4dcbSJay 1311d8f4dcbSJay io.req.ready := (state === s_idle) 1322a25dbb4SJay io.mem_acquire.valid := (state === s_send_mem_aquire) 1332a25dbb4SJay io.release_req.valid := (state === s_send_replace) 1341d8f4dcbSJay 13500240ba6SJay io.toPrefetch.valid := (state =/= s_idle) 13600240ba6SJay io.toPrefetch.bits := addrAlign(req.paddr, blockBytes, PAddrBits) 13700240ba6SJay 1381d8f4dcbSJay val grantack = RegEnable(edge.GrantAck(io.mem_grant.bits), io.mem_grant.fire()) 1391d8f4dcbSJay val grant_param = Reg(UInt(TLPermissions.bdWidth.W)) 1401d8f4dcbSJay val is_dirty = RegInit(false.B) 1411d8f4dcbSJay val is_grant = RegEnable(edge.isRequest(io.mem_grant.bits), io.mem_grant.fire()) 1421d8f4dcbSJay 1431d8f4dcbSJay //state change 1441d8f4dcbSJay switch(state) { 1451d8f4dcbSJay is(s_idle) { 1461d8f4dcbSJay when(io.req.fire()) { 1471d8f4dcbSJay readBeatCnt := 0.U 1481d8f4dcbSJay state := s_send_mem_aquire 1491d8f4dcbSJay req := io.req.bits 1501d8f4dcbSJay } 1511d8f4dcbSJay } 1521d8f4dcbSJay 1531d8f4dcbSJay // memory request 1541d8f4dcbSJay is(s_send_mem_aquire) { 1551d8f4dcbSJay when(io.mem_acquire.fire()) { 1561d8f4dcbSJay state := s_wait_mem_grant 1571d8f4dcbSJay } 1581d8f4dcbSJay } 1591d8f4dcbSJay 1601d8f4dcbSJay is(s_wait_mem_grant) { 1611d8f4dcbSJay when(edge.hasData(io.mem_grant.bits)) { 1621d8f4dcbSJay when(io.mem_grant.fire()) { 1631d8f4dcbSJay readBeatCnt := readBeatCnt + 1.U 1641d8f4dcbSJay respDataReg(readBeatCnt) := io.mem_grant.bits.data 16558dbdfc2SJay req_corrupt := io.mem_grant.bits.corrupt 1661d8f4dcbSJay grant_param := io.mem_grant.bits.param 1671d8f4dcbSJay is_dirty := io.mem_grant.bits.echo.lift(DirtyKey).getOrElse(false.B) 1681d8f4dcbSJay when(readBeatCnt === (refillCycles - 1).U) { 1691d8f4dcbSJay assert(refill_done, "refill not done!") 1702a25dbb4SJay state := s_send_grant_ack 1711d8f4dcbSJay } 1721d8f4dcbSJay } 1731d8f4dcbSJay } 1741d8f4dcbSJay } 1751d8f4dcbSJay 1761d8f4dcbSJay is(s_send_grant_ack) { 1771d8f4dcbSJay when(io.mem_finish.fire()) { 1786cc2baa1SJay state := s_send_replace 1791d8f4dcbSJay } 1801d8f4dcbSJay } 1811d8f4dcbSJay 1822a25dbb4SJay is(s_send_replace){ 1832a25dbb4SJay when(io.release_req.fire()){ 1842a25dbb4SJay state := s_wait_replace 1852a25dbb4SJay } 1862a25dbb4SJay } 1872a25dbb4SJay 1882a25dbb4SJay is(s_wait_replace){ 1892a25dbb4SJay when(io.release_resp.valid && io.release_resp.bits === release_id){ 1902a25dbb4SJay state := s_write_back 1912a25dbb4SJay } 1922a25dbb4SJay } 1932a25dbb4SJay 1942a25dbb4SJay is(s_write_back) { 1952a25dbb4SJay state := Mux(io.meta_write.fire() && io.data_write.fire(), s_wait_resp, s_write_back) 1962a25dbb4SJay } 1972a25dbb4SJay 1981d8f4dcbSJay is(s_wait_resp) { 1991d8f4dcbSJay io.resp.bits.data := respDataReg.asUInt 20058dbdfc2SJay io.resp.bits.corrupt := req_corrupt 2011d8f4dcbSJay when(io.resp.fire()) { 2021d8f4dcbSJay state := s_idle 2031d8f4dcbSJay } 2041d8f4dcbSJay } 2051d8f4dcbSJay } 2061d8f4dcbSJay 2071d8f4dcbSJay /** refill write and meta write */ 2081d8f4dcbSJay val missCoh = ClientMetadata(Nothing) 2091d8f4dcbSJay val grow_param = missCoh.onAccess(M_XRD)._2 2101d8f4dcbSJay val acquireBlock = edge.AcquireBlock( 2111d8f4dcbSJay fromSource = io.id, 2121d8f4dcbSJay toAddress = addrAlign(req.paddr, blockBytes, PAddrBits), 2131d8f4dcbSJay lgSize = (log2Up(cacheParams.blockBytes)).U, 2141d8f4dcbSJay growPermissions = grow_param 2151d8f4dcbSJay )._2 2161d8f4dcbSJay io.mem_acquire.bits := acquireBlock 2171d8f4dcbSJay // resolve cache alias by L2 2181d8f4dcbSJay io.mem_acquire.bits.user.lift(AliasKey).foreach(_ := req.vaddr(13, 12)) 2191d8f4dcbSJay require(nSets <= 256) // icache size should not be more than 128KB 2201d8f4dcbSJay 2211d8f4dcbSJay /** Grant ACK */ 2221d8f4dcbSJay io.mem_finish.valid := (state === s_send_grant_ack) && is_grant 2231d8f4dcbSJay io.mem_finish.bits := grantack 2241d8f4dcbSJay 2251d8f4dcbSJay //resp to ifu 2261d8f4dcbSJay io.resp.valid := state === s_wait_resp 2272a25dbb4SJay /** update coh meta */ 2282a25dbb4SJay def missCohGen(param: UInt, dirty: Bool): UInt = { 2292a25dbb4SJay MuxLookup(Cat(param, dirty), Nothing, Seq( 2302a25dbb4SJay Cat(toB, false.B) -> Branch, 2312a25dbb4SJay Cat(toB, true.B) -> Branch, 2322a25dbb4SJay Cat(toT, false.B) -> Trunk, 2332a25dbb4SJay Cat(toT, true.B) -> Dirty)) 2342a25dbb4SJay } 2352a25dbb4SJay 2362a25dbb4SJay val miss_new_coh = ClientMetadata(missCohGen(grant_param, is_dirty)) 2372a25dbb4SJay 2382a25dbb4SJay io.meta_write.valid := (state === s_write_back) 2392a25dbb4SJay io.meta_write.bits.generate(tag = req_tag, coh = miss_new_coh, idx = req_idx, waymask = req_waymask, bankIdx = req_idx(0)) 2402a25dbb4SJay 2412a25dbb4SJay io.data_write.valid := (state === s_write_back) 242*41cb8b61SJenius io.data_write.bits.generate(data = respDataReg.asUInt, 243*41cb8b61SJenius idx = req_idx, 244*41cb8b61SJenius waymask = req_waymask, 245*41cb8b61SJenius bankIdx = req_idx(0), 246*41cb8b61SJenius paddr = req.paddr) 2471d8f4dcbSJay 2481d8f4dcbSJay XSPerfAccumulate( 2491d8f4dcbSJay "entryPenalty" + Integer.toString(id, 10), 2501d8f4dcbSJay BoolStopWatch( 2511d8f4dcbSJay start = io.req.fire(), 2521d8f4dcbSJay stop = io.resp.valid, 2531d8f4dcbSJay startHighPriority = true) 2541d8f4dcbSJay ) 2551d8f4dcbSJay XSPerfAccumulate("entryReq" + Integer.toString(id, 10), io.req.fire()) 2561d8f4dcbSJay 2571d8f4dcbSJay} 2581d8f4dcbSJay 2591d8f4dcbSJay 2601d8f4dcbSJayclass ICacheMissUnit(edge: TLEdgeOut)(implicit p: Parameters) extends ICacheMissUnitModule 2611d8f4dcbSJay{ 2621d8f4dcbSJay val io = IO(new Bundle{ 263*41cb8b61SJenius val hartId = Input(UInt(8.W)) 2641d8f4dcbSJay val req = Vec(2, Flipped(DecoupledIO(new ICacheMissReq))) 2651d8f4dcbSJay val resp = Vec(2, ValidIO(new ICacheMissResp)) 2661d8f4dcbSJay 2671d8f4dcbSJay val mem_acquire = DecoupledIO(new TLBundleA(edge.bundle)) 2681d8f4dcbSJay val mem_grant = Flipped(DecoupledIO(new TLBundleD(edge.bundle))) 2691d8f4dcbSJay val mem_finish = DecoupledIO(new TLBundleE(edge.bundle)) 2701d8f4dcbSJay 2711d8f4dcbSJay val meta_write = DecoupledIO(new ICacheMetaWriteBundle) 2721d8f4dcbSJay val data_write = DecoupledIO(new ICacheDataWriteBundle) 2731d8f4dcbSJay 2742a25dbb4SJay val release_req = DecoupledIO(new ReplacePipeReq) 2752a25dbb4SJay val release_resp = Flipped(ValidIO(UInt(ReplaceIdWid.W))) 2761d8f4dcbSJay 2772a25dbb4SJay val victimInfor = Vec(PortNumber, Output(new ICacheVictimInfor())) 2782a25dbb4SJay 2797052722fSJay val prefetch_req = Flipped(DecoupledIO(new PIQReq)) 28000240ba6SJay val prefetch_check = Vec(PortNumber,ValidIO(UInt(PAddrBits.W))) 28100240ba6SJay 2827052722fSJay 2831d8f4dcbSJay }) 2841d8f4dcbSJay // assign default values to output signals 2851d8f4dcbSJay io.mem_grant.ready := false.B 2861d8f4dcbSJay 2871d8f4dcbSJay val meta_write_arb = Module(new Arbiter(new ICacheMetaWriteBundle, PortNumber)) 2881d8f4dcbSJay val refill_arb = Module(new Arbiter(new ICacheDataWriteBundle, PortNumber)) 2892a25dbb4SJay val release_arb = Module(new Arbiter(new ReplacePipeReq, PortNumber)) 2901d8f4dcbSJay 2911d8f4dcbSJay io.mem_grant.ready := true.B 2921d8f4dcbSJay 2932a25dbb4SJay val entries = (0 until PortNumber) map { i => 2941d8f4dcbSJay val entry = Module(new ICacheMissEntry(edge, i)) 2951d8f4dcbSJay 2961d8f4dcbSJay entry.io.id := i.U 2971d8f4dcbSJay 2981d8f4dcbSJay // entry req 2991d8f4dcbSJay entry.io.req.valid := io.req(i).valid 3001d8f4dcbSJay entry.io.req.bits := io.req(i).bits 3011d8f4dcbSJay io.req(i).ready := entry.io.req.ready 3021d8f4dcbSJay 3031d8f4dcbSJay // entry resp 3041d8f4dcbSJay meta_write_arb.io.in(i) <> entry.io.meta_write 3051d8f4dcbSJay refill_arb.io.in(i) <> entry.io.data_write 3062a25dbb4SJay release_arb.io.in(i) <> entry.io.release_req 3071d8f4dcbSJay 3081d8f4dcbSJay entry.io.mem_grant.valid := false.B 3091d8f4dcbSJay entry.io.mem_grant.bits := DontCare 3101d8f4dcbSJay when (io.mem_grant.bits.source === i.U) { 3111d8f4dcbSJay entry.io.mem_grant <> io.mem_grant 3121d8f4dcbSJay } 3131d8f4dcbSJay 3141d8f4dcbSJay io.resp(i) <> entry.io.resp 3151d8f4dcbSJay 3162a25dbb4SJay io.victimInfor(i) := entry.io.victimInfor 31700240ba6SJay io.prefetch_check(i) <> entry.io.toPrefetch 3182a25dbb4SJay 3192a25dbb4SJay entry.io.release_resp <> io.release_resp 3202a25dbb4SJay 3211d8f4dcbSJay XSPerfAccumulate( 3221d8f4dcbSJay "entryPenalty" + Integer.toString(i, 10), 3231d8f4dcbSJay BoolStopWatch( 3241d8f4dcbSJay start = entry.io.req.fire(), 3251d8f4dcbSJay stop = entry.io.resp.fire(), 3261d8f4dcbSJay startHighPriority = true) 3271d8f4dcbSJay ) 3281d8f4dcbSJay XSPerfAccumulate("entryReq" + Integer.toString(i, 10), entry.io.req.fire()) 3291d8f4dcbSJay 3301d8f4dcbSJay entry 3311d8f4dcbSJay } 3321d8f4dcbSJay 3337052722fSJay val alloc = Wire(UInt(log2Ceil(nPrefetchEntries).W)) 3347052722fSJay 335de7689fcSJay val prefEntries = (PortNumber until PortNumber + nPrefetchEntries) map { i => 3367052722fSJay val prefetchEntry = Module(new IPrefetchEntry(edge, PortNumber)) 3377052722fSJay 3387052722fSJay prefetchEntry.io.mem_hint_ack.valid := false.B 3397052722fSJay prefetchEntry.io.mem_hint_ack.bits := DontCare 3407052722fSJay 3417052722fSJay when(io.mem_grant.bits.source === PortNumber.U) { 3427052722fSJay prefetchEntry.io.mem_hint_ack <> io.mem_grant 3437052722fSJay } 3447052722fSJay 345de7689fcSJay prefetchEntry.io.req.valid := io.prefetch_req.valid && ((i-PortNumber).U === alloc) 3467052722fSJay prefetchEntry.io.req.bits := io.prefetch_req.bits 3477052722fSJay 3487052722fSJay prefetchEntry.io.id := i.U 3497052722fSJay 3507052722fSJay prefetchEntry 3517052722fSJay } 3527052722fSJay 3537052722fSJay alloc := PriorityEncoder(prefEntries.map(_.io.req.ready)) 3547052722fSJay io.prefetch_req.ready := ParallelOR(prefEntries.map(_.io.req.ready)) 3557052722fSJay val tl_a_chanel = entries.map(_.io.mem_acquire) ++ prefEntries.map(_.io.mem_hint) 3567052722fSJay TLArbiter.lowest(edge, io.mem_acquire, tl_a_chanel:_*) 3577052722fSJay 3581d8f4dcbSJay TLArbiter.lowest(edge, io.mem_finish, entries.map(_.io.mem_finish):_*) 3591d8f4dcbSJay 3601d8f4dcbSJay io.meta_write <> meta_write_arb.io.out 3611d8f4dcbSJay io.data_write <> refill_arb.io.out 3622a25dbb4SJay io.release_req <> release_arb.io.out 3631d8f4dcbSJay 364*41cb8b61SJenius if (env.EnableDifftest) { 365*41cb8b61SJenius val difftest = Module(new DifftestRefillEvent) 366*41cb8b61SJenius difftest.io.clock := clock 367*41cb8b61SJenius difftest.io.coreid := io.hartId 368*41cb8b61SJenius difftest.io.cacheid := 0.U 369*41cb8b61SJenius difftest.io.valid := refill_arb.io.out.valid 370*41cb8b61SJenius difftest.io.addr := refill_arb.io.out.bits.paddr 371*41cb8b61SJenius difftest.io.data := refill_arb.io.out.bits.data.asTypeOf(difftest.io.data) 372*41cb8b61SJenius } 373*41cb8b61SJenius 3741d8f4dcbSJay (0 until nWays).map{ w => 3751d8f4dcbSJay XSPerfAccumulate("line_0_refill_way_" + Integer.toString(w, 10), entries(0).io.meta_write.valid && OHToUInt(entries(0).io.meta_write.bits.waymask) === w.U) 3761d8f4dcbSJay XSPerfAccumulate("line_1_refill_way_" + Integer.toString(w, 10), entries(1).io.meta_write.valid && OHToUInt(entries(1).io.meta_write.bits.waymask) === w.U) 3771d8f4dcbSJay } 3781d8f4dcbSJay 3791d8f4dcbSJay} 3801d8f4dcbSJay 3811d8f4dcbSJay 3821d8f4dcbSJay 383