1*92e3bfefSLemover/*************************************************************************************** 2*92e3bfefSLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3*92e3bfefSLemover* Copyright (c) 2020-2021 Peng Cheng Laboratory 4*92e3bfefSLemover* 5*92e3bfefSLemover* XiangShan is licensed under Mulan PSL v2. 6*92e3bfefSLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 7*92e3bfefSLemover* You may obtain a copy of Mulan PSL v2 at: 8*92e3bfefSLemover* http://license.coscl.org.cn/MulanPSL2 9*92e3bfefSLemover* 10*92e3bfefSLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11*92e3bfefSLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12*92e3bfefSLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13*92e3bfefSLemover* 14*92e3bfefSLemover* See the Mulan PSL v2 for more details. 15*92e3bfefSLemover***************************************************************************************/ 16*92e3bfefSLemover 17*92e3bfefSLemoverpackage xiangshan.cache.mmu 18*92e3bfefSLemover 19*92e3bfefSLemoverimport chipsalliance.rocketchip.config.Parameters 20*92e3bfefSLemoverimport chisel3._ 21*92e3bfefSLemoverimport chisel3.experimental.ExtModule 22*92e3bfefSLemoverimport chisel3.util._ 23*92e3bfefSLemoverimport chisel3.internal.naming.chiselName 24*92e3bfefSLemoverimport xiangshan._ 25*92e3bfefSLemoverimport xiangshan.cache.{HasDCacheParameters, MemoryOpConstants} 26*92e3bfefSLemoverimport utils._ 27*92e3bfefSLemoverimport freechips.rocketchip.diplomacy.{IdRange, LazyModule, LazyModuleImp} 28*92e3bfefSLemoverimport freechips.rocketchip.tilelink._ 29*92e3bfefSLemoverimport xiangshan.backend.fu.{PMP, PMPChecker, PMPReqBundle, PMPRespBundle} 30*92e3bfefSLemoverimport xiangshan.backend.fu.util.HasCSRConst 31*92e3bfefSLemover 32*92e3bfefSLemoverclass L2TLB()(implicit p: Parameters) extends LazyModule with HasPtwConst { 33*92e3bfefSLemover 34*92e3bfefSLemover val node = TLClientNode(Seq(TLMasterPortParameters.v1( 35*92e3bfefSLemover clients = Seq(TLMasterParameters.v1( 36*92e3bfefSLemover "ptw", 37*92e3bfefSLemover sourceId = IdRange(0, MemReqWidth) 38*92e3bfefSLemover )) 39*92e3bfefSLemover ))) 40*92e3bfefSLemover 41*92e3bfefSLemover lazy val module = new L2TLBImp(this) 42*92e3bfefSLemover} 43*92e3bfefSLemover 44*92e3bfefSLemover@chiselName 45*92e3bfefSLemoverclass L2TLBImp(outer: L2TLB)(implicit p: Parameters) extends PtwModule(outer) with HasCSRConst with HasPerfEvents { 46*92e3bfefSLemover 47*92e3bfefSLemover val (mem, edge) = outer.node.out.head 48*92e3bfefSLemover 49*92e3bfefSLemover val io = IO(new L2TLBIO) 50*92e3bfefSLemover val difftestIO = IO(new Bundle() { 51*92e3bfefSLemover val ptwResp = Output(Bool()) 52*92e3bfefSLemover val ptwAddr = Output(UInt(64.W)) 53*92e3bfefSLemover val ptwData = Output(Vec(4, UInt(64.W))) 54*92e3bfefSLemover }) 55*92e3bfefSLemover 56*92e3bfefSLemover /* Ptw processes multiple requests 57*92e3bfefSLemover * Divide Ptw procedure into two stages: cache access ; mem access if cache miss 58*92e3bfefSLemover * miss queue itlb dtlb 59*92e3bfefSLemover * | | | 60*92e3bfefSLemover * ------arbiter------ 61*92e3bfefSLemover * | 62*92e3bfefSLemover * l1 - l2 - l3 - sp 63*92e3bfefSLemover * | 64*92e3bfefSLemover * ------------------------------------------- 65*92e3bfefSLemover * miss | queue | hit 66*92e3bfefSLemover * [][][][][][] | 67*92e3bfefSLemover * | | 68*92e3bfefSLemover * state machine accessing mem | 69*92e3bfefSLemover * | | 70*92e3bfefSLemover * ---------------arbiter--------------------- 71*92e3bfefSLemover * | | 72*92e3bfefSLemover * itlb dtlb 73*92e3bfefSLemover */ 74*92e3bfefSLemover 75*92e3bfefSLemover difftestIO <> DontCare 76*92e3bfefSLemover 77*92e3bfefSLemover val sfence = DelayN(io.sfence, 2) 78*92e3bfefSLemover val csr = DelayN(io.csr.tlb, 2) 79*92e3bfefSLemover val satp = csr.satp 80*92e3bfefSLemover val priv = csr.priv 81*92e3bfefSLemover val flush = sfence.valid || csr.satp.changed 82*92e3bfefSLemover 83*92e3bfefSLemover val pmp = Module(new PMP()) 84*92e3bfefSLemover val pmp_check = VecInit(Seq.fill(2)(Module(new PMPChecker(lgMaxSize = 3, sameCycle = true)).io)) 85*92e3bfefSLemover pmp.io.distribute_csr := io.csr.distribute_csr 86*92e3bfefSLemover pmp_check.foreach(_.check_env.apply(ModeS, pmp.io.pmp, pmp.io.pma)) 87*92e3bfefSLemover 88*92e3bfefSLemover val missQueue = Module(new L2TlbMissQueue) 89*92e3bfefSLemover val cache = Module(new PtwCache) 90*92e3bfefSLemover val ptw = Module(new PTW) 91*92e3bfefSLemover val llptw = Module(new LLPTW) 92*92e3bfefSLemover val arb1 = Module(new Arbiter(new PtwReq, PtwWidth)) 93*92e3bfefSLemover val arb2 = Module(new Arbiter(new Bundle { 94*92e3bfefSLemover val vpn = UInt(vpnLen.W) 95*92e3bfefSLemover val source = UInt(bSourceWidth.W) 96*92e3bfefSLemover }, if (l2tlbParams.enablePrefetch) 3 else 2)) 97*92e3bfefSLemover val outArb = (0 until PtwWidth).map(i => Module(new Arbiter(new PtwResp, 3)).io) 98*92e3bfefSLemover val outArbCachePort = 0 99*92e3bfefSLemover val outArbFsmPort = 1 100*92e3bfefSLemover val outArbMqPort = 2 101*92e3bfefSLemover 102*92e3bfefSLemover // NOTE: when cache out but miss and ptw doesnt accept, 103*92e3bfefSLemover arb1.io.in <> VecInit(io.tlb.map(_.req(0))) 104*92e3bfefSLemover arb1.io.out.ready := arb2.io.in(1).ready 105*92e3bfefSLemover 106*92e3bfefSLemover val InArbMissQueuePort = 0 107*92e3bfefSLemover val InArbTlbPort = 1 108*92e3bfefSLemover val InArbPrefetchPort = 2 109*92e3bfefSLemover block_decoupled(missQueue.io.out, arb2.io.in(InArbMissQueuePort), !ptw.io.req.ready) 110*92e3bfefSLemover arb2.io.in(InArbTlbPort).valid := arb1.io.out.valid 111*92e3bfefSLemover arb2.io.in(InArbTlbPort).bits.vpn := arb1.io.out.bits.vpn 112*92e3bfefSLemover arb2.io.in(InArbTlbPort).bits.source := arb1.io.chosen 113*92e3bfefSLemover if (l2tlbParams.enablePrefetch) { 114*92e3bfefSLemover val prefetch = Module(new L2TlbPrefetch()) 115*92e3bfefSLemover val recv = cache.io.resp 116*92e3bfefSLemover // NOTE: 1. prefetch doesn't gen prefetch 2. req from mq doesn't gen prefetch 117*92e3bfefSLemover // NOTE: 1. miss req gen prefetch 2. hit but prefetched gen prefetch 118*92e3bfefSLemover prefetch.io.in.valid := recv.fire() && !from_pre(recv.bits.req_info.source) && (!recv.bits.hit || 119*92e3bfefSLemover recv.bits.prefetch) && recv.bits.isFirst 120*92e3bfefSLemover prefetch.io.in.bits.vpn := recv.bits.req_info.vpn 121*92e3bfefSLemover prefetch.io.sfence := sfence 122*92e3bfefSLemover prefetch.io.csr := csr 123*92e3bfefSLemover arb2.io.in(InArbPrefetchPort) <> prefetch.io.out 124*92e3bfefSLemover } 125*92e3bfefSLemover arb2.io.out.ready := cache.io.req.ready 126*92e3bfefSLemover 127*92e3bfefSLemover val LLPTWARB_CACHE=0 128*92e3bfefSLemover val LLPTWARB_PTW=1 129*92e3bfefSLemover val llptw_arb = Module(new Arbiter(new LLPTWInBundle, 2)) 130*92e3bfefSLemover llptw_arb.io.in(LLPTWARB_CACHE).valid := cache.io.resp.valid && !cache.io.resp.bits.hit && cache.io.resp.bits.toFsm.l2Hit 131*92e3bfefSLemover llptw_arb.io.in(LLPTWARB_CACHE).bits.req_info := cache.io.resp.bits.req_info 132*92e3bfefSLemover llptw_arb.io.in(LLPTWARB_CACHE).bits.ppn := cache.io.resp.bits.toFsm.ppn 133*92e3bfefSLemover llptw_arb.io.in(LLPTWARB_PTW) <> ptw.io.llptw 134*92e3bfefSLemover llptw.io.in <> llptw_arb.io.out 135*92e3bfefSLemover llptw.io.sfence := sfence 136*92e3bfefSLemover llptw.io.csr := csr 137*92e3bfefSLemover 138*92e3bfefSLemover cache.io.req.valid := arb2.io.out.valid 139*92e3bfefSLemover cache.io.req.bits.req_info.vpn := arb2.io.out.bits.vpn 140*92e3bfefSLemover cache.io.req.bits.req_info.source := arb2.io.out.bits.source 141*92e3bfefSLemover cache.io.req.bits.isFirst := arb2.io.chosen =/= InArbMissQueuePort.U 142*92e3bfefSLemover cache.io.sfence := sfence 143*92e3bfefSLemover cache.io.csr := csr 144*92e3bfefSLemover cache.io.resp.ready := Mux(cache.io.resp.bits.hit, 145*92e3bfefSLemover outReady(cache.io.resp.bits.req_info.source, outArbCachePort), 146*92e3bfefSLemover Mux(cache.io.resp.bits.toFsm.l2Hit, llptw_arb.io.in(LLPTWARB_CACHE).ready, 147*92e3bfefSLemover missQueue.io.in.ready || ptw.io.req.ready)) 148*92e3bfefSLemover 149*92e3bfefSLemover missQueue.io.in.valid := cache.io.resp.valid && !cache.io.resp.bits.hit && 150*92e3bfefSLemover !cache.io.resp.bits.toFsm.l2Hit && !ptw.io.req.ready 151*92e3bfefSLemover missQueue.io.in.bits := cache.io.resp.bits.req_info 152*92e3bfefSLemover missQueue.io.sfence := sfence 153*92e3bfefSLemover missQueue.io.csr := csr 154*92e3bfefSLemover 155*92e3bfefSLemover // NOTE: missQueue req has higher priority 156*92e3bfefSLemover ptw.io.req.valid := cache.io.resp.valid && !cache.io.resp.bits.hit && !cache.io.resp.bits.toFsm.l2Hit 157*92e3bfefSLemover ptw.io.req.bits.req_info := cache.io.resp.bits.req_info 158*92e3bfefSLemover ptw.io.req.bits.l1Hit := cache.io.resp.bits.toFsm.l1Hit 159*92e3bfefSLemover ptw.io.req.bits.ppn := cache.io.resp.bits.toFsm.ppn 160*92e3bfefSLemover ptw.io.csr := csr 161*92e3bfefSLemover ptw.io.sfence := sfence 162*92e3bfefSLemover ptw.io.resp.ready := outReady(ptw.io.resp.bits.source, outArbFsmPort) 163*92e3bfefSLemover 164*92e3bfefSLemover 165*92e3bfefSLemover // mem req 166*92e3bfefSLemover def blockBytes_align(addr: UInt) = { 167*92e3bfefSLemover Cat(addr(PAddrBits - 1, log2Up(l2tlbParams.blockBytes)), 0.U(log2Up(l2tlbParams.blockBytes).W)) 168*92e3bfefSLemover } 169*92e3bfefSLemover def addr_low_from_vpn(vpn: UInt) = { 170*92e3bfefSLemover vpn(log2Ceil(l2tlbParams.blockBytes)-log2Ceil(XLEN/8)-1, 0) 171*92e3bfefSLemover } 172*92e3bfefSLemover def addr_low_from_paddr(paddr: UInt) = { 173*92e3bfefSLemover paddr(log2Up(l2tlbParams.blockBytes)-1, log2Up(XLEN/8)) 174*92e3bfefSLemover } 175*92e3bfefSLemover def from_missqueue(id: UInt) = { 176*92e3bfefSLemover (id =/= l2tlbParams.llptwsize.U) 177*92e3bfefSLemover } 178*92e3bfefSLemover val waiting_resp = RegInit(VecInit(Seq.fill(MemReqWidth)(false.B))) 179*92e3bfefSLemover val flush_latch = RegInit(VecInit(Seq.fill(MemReqWidth)(false.B))) 180*92e3bfefSLemover for (i <- waiting_resp.indices) { 181*92e3bfefSLemover assert(!flush_latch(i) || waiting_resp(i)) // when sfence_latch wait for mem resp, waiting_resp should be true 182*92e3bfefSLemover } 183*92e3bfefSLemover 184*92e3bfefSLemover val llptw_out = llptw.io.out 185*92e3bfefSLemover val llptw_mem = llptw.io.mem 186*92e3bfefSLemover llptw_mem.req_mask := waiting_resp.take(l2tlbParams.llptwsize) 187*92e3bfefSLemover ptw.io.mem.mask := waiting_resp.last 188*92e3bfefSLemover 189*92e3bfefSLemover val mem_arb = Module(new Arbiter(new L2TlbMemReqBundle(), 2)) 190*92e3bfefSLemover mem_arb.io.in(0) <> ptw.io.mem.req 191*92e3bfefSLemover mem_arb.io.in(1) <> llptw_mem.req 192*92e3bfefSLemover mem_arb.io.out.ready := mem.a.ready && !flush 193*92e3bfefSLemover 194*92e3bfefSLemover val req_addr_low = Reg(Vec(MemReqWidth, UInt((log2Up(l2tlbParams.blockBytes)-log2Up(XLEN/8)).W))) 195*92e3bfefSLemover 196*92e3bfefSLemover when (llptw.io.in.fire()) { 197*92e3bfefSLemover // when enq miss queue, set the req_addr_low to receive the mem resp data part 198*92e3bfefSLemover req_addr_low(llptw_mem.enq_ptr) := addr_low_from_vpn(llptw.io.in.bits.req_info.vpn) 199*92e3bfefSLemover } 200*92e3bfefSLemover when (mem_arb.io.out.fire()) { 201*92e3bfefSLemover req_addr_low(mem_arb.io.out.bits.id) := addr_low_from_paddr(mem_arb.io.out.bits.addr) 202*92e3bfefSLemover waiting_resp(mem_arb.io.out.bits.id) := true.B 203*92e3bfefSLemover } 204*92e3bfefSLemover // mem read 205*92e3bfefSLemover val memRead = edge.Get( 206*92e3bfefSLemover fromSource = mem_arb.io.out.bits.id, 207*92e3bfefSLemover // toAddress = memAddr(log2Up(CacheLineSize / 2 / 8) - 1, 0), 208*92e3bfefSLemover toAddress = blockBytes_align(mem_arb.io.out.bits.addr), 209*92e3bfefSLemover lgSize = log2Up(l2tlbParams.blockBytes).U 210*92e3bfefSLemover )._2 211*92e3bfefSLemover mem.a.bits := memRead 212*92e3bfefSLemover mem.a.valid := mem_arb.io.out.valid && !flush 213*92e3bfefSLemover mem.d.ready := true.B 214*92e3bfefSLemover // mem -> data buffer 215*92e3bfefSLemover val refill_data = Reg(Vec(blockBits / l1BusDataWidth, UInt(l1BusDataWidth.W))) 216*92e3bfefSLemover val refill_helper = edge.firstlastHelper(mem.d.bits, mem.d.fire()) 217*92e3bfefSLemover val mem_resp_done = refill_helper._3 218*92e3bfefSLemover val mem_resp_from_mq = from_missqueue(mem.d.bits.source) 219*92e3bfefSLemover when (mem.d.valid) { 220*92e3bfefSLemover assert(mem.d.bits.source <= l2tlbParams.llptwsize.U) 221*92e3bfefSLemover refill_data(refill_helper._4) := mem.d.bits.data 222*92e3bfefSLemover } 223*92e3bfefSLemover // save only one pte for each id 224*92e3bfefSLemover // (miss queue may can't resp to tlb with low latency, it should have highest priority, but diffcult to design cache) 225*92e3bfefSLemover val resp_pte = VecInit((0 until MemReqWidth).map(i => 226*92e3bfefSLemover if (i == l2tlbParams.llptwsize) {DataHoldBypass(get_part(refill_data, req_addr_low(i)), RegNext(mem_resp_done && !mem_resp_from_mq)) } 227*92e3bfefSLemover else { DataHoldBypass(get_part(refill_data, req_addr_low(i)), llptw_mem.buffer_it(i)) } 228*92e3bfefSLemover )) 229*92e3bfefSLemover 230*92e3bfefSLemover // mem -> miss queue 231*92e3bfefSLemover llptw_mem.resp.valid := mem_resp_done && mem_resp_from_mq 232*92e3bfefSLemover llptw_mem.resp.bits.id := mem.d.bits.source 233*92e3bfefSLemover // mem -> ptw 234*92e3bfefSLemover ptw.io.mem.req.ready := mem.a.ready 235*92e3bfefSLemover ptw.io.mem.resp.valid := mem_resp_done && !mem_resp_from_mq 236*92e3bfefSLemover ptw.io.mem.resp.bits := resp_pte.last 237*92e3bfefSLemover // mem -> cache 238*92e3bfefSLemover val refill_from_mq = RegNext(mem_resp_from_mq) 239*92e3bfefSLemover cache.io.refill.valid := RegNext(mem_resp_done && !flush && !flush_latch(mem.d.bits.source)) 240*92e3bfefSLemover cache.io.refill.bits.ptes := refill_data.asUInt 241*92e3bfefSLemover cache.io.refill.bits.req_info := Mux(refill_from_mq, llptw_mem.refill, ptw.io.refill.req_info) 242*92e3bfefSLemover cache.io.refill.bits.level := Mux(refill_from_mq, 2.U, RegEnable(ptw.io.refill.level, init = 0.U, ptw.io.mem.req.fire())) 243*92e3bfefSLemover cache.io.refill.bits.addr_low := RegNext(req_addr_low(mem.d.bits.source)) 244*92e3bfefSLemover 245*92e3bfefSLemover // pmp 246*92e3bfefSLemover pmp_check(0).req <> ptw.io.pmp.req 247*92e3bfefSLemover ptw.io.pmp.resp <> pmp_check(0).resp 248*92e3bfefSLemover pmp_check(1).req <> llptw.io.pmp.req 249*92e3bfefSLemover llptw.io.pmp.resp <> pmp_check(1).resp 250*92e3bfefSLemover 251*92e3bfefSLemover llptw_out.ready := outReady(llptw_out.bits.req_info.source, outArbMqPort) 252*92e3bfefSLemover for (i <- 0 until PtwWidth) { 253*92e3bfefSLemover outArb(i).in(outArbCachePort).valid := cache.io.resp.valid && cache.io.resp.bits.hit && cache.io.resp.bits.req_info.source===i.U 254*92e3bfefSLemover outArb(i).in(outArbCachePort).bits.entry := cache.io.resp.bits.toTlb 255*92e3bfefSLemover outArb(i).in(outArbCachePort).bits.pf := !cache.io.resp.bits.toTlb.v 256*92e3bfefSLemover outArb(i).in(outArbCachePort).bits.af := false.B 257*92e3bfefSLemover outArb(i).in(outArbFsmPort).valid := ptw.io.resp.valid && ptw.io.resp.bits.source===i.U 258*92e3bfefSLemover outArb(i).in(outArbFsmPort).bits := ptw.io.resp.bits.resp 259*92e3bfefSLemover outArb(i).in(outArbMqPort).valid := llptw_out.valid && llptw_out.bits.req_info.source===i.U 260*92e3bfefSLemover outArb(i).in(outArbMqPort).bits := pte_to_ptwResp(resp_pte(llptw_out.bits.id), llptw_out.bits.req_info.vpn, llptw_out.bits.af, true) 261*92e3bfefSLemover } 262*92e3bfefSLemover 263*92e3bfefSLemover // io.tlb.map(_.resp) <> outArb.map(_.out) 264*92e3bfefSLemover io.tlb.map(_.resp).zip(outArb.map(_.out)).map{ 265*92e3bfefSLemover case (resp, out) => resp <> out 266*92e3bfefSLemover } 267*92e3bfefSLemover 268*92e3bfefSLemover // sfence 269*92e3bfefSLemover when (flush) { 270*92e3bfefSLemover for (i <- 0 until MemReqWidth) { 271*92e3bfefSLemover when (waiting_resp(i)) { 272*92e3bfefSLemover flush_latch(i) := true.B 273*92e3bfefSLemover } 274*92e3bfefSLemover } 275*92e3bfefSLemover } 276*92e3bfefSLemover // mem -> control signal 277*92e3bfefSLemover // waiting_resp and sfence_latch will be reset when mem_resp_done 278*92e3bfefSLemover when (mem_resp_done) { 279*92e3bfefSLemover waiting_resp(mem.d.bits.source) := false.B 280*92e3bfefSLemover flush_latch(mem.d.bits.source) := false.B 281*92e3bfefSLemover } 282*92e3bfefSLemover 283*92e3bfefSLemover def block_decoupled[T <: Data](source: DecoupledIO[T], sink: DecoupledIO[T], block_signal: Bool) = { 284*92e3bfefSLemover sink.valid := source.valid && !block_signal 285*92e3bfefSLemover source.ready := sink.ready && !block_signal 286*92e3bfefSLemover sink.bits := source.bits 287*92e3bfefSLemover } 288*92e3bfefSLemover 289*92e3bfefSLemover def get_part(data: Vec[UInt], index: UInt): UInt = { 290*92e3bfefSLemover val inner_data = data.asTypeOf(Vec(data.getWidth / XLEN, UInt(XLEN.W))) 291*92e3bfefSLemover inner_data(index) 292*92e3bfefSLemover } 293*92e3bfefSLemover 294*92e3bfefSLemover def pte_to_ptwResp(pte: UInt, vpn: UInt, af: Bool, af_first: Boolean) : PtwResp = { 295*92e3bfefSLemover val pte_in = pte.asTypeOf(new PteBundle()) 296*92e3bfefSLemover val ptw_resp = Wire(new PtwResp()) 297*92e3bfefSLemover ptw_resp.entry.ppn := pte_in.ppn 298*92e3bfefSLemover ptw_resp.entry.level.map(_ := 2.U) 299*92e3bfefSLemover ptw_resp.entry.perm.map(_ := pte_in.getPerm()) 300*92e3bfefSLemover ptw_resp.entry.tag := vpn 301*92e3bfefSLemover ptw_resp.pf := (if (af_first) !af else true.B) && pte_in.isPf(2.U) 302*92e3bfefSLemover ptw_resp.af := (if (!af_first) pte_in.isPf(2.U) else true.B) && af 303*92e3bfefSLemover ptw_resp.entry.v := !ptw_resp.pf 304*92e3bfefSLemover ptw_resp.entry.prefetch := DontCare 305*92e3bfefSLemover ptw_resp.entry.asid := satp.asid 306*92e3bfefSLemover ptw_resp 307*92e3bfefSLemover } 308*92e3bfefSLemover 309*92e3bfefSLemover def outReady(source: UInt, port: Int): Bool = { 310*92e3bfefSLemover MuxLookup(source, true.B, 311*92e3bfefSLemover (0 until PtwWidth).map(i => i.U -> outArb(i).in(port).ready)) 312*92e3bfefSLemover } 313*92e3bfefSLemover 314*92e3bfefSLemover // debug info 315*92e3bfefSLemover for (i <- 0 until PtwWidth) { 316*92e3bfefSLemover XSDebug(p"[io.tlb(${i.U})] ${io.tlb(i)}\n") 317*92e3bfefSLemover } 318*92e3bfefSLemover XSDebug(p"[sfence] ${sfence}\n") 319*92e3bfefSLemover XSDebug(p"[io.csr.tlb] ${io.csr.tlb}\n") 320*92e3bfefSLemover 321*92e3bfefSLemover for (i <- 0 until PtwWidth) { 322*92e3bfefSLemover XSPerfAccumulate(s"req_count${i}", io.tlb(i).req(0).fire()) 323*92e3bfefSLemover XSPerfAccumulate(s"req_blocked_count_${i}", io.tlb(i).req(0).valid && !io.tlb(i).req(0).ready) 324*92e3bfefSLemover } 325*92e3bfefSLemover XSPerfAccumulate(s"req_blocked_by_mq", arb1.io.out.valid && missQueue.io.out.valid) 326*92e3bfefSLemover for (i <- 0 until (MemReqWidth + 1)) { 327*92e3bfefSLemover XSPerfAccumulate(s"mem_req_util${i}", PopCount(waiting_resp) === i.U) 328*92e3bfefSLemover } 329*92e3bfefSLemover XSPerfAccumulate("mem_cycle", PopCount(waiting_resp) =/= 0.U) 330*92e3bfefSLemover XSPerfAccumulate("mem_count", mem.a.fire()) 331*92e3bfefSLemover 332*92e3bfefSLemover // print configs 333*92e3bfefSLemover println(s"${l2tlbParams.name}: a ptw, a llptw with size ${l2tlbParams.llptwsize}, miss queue size ${MSHRSize} l1:${l2tlbParams.l1Size} fa l2: nSets ${l2tlbParams.l2nSets} nWays ${l2tlbParams.l2nWays} l3: ${l2tlbParams.l3nSets} nWays ${l2tlbParams.l3nWays} blockBytes:${l2tlbParams.blockBytes}") 334*92e3bfefSLemover 335*92e3bfefSLemover // time out assert 336*92e3bfefSLemover for (i <- 0 until MemReqWidth) { 337*92e3bfefSLemover TimeOutAssert(waiting_resp(i), timeOutThreshold, s"ptw mem resp time out wait_resp${i}") 338*92e3bfefSLemover TimeOutAssert(flush_latch(i), timeOutThreshold, s"ptw mem resp time out flush_latch${i}") 339*92e3bfefSLemover } 340*92e3bfefSLemover 341*92e3bfefSLemover 342*92e3bfefSLemover val perfEvents = Seq(llptw, cache, ptw).flatMap(_.getPerfEvents) 343*92e3bfefSLemover generatePerfEvent() 344*92e3bfefSLemover} 345*92e3bfefSLemover 346*92e3bfefSLemoverclass PTEHelper() extends ExtModule { 347*92e3bfefSLemover val clock = IO(Input(Clock())) 348*92e3bfefSLemover val enable = IO(Input(Bool())) 349*92e3bfefSLemover val satp = IO(Input(UInt(64.W))) 350*92e3bfefSLemover val vpn = IO(Input(UInt(64.W))) 351*92e3bfefSLemover val pte = IO(Output(UInt(64.W))) 352*92e3bfefSLemover val level = IO(Output(UInt(8.W))) 353*92e3bfefSLemover val pf = IO(Output(UInt(8.W))) 354*92e3bfefSLemover} 355*92e3bfefSLemover 356*92e3bfefSLemoverclass FakePTW()(implicit p: Parameters) extends XSModule with HasPtwConst { 357*92e3bfefSLemover val io = IO(new L2TLBIO) 358*92e3bfefSLemover 359*92e3bfefSLemover for (i <- 0 until PtwWidth) { 360*92e3bfefSLemover io.tlb(i).req(0).ready := true.B 361*92e3bfefSLemover 362*92e3bfefSLemover val helper = Module(new PTEHelper()) 363*92e3bfefSLemover helper.clock := clock 364*92e3bfefSLemover helper.enable := io.tlb(i).req(0).valid 365*92e3bfefSLemover helper.satp := io.csr.tlb.satp.ppn 366*92e3bfefSLemover helper.vpn := io.tlb(i).req(0).bits.vpn 367*92e3bfefSLemover val pte = helper.pte.asTypeOf(new PteBundle) 368*92e3bfefSLemover val level = helper.level 369*92e3bfefSLemover val pf = helper.pf 370*92e3bfefSLemover 371*92e3bfefSLemover io.tlb(i).resp.valid := RegNext(io.tlb(i).req(0).valid) 372*92e3bfefSLemover assert(!io.tlb(i).resp.valid || io.tlb(i).resp.ready) 373*92e3bfefSLemover io.tlb(i).resp.bits.entry.tag := RegNext(io.tlb(i).req(0).bits.vpn) 374*92e3bfefSLemover io.tlb(i).resp.bits.entry.ppn := pte.ppn 375*92e3bfefSLemover io.tlb(i).resp.bits.entry.perm.map(_ := pte.getPerm()) 376*92e3bfefSLemover io.tlb(i).resp.bits.entry.level.map(_ := level) 377*92e3bfefSLemover io.tlb(i).resp.bits.pf := pf 378*92e3bfefSLemover io.tlb(i).resp.bits.af := DontCare // TODO: implement it 379*92e3bfefSLemover } 380*92e3bfefSLemover} 381*92e3bfefSLemover 382*92e3bfefSLemoverclass L2TLBWrapper()(implicit p: Parameters) extends LazyModule with HasXSParameter { 383*92e3bfefSLemover val useSoftPTW = coreParams.softPTW 384*92e3bfefSLemover val node = if (!useSoftPTW) TLIdentityNode() else null 385*92e3bfefSLemover val ptw = if (!useSoftPTW) LazyModule(new L2TLB()) else null 386*92e3bfefSLemover if (!useSoftPTW) { 387*92e3bfefSLemover node := ptw.node 388*92e3bfefSLemover } 389*92e3bfefSLemover 390*92e3bfefSLemover lazy val module = new LazyModuleImp(this) with HasPerfEvents { 391*92e3bfefSLemover val io = IO(new L2TLBIO) 392*92e3bfefSLemover val perfEvents = if (useSoftPTW) { 393*92e3bfefSLemover val fake_ptw = Module(new FakePTW()) 394*92e3bfefSLemover io <> fake_ptw.io 395*92e3bfefSLemover Seq() 396*92e3bfefSLemover } 397*92e3bfefSLemover else { 398*92e3bfefSLemover io <> ptw.module.io 399*92e3bfefSLemover ptw.module.getPerfEvents 400*92e3bfefSLemover } 401*92e3bfefSLemover generatePerfEvent() 402*92e3bfefSLemover } 403*92e3bfefSLemover} 404