16d5ddbceSLemover/*************************************************************************************** 26d5ddbceSLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory 46d5ddbceSLemover* 56d5ddbceSLemover* XiangShan is licensed under Mulan PSL v2. 66d5ddbceSLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 76d5ddbceSLemover* You may obtain a copy of Mulan PSL v2 at: 86d5ddbceSLemover* http://license.coscl.org.cn/MulanPSL2 96d5ddbceSLemover* 106d5ddbceSLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 116d5ddbceSLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 126d5ddbceSLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 136d5ddbceSLemover* 146d5ddbceSLemover* See the Mulan PSL v2 for more details. 156d5ddbceSLemover***************************************************************************************/ 166d5ddbceSLemover 176d5ddbceSLemoverpackage xiangshan.cache.mmu 186d5ddbceSLemover 198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters 206d5ddbceSLemoverimport chisel3._ 216d5ddbceSLemoverimport chisel3.util._ 226d5ddbceSLemoverimport xiangshan._ 236d5ddbceSLemoverimport xiangshan.cache.{HasDCacheParameters, MemoryOpConstants} 246d5ddbceSLemoverimport utils._ 253c02ee8fSwakafaimport utility._ 266d5ddbceSLemoverimport freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp} 276d5ddbceSLemoverimport freechips.rocketchip.tilelink._ 28b6982e83SLemoverimport xiangshan.backend.fu.{PMPReqBundle, PMPRespBundle} 296d5ddbceSLemover 3092e3bfefSLemover/** Page Table Walk is divided into two parts 3192e3bfefSLemover * One, PTW: page walk for pde, except for leaf entries, one by one 3292e3bfefSLemover * Two, LLPTW: page walk for pte, only the leaf entries(4KB), in parallel 336d5ddbceSLemover */ 3492e3bfefSLemover 3592e3bfefSLemover 3692e3bfefSLemover/** PTW : page table walker 3792e3bfefSLemover * a finite state machine 3892e3bfefSLemover * only take 1GB and 2MB page walks 3992e3bfefSLemover * or in other words, except the last level(leaf) 4092e3bfefSLemover **/ 4192e3bfefSLemoverclass PTWIO()(implicit p: Parameters) extends MMUIOBaseBundle with HasPtwConst { 426d5ddbceSLemover val req = Flipped(DecoupledIO(new Bundle { 4345f497a4Shappy-lx val req_info = new L2TlbInnerBundle() 446d5ddbceSLemover val l1Hit = Bool() 456d5ddbceSLemover val ppn = UInt(ppnLen.W) 46*30104977Speixiaokun val stage1Hit = Bool() 47*30104977Speixiaokun val stage1 = new PtwMergeResp 486d5ddbceSLemover })) 496d5ddbceSLemover val resp = DecoupledIO(new Bundle { 50bc063562SLemover val source = UInt(bSourceWidth.W) 51eb4bf3f2Speixiaokun val s2xlate = UInt(2.W) 5263632028SHaoyuan Feng val resp = new PtwMergeResp 53d0de7e4aSpeixiaokun val h_resp = new HptwResp 546d5ddbceSLemover }) 556d5ddbceSLemover 5692e3bfefSLemover val llptw = DecoupledIO(new LLPTWInBundle()) 579c503409SLemover // NOTE: llptw change from "connect to llptw" to "connect to page cache" 589c503409SLemover // to avoid corner case that caused duplicate entries 59cc5a5f22SLemover 60d0de7e4aSpeixiaokun val hptw = new Bundle { 61d0de7e4aSpeixiaokun val req = DecoupledIO(new Bundle { 62eb4bf3f2Speixiaokun val source = UInt(bSourceWidth.W) 63d0de7e4aSpeixiaokun val id = UInt(log2Up(l2tlbParams.llptwsize).W) 6482978df9Speixiaokun val gvpn = UInt(vpnLen.W) 65d0de7e4aSpeixiaokun }) 66d0de7e4aSpeixiaokun val resp = Flipped(Valid(new Bundle { 67d0de7e4aSpeixiaokun val h_resp = Output(new HptwResp) 68d0de7e4aSpeixiaokun })) 69d0de7e4aSpeixiaokun } 706d5ddbceSLemover val mem = new Bundle { 71b848eea5SLemover val req = DecoupledIO(new L2TlbMemReqBundle()) 725854c1edSLemover val resp = Flipped(ValidIO(UInt(XLEN.W))) 73cc5a5f22SLemover val mask = Input(Bool()) 746d5ddbceSLemover } 75b6982e83SLemover val pmp = new Bundle { 76b6982e83SLemover val req = ValidIO(new PMPReqBundle()) 77b6982e83SLemover val resp = Flipped(new PMPRespBundle()) 78b6982e83SLemover } 796d5ddbceSLemover 806d5ddbceSLemover val refill = Output(new Bundle { 8145f497a4Shappy-lx val req_info = new L2TlbInnerBundle() 826d5ddbceSLemover val level = UInt(log2Up(Level).W) 836d5ddbceSLemover }) 846d5ddbceSLemover} 856d5ddbceSLemover 8692e3bfefSLemoverclass PTW()(implicit p: Parameters) extends XSModule with HasPtwConst with HasPerfEvents { 8792e3bfefSLemover val io = IO(new PTWIO) 886d5ddbceSLemover val sfence = io.sfence 896d5ddbceSLemover val mem = io.mem 90d0de7e4aSpeixiaokun val req_s2xlate = Reg(UInt(2.W)) 9103c1129fSpeixiaokun val enableS2xlate = req_s2xlate =/= noS2xlate 9203c1129fSpeixiaokun val onlyS1xlate = req_s2xlate === onlyStage1 9303c1129fSpeixiaokun val onlyS2xlate = req_s2xlate === onlyStage2 94d0de7e4aSpeixiaokun 95d0de7e4aSpeixiaokun val satp = Mux(enableS2xlate, io.csr.vsatp, io.csr.satp) 96d0de7e4aSpeixiaokun val hgatp = io.csr.hgatp 97d0de7e4aSpeixiaokun val flush = io.sfence.valid || satp.changed 98d0de7e4aSpeixiaokun val s2xlate = enableS2xlate && !onlyS1xlate 996d5ddbceSLemover val level = RegInit(0.U(log2Up(Level).W)) 100b6982e83SLemover val af_level = RegInit(0.U(log2Up(Level).W)) // access fault return this level 1016d5ddbceSLemover val ppn = Reg(UInt(ppnLen.W)) 10282978df9Speixiaokun val vpn = Reg(UInt(vpnLen.W)) // vpn or gvpn 1036d5ddbceSLemover val levelNext = level + 1.U 1046d5ddbceSLemover val l1Hit = Reg(Bool()) 105d0de7e4aSpeixiaokun val pte = mem.resp.bits.asTypeOf(new PteBundle().cloneType) 1066d5ddbceSLemover 10744b79566SXiaokun-Pei // s/w register 10844b79566SXiaokun-Pei val s_pmp_check = RegInit(true.B) 10944b79566SXiaokun-Pei val s_mem_req = RegInit(true.B) 11044b79566SXiaokun-Pei val s_llptw_req = RegInit(true.B) 11144b79566SXiaokun-Pei val w_mem_resp = RegInit(true.B) 112d0de7e4aSpeixiaokun val s_hptw_req = RegInit(true.B) 113d0de7e4aSpeixiaokun val w_hptw_resp = RegInit(true.B) 114d0de7e4aSpeixiaokun val s_last_hptw_req = RegInit(true.B) 115d0de7e4aSpeixiaokun val w_last_hptw_resp = RegInit(true.B) 11644b79566SXiaokun-Pei // for updating "level" 11744b79566SXiaokun-Pei val mem_addr_update = RegInit(false.B) 11844b79566SXiaokun-Pei 11944b79566SXiaokun-Pei val idle = RegInit(true.B) 1202a906a65SHaoyuan Feng val finish = WireInit(false.B) 1212a906a65SHaoyuan Feng val sent_to_pmp = idle === false.B && (s_pmp_check === false.B || mem_addr_update) && !finish 12244b79566SXiaokun-Pei 123d0de7e4aSpeixiaokun val pageFault = pte.isPf(level) 12444b79566SXiaokun-Pei val accessFault = RegEnable(io.pmp.resp.ld || io.pmp.resp.mmio, sent_to_pmp) 1256d5ddbceSLemover 126d0de7e4aSpeixiaokun val hptw_pageFault = RegInit(false.B) 127d0de7e4aSpeixiaokun val hptw_accessFault = RegInit(false.B) 128d0de7e4aSpeixiaokun val last_s2xlate = RegInit(false.B) 129*30104977Speixiaokun val stage1Hit = RegEnable(io.req.bits.stage1Hit, io.req.fire()) 130*30104977Speixiaokun val stage1 = RegEnable(io.req.bits.stage1, io.req.fire()) 131d0de7e4aSpeixiaokun 132d0de7e4aSpeixiaokun val ppn_af = pte.isAf() 133d0de7e4aSpeixiaokun val find_pte = pte.isLeaf() || ppn_af || pageFault 13444b79566SXiaokun-Pei val to_find_pte = level === 1.U && find_pte === false.B 135935edac4STang Haojin val source = RegEnable(io.req.bits.req_info.source, io.req.fire) 1366d5ddbceSLemover 1376d5ddbceSLemover val l1addr = MakeAddr(satp.ppn, getVpnn(vpn, 2)) 138d0de7e4aSpeixiaokun val l2addr = MakeAddr(Mux(l1Hit, ppn, pte.ppn), getVpnn(vpn, 1)) 139b6982e83SLemover val mem_addr = Mux(af_level === 0.U, l1addr, l2addr) 14044b79566SXiaokun-Pei 141b24e0a78Speixiaokun val hptw_resp = RegEnable(io.hptw.resp.bits.h_resp, io.hptw.resp.fire()) 142*30104977Speixiaokun val gpaddr = Mux(stage1Hit, stage1.genPPN(), Mux(onlyS2xlate, Cat(vpn, 0.U(offLen.W)), mem_addr)) 143b24e0a78Speixiaokun val hpaddr = Cat(hptw_resp.genPPNS2(), get_off(gpaddr)) 144d0de7e4aSpeixiaokun 14544b79566SXiaokun-Pei io.req.ready := idle 146*30104977Speixiaokun val ptw_resp = Wire(new PtwMergeResp) 147*30104977Speixiaokun ptw_resp.apply(pageFault && !accessFault && !ppn_af, accessFault || ppn_af, Mux(accessFault, af_level,level), pte, vpn, satp.asid, hgatp.asid, vpn(sectortlbwidth - 1, 0), not_super = false) 14844b79566SXiaokun-Pei 149d0de7e4aSpeixiaokun io.resp.valid := idle === false.B && mem_addr_update && !last_s2xlate && ((w_mem_resp && find_pte) || (s_pmp_check && accessFault) || onlyS2xlate) 15044b79566SXiaokun-Pei io.resp.bits.source := source 151*30104977Speixiaokun io.resp.bits.resp := Mux(stage1Hit, stage1, ptw_resp) 152d0de7e4aSpeixiaokun io.resp.bits.h_resp := io.hptw.resp.bits.h_resp 1536315ba2aSpeixiaokun io.resp.bits.s2xlate := req_s2xlate 15444b79566SXiaokun-Pei 15544b79566SXiaokun-Pei io.llptw.valid := s_llptw_req === false.B && to_find_pte && !accessFault 15644b79566SXiaokun-Pei io.llptw.bits.req_info.source := source 15744b79566SXiaokun-Pei io.llptw.bits.req_info.vpn := vpn 15882978df9Speixiaokun io.llptw.bits.req_info.s2xlate := req_s2xlate 159eb4bf3f2Speixiaokun io.llptw.bits.ppn := DontCare 16044b79566SXiaokun-Pei 161b6982e83SLemover io.pmp.req.valid := DontCare // samecycle, do not use valid 162d0de7e4aSpeixiaokun io.pmp.req.bits.addr := Mux(s2xlate, hpaddr, mem_addr) 163b6982e83SLemover io.pmp.req.bits.size := 3.U // TODO: fix it 164b6982e83SLemover io.pmp.req.bits.cmd := TlbCmd.read 165b6982e83SLemover 16644b79566SXiaokun-Pei mem.req.valid := s_mem_req === false.B && !mem.mask && !accessFault && s_pmp_check 167d0de7e4aSpeixiaokun mem.req.bits.addr := Mux(s2xlate, hpaddr, mem_addr) 168bc063562SLemover mem.req.bits.id := FsmReqID.U(bMemID.W) 1696d5ddbceSLemover 170eb4bf3f2Speixiaokun io.refill.req_info.s2xlate := req_s2xlate 17145f497a4Shappy-lx io.refill.req_info.vpn := vpn 1726d5ddbceSLemover io.refill.level := level 17345f497a4Shappy-lx io.refill.req_info.source := source 1746d5ddbceSLemover 175d0de7e4aSpeixiaokun io.hptw.req.valid := !s_hptw_req || !s_last_hptw_req 176d0de7e4aSpeixiaokun io.hptw.req.bits.id := FsmReqID.U(bMemID.W) 17782978df9Speixiaokun io.hptw.req.bits.gvpn := get_pn(gpaddr) 178eb4bf3f2Speixiaokun io.hptw.req.bits.source := source 179d0de7e4aSpeixiaokun 180*30104977Speixiaokun when (io.req.fire() && io.req.bits.stage1Hit){ 181*30104977Speixiaokun idle := false.B 182*30104977Speixiaokun s_hptw_req := false.B 183*30104977Speixiaokun } 184d0de7e4aSpeixiaokun 185*30104977Speixiaokun when (io.hptw.resp.fire() && w_hptw_resp === false.B && stage1Hit){ 186*30104977Speixiaokun w_hptw_resp := true.B 187*30104977Speixiaokun } 188*30104977Speixiaokun 189*30104977Speixiaokun when (io.resp.fire() && stage1Hit){ 190*30104977Speixiaokun idle := true.B 191*30104977Speixiaokun } 192*30104977Speixiaokun 193*30104977Speixiaokun when (io.req.fire() && !io.req.bits.stage1Hit){ 19444b79566SXiaokun-Pei val req = io.req.bits 19544b79566SXiaokun-Pei level := Mux(req.l1Hit, 1.U, 0.U) 19644b79566SXiaokun-Pei af_level := Mux(req.l1Hit, 1.U, 0.U) 19744b79566SXiaokun-Pei ppn := Mux(req.l1Hit, io.req.bits.ppn, satp.ppn) 19844b79566SXiaokun-Pei vpn := io.req.bits.req_info.vpn 19944b79566SXiaokun-Pei l1Hit := req.l1Hit 20044b79566SXiaokun-Pei accessFault := false.B 20144b79566SXiaokun-Pei idle := false.B 202d0de7e4aSpeixiaokun hptw_pageFault := false.B 20350c7aa78Speixiaokun req_s2xlate := io.req.bits.req_info.s2xlate 20482978df9Speixiaokun when(io.req.bits.req_info.s2xlate =/= noS2xlate && io.req.bits.req_info.s2xlate =/= onlyStage1){ 205d0de7e4aSpeixiaokun last_s2xlate := true.B 206d0de7e4aSpeixiaokun s_hptw_req := false.B 207d0de7e4aSpeixiaokun }.otherwise { 208d0de7e4aSpeixiaokun s_pmp_check := false.B 209d0de7e4aSpeixiaokun } 210d0de7e4aSpeixiaokun } 211d0de7e4aSpeixiaokun 212d0de7e4aSpeixiaokun when(io.hptw.req.fire() && s_hptw_req === false.B){ 213d0de7e4aSpeixiaokun s_hptw_req := true.B 214d0de7e4aSpeixiaokun w_hptw_resp := false.B 215d0de7e4aSpeixiaokun } 216d0de7e4aSpeixiaokun 217*30104977Speixiaokun when(io.hptw.resp.fire() && w_hptw_resp === false.B && !stage1Hit) { 218d0de7e4aSpeixiaokun hptw_pageFault := io.hptw.resp.bits.h_resp.gpf 219d0de7e4aSpeixiaokun hptw_accessFault := io.hptw.resp.bits.h_resp.gaf 220d0de7e4aSpeixiaokun w_hptw_resp := true.B 221d0de7e4aSpeixiaokun when(onlyS2xlate){ 222d0de7e4aSpeixiaokun mem_addr_update := true.B 223d0de7e4aSpeixiaokun last_s2xlate := false.B 224d0de7e4aSpeixiaokun }.otherwise { 225d0de7e4aSpeixiaokun s_pmp_check := false.B 226d0de7e4aSpeixiaokun } 227d0de7e4aSpeixiaokun } 228d0de7e4aSpeixiaokun 229d0de7e4aSpeixiaokun when(io.hptw.req.fire() && s_last_hptw_req === false.B) { 230d0de7e4aSpeixiaokun w_last_hptw_resp := false.B 231d0de7e4aSpeixiaokun s_last_hptw_req := true.B 232d0de7e4aSpeixiaokun } 233d0de7e4aSpeixiaokun 234d0de7e4aSpeixiaokun when(io.hptw.resp.fire() && w_last_hptw_resp === false.B){ 235d0de7e4aSpeixiaokun hptw_pageFault := io.hptw.resp.bits.h_resp.gpf 236d0de7e4aSpeixiaokun hptw_accessFault := io.hptw.resp.bits.h_resp.gaf 237d0de7e4aSpeixiaokun w_last_hptw_resp := true.B 238d0de7e4aSpeixiaokun mem_addr_update := true.B 239d0de7e4aSpeixiaokun last_s2xlate := false.B 24044b79566SXiaokun-Pei } 24144b79566SXiaokun-Pei 24244b79566SXiaokun-Pei when(sent_to_pmp && mem_addr_update === false.B){ 24344b79566SXiaokun-Pei s_mem_req := false.B 24444b79566SXiaokun-Pei s_pmp_check := true.B 24544b79566SXiaokun-Pei } 24644b79566SXiaokun-Pei 24744b79566SXiaokun-Pei when(accessFault && idle === false.B){ 24844b79566SXiaokun-Pei s_pmp_check := true.B 24944b79566SXiaokun-Pei s_mem_req := true.B 25044b79566SXiaokun-Pei w_mem_resp := true.B 25144b79566SXiaokun-Pei s_llptw_req := true.B 252d0de7e4aSpeixiaokun s_hptw_req := true.B 253d0de7e4aSpeixiaokun w_hptw_resp := true.B 254d0de7e4aSpeixiaokun s_last_hptw_req := true.B 255d0de7e4aSpeixiaokun w_last_hptw_resp := true.B 25644b79566SXiaokun-Pei mem_addr_update := true.B 257d0de7e4aSpeixiaokun last_s2xlate := false.B 25844b79566SXiaokun-Pei } 25944b79566SXiaokun-Pei 260935edac4STang Haojin when (mem.req.fire){ 26144b79566SXiaokun-Pei s_mem_req := true.B 26244b79566SXiaokun-Pei w_mem_resp := false.B 26344b79566SXiaokun-Pei } 26444b79566SXiaokun-Pei 265935edac4STang Haojin when(mem.resp.fire && w_mem_resp === false.B){ 26644b79566SXiaokun-Pei w_mem_resp := true.B 26744b79566SXiaokun-Pei af_level := af_level + 1.U 26844b79566SXiaokun-Pei s_llptw_req := false.B 26944b79566SXiaokun-Pei mem_addr_update := true.B 27044b79566SXiaokun-Pei } 27144b79566SXiaokun-Pei 27244b79566SXiaokun-Pei when(mem_addr_update){ 27344b79566SXiaokun-Pei when(level === 0.U && !(find_pte || accessFault)){ 27444b79566SXiaokun-Pei level := levelNext 275d0de7e4aSpeixiaokun when(s2xlate){ 276d0de7e4aSpeixiaokun s_hptw_req := false.B 277d0de7e4aSpeixiaokun }.otherwise{ 27844b79566SXiaokun-Pei s_mem_req := false.B 279d0de7e4aSpeixiaokun } 28044b79566SXiaokun-Pei s_llptw_req := true.B 28144b79566SXiaokun-Pei mem_addr_update := false.B 2822a906a65SHaoyuan Feng }.elsewhen(io.llptw.valid){ 283935edac4STang Haojin when(io.llptw.fire) { 28444b79566SXiaokun-Pei idle := true.B 28544b79566SXiaokun-Pei s_llptw_req := true.B 28644b79566SXiaokun-Pei mem_addr_update := false.B 287d0de7e4aSpeixiaokun last_s2xlate := false.B 2882a906a65SHaoyuan Feng } 2892a906a65SHaoyuan Feng finish := true.B 290d0de7e4aSpeixiaokun }.elsewhen(s2xlate && last_s2xlate === true.B) { 291d0de7e4aSpeixiaokun s_last_hptw_req := false.B 292d0de7e4aSpeixiaokun mem_addr_update := false.B 2932a906a65SHaoyuan Feng }.elsewhen(io.resp.valid){ 294935edac4STang Haojin when(io.resp.fire) { 29544b79566SXiaokun-Pei idle := true.B 29644b79566SXiaokun-Pei s_llptw_req := true.B 29744b79566SXiaokun-Pei mem_addr_update := false.B 29844b79566SXiaokun-Pei accessFault := false.B 29944b79566SXiaokun-Pei } 3002a906a65SHaoyuan Feng finish := true.B 3012a906a65SHaoyuan Feng } 30244b79566SXiaokun-Pei } 30344b79566SXiaokun-Pei 30444b79566SXiaokun-Pei 30544b79566SXiaokun-Pei when (sfence.valid) { 30644b79566SXiaokun-Pei idle := true.B 30744b79566SXiaokun-Pei s_pmp_check := true.B 30844b79566SXiaokun-Pei s_mem_req := true.B 30944b79566SXiaokun-Pei s_llptw_req := true.B 31044b79566SXiaokun-Pei w_mem_resp := true.B 31144b79566SXiaokun-Pei accessFault := false.B 312d826bce1SHaoyuan Feng mem_addr_update := false.B 313d0de7e4aSpeixiaokun s_hptw_req := true.B 314d0de7e4aSpeixiaokun w_hptw_resp := true.B 315d0de7e4aSpeixiaokun s_last_hptw_req := true.B 316d0de7e4aSpeixiaokun w_last_hptw_resp := true.B 31744b79566SXiaokun-Pei } 31844b79566SXiaokun-Pei 31944b79566SXiaokun-Pei 32044b79566SXiaokun-Pei XSDebug(p"[ptw] level:${level} notFound:${pageFault}\n") 3216d5ddbceSLemover 3226d5ddbceSLemover // perf 323935edac4STang Haojin XSPerfAccumulate("fsm_count", io.req.fire) 3246d5ddbceSLemover for (i <- 0 until PtwWidth) { 325935edac4STang Haojin XSPerfAccumulate(s"fsm_count_source${i}", io.req.fire && io.req.bits.req_info.source === i.U) 3266d5ddbceSLemover } 32744b79566SXiaokun-Pei XSPerfAccumulate("fsm_busy", !idle) 32844b79566SXiaokun-Pei XSPerfAccumulate("fsm_idle", idle) 3296d5ddbceSLemover XSPerfAccumulate("resp_blocked", io.resp.valid && !io.resp.ready) 330dd7fe201SHaoyuan Feng XSPerfAccumulate("ptw_ppn_af", io.resp.fire && ppn_af) 331935edac4STang Haojin XSPerfAccumulate("mem_count", mem.req.fire) 332935edac4STang Haojin XSPerfAccumulate("mem_cycle", BoolStopWatch(mem.req.fire, mem.resp.fire, true)) 3336d5ddbceSLemover XSPerfAccumulate("mem_blocked", mem.req.valid && !mem.req.ready) 334cc5a5f22SLemover 33544b79566SXiaokun-Pei TimeOutAssert(!idle, timeOutThreshold, "page table walker time out") 336cd365d4cSrvcoresjw 337cd365d4cSrvcoresjw val perfEvents = Seq( 338935edac4STang Haojin ("fsm_count ", io.req.fire ), 33944b79566SXiaokun-Pei ("fsm_busy ", !idle ), 34044b79566SXiaokun-Pei ("fsm_idle ", idle ), 341cd365d4cSrvcoresjw ("resp_blocked ", io.resp.valid && !io.resp.ready ), 342935edac4STang Haojin ("mem_count ", mem.req.fire ), 343935edac4STang Haojin ("mem_cycle ", BoolStopWatch(mem.req.fire, mem.resp.fire, true)), 344cd365d4cSrvcoresjw ("mem_blocked ", mem.req.valid && !mem.req.ready ), 345cd365d4cSrvcoresjw ) 3461ca0e4f3SYinan Xu generatePerfEvent() 3476d5ddbceSLemover} 34892e3bfefSLemover 34992e3bfefSLemover/*========================= LLPTW ==============================*/ 35092e3bfefSLemover 35192e3bfefSLemover/** LLPTW : Last Level Page Table Walker 35292e3bfefSLemover * the page walker that only takes 4KB(last level) page walk. 35392e3bfefSLemover **/ 35492e3bfefSLemover 35592e3bfefSLemoverclass LLPTWInBundle(implicit p: Parameters) extends XSBundle with HasPtwConst { 35692e3bfefSLemover val req_info = Output(new L2TlbInnerBundle()) 357d61cd5eeSpeixiaokun val ppn = Output(if(HasHExtension) UInt((vpnLen.max(ppnLen)).W) else UInt(ppnLen.W)) 35892e3bfefSLemover} 35992e3bfefSLemover 36092e3bfefSLemoverclass LLPTWIO(implicit p: Parameters) extends MMUIOBaseBundle with HasPtwConst { 36192e3bfefSLemover val in = Flipped(DecoupledIO(new LLPTWInBundle())) 36292e3bfefSLemover val out = DecoupledIO(new Bundle { 36392e3bfefSLemover val req_info = Output(new L2TlbInnerBundle()) 36492e3bfefSLemover val id = Output(UInt(bMemID.W)) 365d0de7e4aSpeixiaokun val h_resp = Output(new HptwResp) 36692e3bfefSLemover val af = Output(Bool()) 36792e3bfefSLemover }) 36892e3bfefSLemover val mem = new Bundle { 36992e3bfefSLemover val req = DecoupledIO(new L2TlbMemReqBundle()) 37092e3bfefSLemover val resp = Flipped(Valid(new Bundle { 37192e3bfefSLemover val id = Output(UInt(log2Up(l2tlbParams.llptwsize).W)) 372dc05c713Speixiaokun val value = Output(UInt(XLEN.W)) 37392e3bfefSLemover })) 37492e3bfefSLemover val enq_ptr = Output(UInt(log2Ceil(l2tlbParams.llptwsize).W)) 37592e3bfefSLemover val buffer_it = Output(Vec(l2tlbParams.llptwsize, Bool())) 37692e3bfefSLemover val refill = Output(new L2TlbInnerBundle()) 37792e3bfefSLemover val req_mask = Input(Vec(l2tlbParams.llptwsize, Bool())) 37892e3bfefSLemover } 3797797f035SbugGenerator val cache = DecoupledIO(new L2TlbInnerBundle()) 38092e3bfefSLemover val pmp = new Bundle { 38192e3bfefSLemover val req = Valid(new PMPReqBundle()) 38292e3bfefSLemover val resp = Flipped(new PMPRespBundle()) 38392e3bfefSLemover } 384d0de7e4aSpeixiaokun val hptw = new Bundle { 385d0de7e4aSpeixiaokun val req = DecoupledIO(new Bundle{ 386eb4bf3f2Speixiaokun val source = UInt(bSourceWidth.W) 387d0de7e4aSpeixiaokun val id = UInt(log2Up(l2tlbParams.llptwsize).W) 38882978df9Speixiaokun val gvpn = UInt(vpnLen.W) 389d0de7e4aSpeixiaokun }) 390d0de7e4aSpeixiaokun val resp = Flipped(Valid(new Bundle { 391d0de7e4aSpeixiaokun val id = Output(UInt(log2Up(l2tlbParams.llptwsize).W)) 392d0de7e4aSpeixiaokun val h_resp = Output(new HptwResp) 393d0de7e4aSpeixiaokun })) 394d0de7e4aSpeixiaokun } 39592e3bfefSLemover} 39692e3bfefSLemover 39792e3bfefSLemoverclass LLPTWEntry(implicit p: Parameters) extends XSBundle with HasPtwConst { 39892e3bfefSLemover val req_info = new L2TlbInnerBundle() 399d0de7e4aSpeixiaokun val s2xlate = Bool() 40092e3bfefSLemover val ppn = UInt(ppnLen.W) 40192e3bfefSLemover val wait_id = UInt(log2Up(l2tlbParams.llptwsize).W) 40292e3bfefSLemover val af = Bool() 403dc05c713Speixiaokun val hptw_resp = new HptwResp() 40492e3bfefSLemover} 40592e3bfefSLemover 40692e3bfefSLemover 40792e3bfefSLemoverclass LLPTW(implicit p: Parameters) extends XSModule with HasPtwConst with HasPerfEvents { 40892e3bfefSLemover val io = IO(new LLPTWIO()) 40982978df9Speixiaokun val enableS2xlate = io.in.bits.req_info.s2xlate =/= noS2xlate 410d0de7e4aSpeixiaokun val satp = Mux(enableS2xlate, io.csr.vsatp, io.csr.satp) 41192e3bfefSLemover 412d0de7e4aSpeixiaokun val flush = io.sfence.valid || satp.changed 41392e3bfefSLemover val entries = Reg(Vec(l2tlbParams.llptwsize, new LLPTWEntry())) 414d0de7e4aSpeixiaokun val state_idle :: state_hptw_req :: state_hptw_resp :: state_addr_check :: state_mem_req :: state_mem_waiting :: state_mem_out :: state_last_hptw_req :: state_last_hptw_resp :: state_cache :: Nil = Enum(10) 41592e3bfefSLemover val state = RegInit(VecInit(Seq.fill(l2tlbParams.llptwsize)(state_idle))) 4167797f035SbugGenerator 41792e3bfefSLemover val is_emptys = state.map(_ === state_idle) 41892e3bfefSLemover val is_mems = state.map(_ === state_mem_req) 41992e3bfefSLemover val is_waiting = state.map(_ === state_mem_waiting) 42092e3bfefSLemover val is_having = state.map(_ === state_mem_out) 4217797f035SbugGenerator val is_cache = state.map(_ === state_cache) 422d0de7e4aSpeixiaokun val is_hptw_req = state.map(_ === state_hptw_req) 423d0de7e4aSpeixiaokun val is_last_hptw_req = state.map(_ === state_last_hptw_req) 42492e3bfefSLemover 425935edac4STang Haojin val full = !ParallelOR(is_emptys).asBool 42692e3bfefSLemover val enq_ptr = ParallelPriorityEncoder(is_emptys) 42792e3bfefSLemover 4287797f035SbugGenerator val mem_ptr = ParallelPriorityEncoder(is_having) // TODO: optimize timing, bad: entries -> ptr -> entry 42992e3bfefSLemover val mem_arb = Module(new RRArbiter(new LLPTWEntry(), l2tlbParams.llptwsize)) 43092e3bfefSLemover for (i <- 0 until l2tlbParams.llptwsize) { 43192e3bfefSLemover mem_arb.io.in(i).bits := entries(i) 43292e3bfefSLemover mem_arb.io.in(i).valid := is_mems(i) && !io.mem.req_mask(i) 43392e3bfefSLemover } 434d0de7e4aSpeixiaokun val hyper_arb1 = Module(new RRArbiter(new LLPTWEntry(), l2tlbParams.llptwsize)) 435d0de7e4aSpeixiaokun for (i <- 0 until l2tlbParams.llptwsize) { 436d0de7e4aSpeixiaokun hyper_arb1.io.in(i).bits := entries(i) 437d0de7e4aSpeixiaokun hyper_arb1.io.in(i).valid := is_hptw_req(i) 438d0de7e4aSpeixiaokun } 439d0de7e4aSpeixiaokun val hyper_arb2 = Module(new RRArbiter(new LLPTWEntry(), l2tlbParams.llptwsize)) 440d0de7e4aSpeixiaokun for(i <- 0 until l2tlbParams.llptwsize) { 441d0de7e4aSpeixiaokun hyper_arb2.io.in(i).bits := entries(i) 442d0de7e4aSpeixiaokun hyper_arb2.io.in(i).valid := is_last_hptw_req(i) 443d0de7e4aSpeixiaokun } 44492e3bfefSLemover 445f3034303SHaoyuan Feng val cache_ptr = ParallelMux(is_cache, (0 until l2tlbParams.llptwsize).map(_.U(log2Up(l2tlbParams.llptwsize).W))) 4467797f035SbugGenerator 44792e3bfefSLemover // duplicate req 44892e3bfefSLemover // to_wait: wait for the last to access mem, set to mem_resp 44992e3bfefSLemover // to_cache: the last is back just right now, set to mem_cache 45092e3bfefSLemover val dup_vec = state.indices.map(i => 451cca17e78Speixiaokun dup(io.in.bits.req_info.vpn, entries(i).req_info.vpn) && io.in.bits.req_info.s2xlate === entries(i).req_info.s2xlate 45292e3bfefSLemover ) 453cca17e78Speixiaokun val dup_req_fire = mem_arb.io.out.fire && dup(io.in.bits.req_info.vpn, mem_arb.io.out.bits.req_info.vpn) && io.in.bits.req_info.s2xlate === mem_arb.io.out.bits.req_info.s2xlate // dup with the req fire entry 45492e3bfefSLemover val dup_vec_wait = dup_vec.zip(is_waiting).map{case (d, w) => d && w} // dup with "mem_waiting" entres, sending mem req already 45592e3bfefSLemover val dup_vec_having = dup_vec.zipWithIndex.map{case (d, i) => d && is_having(i)} // dup with the "mem_out" entry recv the data just now 45692e3bfefSLemover val wait_id = Mux(dup_req_fire, mem_arb.io.chosen, ParallelMux(dup_vec_wait zip entries.map(_.wait_id))) 457935edac4STang Haojin val dup_wait_resp = io.mem.resp.fire && VecInit(dup_vec_wait)(io.mem.resp.bits.id) // dup with the entry that data coming next cycle 45892e3bfefSLemover val to_wait = Cat(dup_vec_wait).orR || dup_req_fire 45992e3bfefSLemover val to_mem_out = dup_wait_resp 4607797f035SbugGenerator val to_cache = Cat(dup_vec_having).orR 4617274ec5cSpeixiaokun val to_hptw = io.in.bits.req_info.s2xlate =/= noS2xlate 4627797f035SbugGenerator XSError(RegNext(dup_req_fire && Cat(dup_vec_wait).orR, init = false.B), "mem req but some entries already waiting, should not happed") 46392e3bfefSLemover 464935edac4STang Haojin XSError(io.in.fire && ((to_mem_out && to_cache) || (to_wait && to_cache)), "llptw enq, to cache conflict with to mem") 46592e3bfefSLemover val mem_resp_hit = RegInit(VecInit(Seq.fill(l2tlbParams.llptwsize)(false.B))) 4667274ec5cSpeixiaokun val enq_state_normal = MuxCase(state_addr_check, Seq( 4677274ec5cSpeixiaokun to_mem_out -> state_mem_out, // same to the blew, but the mem resp now 4687274ec5cSpeixiaokun to_wait -> state_mem_waiting, 4697274ec5cSpeixiaokun to_cache -> state_cache, 4707274ec5cSpeixiaokun to_hptw -> state_hptw_req 4717274ec5cSpeixiaokun )) 4727797f035SbugGenerator val enq_state = Mux(from_pre(io.in.bits.req_info.source) && enq_state_normal =/= state_addr_check, state_idle, enq_state_normal) 473935edac4STang Haojin when (io.in.fire) { 47492e3bfefSLemover // if prefetch req does not need mem access, just give it up. 47592e3bfefSLemover // so there will be at most 1 + FilterSize entries that needs re-access page cache 47692e3bfefSLemover // so 2 + FilterSize is enough to avoid dead-lock 4777797f035SbugGenerator state(enq_ptr) := enq_state 47892e3bfefSLemover entries(enq_ptr).req_info := io.in.bits.req_info 47992e3bfefSLemover entries(enq_ptr).ppn := io.in.bits.ppn 48092e3bfefSLemover entries(enq_ptr).wait_id := Mux(to_wait, wait_id, enq_ptr) 48192e3bfefSLemover entries(enq_ptr).af := false.B 482d0de7e4aSpeixiaokun entries(enq_ptr).s2xlate := enableS2xlate 48392e3bfefSLemover mem_resp_hit(enq_ptr) := to_mem_out 48492e3bfefSLemover } 4857797f035SbugGenerator 4867797f035SbugGenerator val enq_ptr_reg = RegNext(enq_ptr) 4877274ec5cSpeixiaokun val need_addr_check = RegNext(enq_state === state_addr_check && io.in.fire() && !flush) 4887274ec5cSpeixiaokun 4897274ec5cSpeixiaokun val hasHptwResp = ParallelOR(state.map(_ === state_hptw_resp)).asBool() 4907274ec5cSpeixiaokun val hptw_resp_ptr_reg = RegNext(io.hptw.resp.bits.id) 4917274ec5cSpeixiaokun val hptw_need_addr_check = RegNext(hasHptwResp && io.hptw.resp.fire() && !flush) 492d0de7e4aSpeixiaokun 493b24e0a78Speixiaokun val gpaddr = MakeGPAddr(io.in.bits.ppn, getVpnn(io.in.bits.req_info.vpn, 0)) 4947274ec5cSpeixiaokun val hptw_resp = io.hptw.resp.bits.h_resp 4957274ec5cSpeixiaokun val hpaddr = Cat(hptw_resp.genPPNS2(), get_off(gpaddr)) 4967274ec5cSpeixiaokun val hpaddr_reg = RegEnable(hpaddr, hasHptwResp && io.hptw.resp.fire()) 4977274ec5cSpeixiaokun val addr = MakeAddr(io.in.bits.ppn, getVpnn(io.in.bits.req_info.vpn, 0)) 4987274ec5cSpeixiaokun val addr_reg = RegEnable(addr, io.in.fire()) 4997274ec5cSpeixiaokun io.pmp.req.valid := need_addr_check || hptw_need_addr_check 5007274ec5cSpeixiaokun io.pmp.req.bits.addr := Mux(enableS2xlate, hpaddr, addr) 5017797f035SbugGenerator io.pmp.req.bits.cmd := TlbCmd.read 5027797f035SbugGenerator io.pmp.req.bits.size := 3.U // TODO: fix it 5037797f035SbugGenerator val pmp_resp_valid = io.pmp.req.valid // same cycle 5047797f035SbugGenerator when (pmp_resp_valid) { 5057797f035SbugGenerator // NOTE: when pmp resp but state is not addr check, then the entry is dup with other entry, the state was changed before 5067797f035SbugGenerator // when dup with the req-ing entry, set to mem_waiting (above codes), and the ld must be false, so dontcare 5077274ec5cSpeixiaokun val ptr = Mux(hptw_need_addr_check, hptw_resp_ptr_reg, enq_ptr_reg); 5087797f035SbugGenerator val accessFault = io.pmp.resp.ld || io.pmp.resp.mmio 5097274ec5cSpeixiaokun entries(ptr).af := accessFault 5107274ec5cSpeixiaokun state(ptr) := Mux(accessFault, state_mem_out, state_mem_req) 5117797f035SbugGenerator } 5127797f035SbugGenerator 513935edac4STang Haojin when (mem_arb.io.out.fire) { 51492e3bfefSLemover for (i <- state.indices) { 51592e3bfefSLemover when (state(i) =/= state_idle && dup(entries(i).req_info.vpn, mem_arb.io.out.bits.req_info.vpn)) { 51692e3bfefSLemover // NOTE: "dup enq set state to mem_wait" -> "sending req set other dup entries to mem_wait" 51792e3bfefSLemover state(i) := state_mem_waiting 51892e3bfefSLemover entries(i).wait_id := mem_arb.io.chosen 51992e3bfefSLemover } 52092e3bfefSLemover } 52192e3bfefSLemover } 522935edac4STang Haojin when (io.mem.resp.fire) { 52392e3bfefSLemover state.indices.map{i => 52492e3bfefSLemover when (state(i) === state_mem_waiting && io.mem.resp.bits.id === entries(i).wait_id) { 525d0de7e4aSpeixiaokun state(i) := Mux(entries(i).s2xlate, state_last_hptw_req, state_mem_out) 52692e3bfefSLemover mem_resp_hit(i) := true.B 52792e3bfefSLemover } 52892e3bfefSLemover } 52992e3bfefSLemover } 530d0de7e4aSpeixiaokun 531d0de7e4aSpeixiaokun when (hyper_arb1.io.out.fire()) { 532d0de7e4aSpeixiaokun for (i <- state.indices) { 533d0de7e4aSpeixiaokun when (state(i) === state_hptw_req && entries(i).ppn === hyper_arb1.io.out.bits.ppn && entries(i).s2xlate) { 534d0de7e4aSpeixiaokun state(i) := state_hptw_resp 535d0de7e4aSpeixiaokun entries(i).wait_id := hyper_arb1.io.chosen 536d0de7e4aSpeixiaokun } 537d0de7e4aSpeixiaokun } 538d0de7e4aSpeixiaokun } 539d0de7e4aSpeixiaokun 540d0de7e4aSpeixiaokun when (hyper_arb2.io.out.fire()) { 541d0de7e4aSpeixiaokun for (i <- state.indices) { 542d0de7e4aSpeixiaokun when (state(i) === state_last_hptw_req && entries(i).ppn === hyper_arb2.io.out.bits.ppn && entries(i).s2xlate) { 543d0de7e4aSpeixiaokun state(i) := state_last_hptw_resp 544d0de7e4aSpeixiaokun entries(i).wait_id := hyper_arb2.io.chosen 545d0de7e4aSpeixiaokun } 546d0de7e4aSpeixiaokun } 547d0de7e4aSpeixiaokun } 548d0de7e4aSpeixiaokun 549d0de7e4aSpeixiaokun when (io.hptw.resp.fire()) { 550d0de7e4aSpeixiaokun for (i <- state.indices) { 551d0de7e4aSpeixiaokun when (state(i) === state_hptw_resp && io.hptw.resp.bits.id === entries(i).wait_id) { 552d0de7e4aSpeixiaokun state(i) := state_addr_check 553dc05c713Speixiaokun entries(i).hptw_resp := io.hptw.resp.bits.h_resp 554d0de7e4aSpeixiaokun } 555d0de7e4aSpeixiaokun when (state(i) === state_last_hptw_resp && io.hptw.resp.bits.id === entries(i).wait_id) { 556d0de7e4aSpeixiaokun state(i) := state_mem_out 557dc05c713Speixiaokun entries(i).hptw_resp := io.hptw.resp.bits.h_resp 558d0de7e4aSpeixiaokun } 559d0de7e4aSpeixiaokun } 560d0de7e4aSpeixiaokun } 561d0de7e4aSpeixiaokun 562935edac4STang Haojin when (io.out.fire) { 56392e3bfefSLemover assert(state(mem_ptr) === state_mem_out) 56492e3bfefSLemover state(mem_ptr) := state_idle 56592e3bfefSLemover } 56692e3bfefSLemover mem_resp_hit.map(a => when (a) { a := false.B } ) 56792e3bfefSLemover 5687797f035SbugGenerator when (io.cache.fire) { 5697797f035SbugGenerator state(cache_ptr) := state_idle 57092e3bfefSLemover } 5717797f035SbugGenerator XSError(io.out.fire && io.cache.fire && (mem_ptr === cache_ptr), "mem resp and cache fire at the same time at same entry") 57292e3bfefSLemover 57392e3bfefSLemover when (flush) { 57492e3bfefSLemover state.map(_ := state_idle) 57592e3bfefSLemover } 57692e3bfefSLemover 57792e3bfefSLemover io.in.ready := !full 57892e3bfefSLemover 579935edac4STang Haojin io.out.valid := ParallelOR(is_having).asBool 58092e3bfefSLemover io.out.bits.req_info := entries(mem_ptr).req_info 58192e3bfefSLemover io.out.bits.id := mem_ptr 58292e3bfefSLemover io.out.bits.af := entries(mem_ptr).af 583dc05c713Speixiaokun io.out.bits.h_resp := entries(mem_ptr).hptw_resp 584d0de7e4aSpeixiaokun 585dc05c713Speixiaokun val pte = io.mem.resp.bits.value.asTypeOf(new PteBundle().cloneType) 586dc05c713Speixiaokun val hptw_req_gvpn_1 = hyper_arb1.io.out.bits.ppn // first stage 2 translation 587dc05c713Speixiaokun val hptw_req_gvpn_2 = pte.ppn // last stage 2 translation 588d0de7e4aSpeixiaokun io.hptw.req.valid := (hyper_arb1.io.out.valid || hyper_arb2.io.out.valid) && !flush 589dc05c713Speixiaokun io.hptw.req.bits.gvpn := Mux(hyper_arb1.io.out.valid, hptw_req_gvpn_1, hptw_req_gvpn_2) 590d0de7e4aSpeixiaokun io.hptw.req.bits.id := Mux(hyper_arb1.io.out.valid, hyper_arb1.io.chosen, hyper_arb2.io.chosen) 591eb4bf3f2Speixiaokun io.hptw.req.bits.source := Mux(hyper_arb1.io.out.valid, hyper_arb1.io.out.bits.req_info.source, hyper_arb2.io.out.bits.req_info.source) 592d0de7e4aSpeixiaokun hyper_arb1.io.out.ready := io.hptw.req.ready 593d0de7e4aSpeixiaokun hyper_arb2.io.out.ready := io.hptw.req.ready 59492e3bfefSLemover 59592e3bfefSLemover io.mem.req.valid := mem_arb.io.out.valid && !flush 596dc05c713Speixiaokun val mem_paddr = MakeAddr(mem_arb.io.out.bits.ppn, getVpnn(mem_arb.io.out.bits.req_info.vpn, 0)) 597dc05c713Speixiaokun val mem_hpaddr = MakeAddr(mem_arb.io.out.bits.hptw_resp.genPPNS2(), getVpnn(mem_arb.io.out.bits.req_info.vpn, 0)) 598dc05c713Speixiaokun io.mem.req.bits.addr := Mux(mem_arb.io.out.bits.s2xlate, mem_hpaddr, mem_paddr) 59992e3bfefSLemover io.mem.req.bits.id := mem_arb.io.chosen 60092e3bfefSLemover mem_arb.io.out.ready := io.mem.req.ready 60192e3bfefSLemover io.mem.refill := entries(RegNext(io.mem.resp.bits.id(log2Up(l2tlbParams.llptwsize)-1, 0))).req_info 60292e3bfefSLemover io.mem.buffer_it := mem_resp_hit 60392e3bfefSLemover io.mem.enq_ptr := enq_ptr 60492e3bfefSLemover 6057797f035SbugGenerator io.cache.valid := Cat(is_cache).orR 6067797f035SbugGenerator io.cache.bits := ParallelMux(is_cache, entries.map(_.req_info)) 6077797f035SbugGenerator 608935edac4STang Haojin XSPerfAccumulate("llptw_in_count", io.in.fire) 60992e3bfefSLemover XSPerfAccumulate("llptw_in_block", io.in.valid && !io.in.ready) 61092e3bfefSLemover for (i <- 0 until 7) { 611935edac4STang Haojin XSPerfAccumulate(s"enq_state${i}", io.in.fire && enq_state === i.U) 61292e3bfefSLemover } 61392e3bfefSLemover for (i <- 0 until (l2tlbParams.llptwsize + 1)) { 61492e3bfefSLemover XSPerfAccumulate(s"util${i}", PopCount(is_emptys.map(!_)) === i.U) 61592e3bfefSLemover XSPerfAccumulate(s"mem_util${i}", PopCount(is_mems) === i.U) 61692e3bfefSLemover XSPerfAccumulate(s"waiting_util${i}", PopCount(is_waiting) === i.U) 61792e3bfefSLemover } 618935edac4STang Haojin XSPerfAccumulate("mem_count", io.mem.req.fire) 61992e3bfefSLemover XSPerfAccumulate("mem_cycle", PopCount(is_waiting) =/= 0.U) 62092e3bfefSLemover XSPerfAccumulate("blocked_in", io.in.valid && !io.in.ready) 62192e3bfefSLemover 62292e3bfefSLemover for (i <- 0 until l2tlbParams.llptwsize) { 62392e3bfefSLemover TimeOutAssert(state(i) =/= state_idle, timeOutThreshold, s"missqueue time out no out ${i}") 62492e3bfefSLemover } 62592e3bfefSLemover 62692e3bfefSLemover val perfEvents = Seq( 627935edac4STang Haojin ("tlbllptw_incount ", io.in.fire ), 62892e3bfefSLemover ("tlbllptw_inblock ", io.in.valid && !io.in.ready), 629935edac4STang Haojin ("tlbllptw_memcount ", io.mem.req.fire ), 63092e3bfefSLemover ("tlbllptw_memcycle ", PopCount(is_waiting) ), 63192e3bfefSLemover ) 63292e3bfefSLemover generatePerfEvent() 63392e3bfefSLemover} 634d0de7e4aSpeixiaokun 635d0de7e4aSpeixiaokun/*========================= HPTW ==============================*/ 636d0de7e4aSpeixiaokun 637d0de7e4aSpeixiaokun/** HPTW : Hypervisor Page Table Walker 638d0de7e4aSpeixiaokun * the page walker take the virtual machine's page walk. 639d0de7e4aSpeixiaokun * guest physical address translation, guest physical address -> host physical address 640d0de7e4aSpeixiaokun **/ 641d0de7e4aSpeixiaokunclass HPTWIO()(implicit p: Parameters) extends MMUIOBaseBundle with HasPtwConst { 642d0de7e4aSpeixiaokun val req = Flipped(DecoupledIO(new Bundle { 643eb4bf3f2Speixiaokun val source = UInt(bSourceWidth.W) 644d0de7e4aSpeixiaokun val id = UInt(log2Up(l2tlbParams.llptwsize).W) 64582978df9Speixiaokun val gvpn = UInt(vpnLen.W) 6466315ba2aSpeixiaokun val ppn = UInt(ppnLen.W) 647d0de7e4aSpeixiaokun val l1Hit = Bool() 648d0de7e4aSpeixiaokun val l2Hit = Bool() 649d0de7e4aSpeixiaokun })) 650d0de7e4aSpeixiaokun val resp = Valid(new Bundle { 651eb4bf3f2Speixiaokun val source = UInt(bSourceWidth.W) 652d0de7e4aSpeixiaokun val resp = Output(new HptwResp()) 653d0de7e4aSpeixiaokun val id = Output(UInt(bMemID.W)) 654d0de7e4aSpeixiaokun }) 655d0de7e4aSpeixiaokun 656d0de7e4aSpeixiaokun val mem = new Bundle { 657d0de7e4aSpeixiaokun val req = DecoupledIO(new L2TlbMemReqBundle()) 658d0de7e4aSpeixiaokun val resp = Flipped(ValidIO(UInt(XLEN.W))) 659d0de7e4aSpeixiaokun val mask = Input(Bool()) 660d0de7e4aSpeixiaokun } 661d0de7e4aSpeixiaokun val refill = Output(new Bundle { 662d0de7e4aSpeixiaokun val req_info = new L2TlbInnerBundle() 663d0de7e4aSpeixiaokun val level = UInt(log2Up(Level).W) 664d0de7e4aSpeixiaokun }) 665d0de7e4aSpeixiaokun val pmp = new Bundle { 666d0de7e4aSpeixiaokun val req = ValidIO(new PMPReqBundle()) 667d0de7e4aSpeixiaokun val resp = Flipped(new PMPRespBundle()) 668d0de7e4aSpeixiaokun } 669d0de7e4aSpeixiaokun} 670d0de7e4aSpeixiaokun 671d0de7e4aSpeixiaokun@chiselName 672d0de7e4aSpeixiaokunclass HPTW()(implicit p: Parameters) extends XSModule with HasPtwConst { 673d0de7e4aSpeixiaokun val io = IO(new HPTWIO) 674d0de7e4aSpeixiaokun val hgatp = io.csr.hgatp 675d0de7e4aSpeixiaokun val sfence = io.sfence 676d0de7e4aSpeixiaokun val flush = sfence.valid || hgatp.changed 677d0de7e4aSpeixiaokun 678d0de7e4aSpeixiaokun val level = RegInit(0.U(log2Up(Level).W)) 679d0de7e4aSpeixiaokun val gpaddr = Reg(UInt(GPAddrBits.W)) 680d0de7e4aSpeixiaokun val vpn = gpaddr(GPAddrBits-1, offLen) 681d0de7e4aSpeixiaokun val levelNext = level + 1.U 682d0de7e4aSpeixiaokun val l1Hit = Reg(Bool()) 683d0de7e4aSpeixiaokun val l2Hit = Reg(Bool()) 684b24e0a78Speixiaokun val pg_base = MakeGPAddr(hgatp.ppn, getGVpnn(vpn, 2.U)) // for l0 685d0de7e4aSpeixiaokun// val pte = io.mem.resp.bits.MergeRespToPte() 686d0de7e4aSpeixiaokun val pte = io.mem.resp.bits.asTypeOf(new PteBundle().cloneType) 6876315ba2aSpeixiaokun val ppn_l1 = Mux(l1Hit, io.req.bits.ppn, pte.ppn) 6886315ba2aSpeixiaokun val ppn_l2 = Mux(l2Hit, io.req.bits.ppn, pte.ppn) 6896315ba2aSpeixiaokun val ppn = Mux(level === 1.U, ppn_l1, ppn_l2) //for l1 and l2 6906315ba2aSpeixiaokun val p_pte = MakeAddr(ppn, getVpnn(vpn, 2.U - level)) 691d0de7e4aSpeixiaokun val mem_addr = Mux(level === 0.U, pg_base, p_pte) 692d0de7e4aSpeixiaokun 693d0de7e4aSpeixiaokun //s/w register 694d0de7e4aSpeixiaokun val s_pmp_check = RegInit(true.B) 695d0de7e4aSpeixiaokun val s_mem_req = RegInit(true.B) 696d0de7e4aSpeixiaokun val w_mem_resp = RegInit(true.B) 697d0de7e4aSpeixiaokun val idle = RegInit(true.B) 69803c1129fSpeixiaokun val mem_addr_update = RegInit(false.B) 699d0de7e4aSpeixiaokun val finish = WireInit(false.B) 700d0de7e4aSpeixiaokun 701d0de7e4aSpeixiaokun val sent_to_pmp = !idle && (!s_pmp_check || mem_addr_update) && !finish 702d0de7e4aSpeixiaokun val pageFault = pte.isPf(level) 703d0de7e4aSpeixiaokun val accessFault = RegEnable(io.pmp.resp.ld || io.pmp.resp.mmio, sent_to_pmp) 704d0de7e4aSpeixiaokun 705d0de7e4aSpeixiaokun val ppn_af = pte.isAf() 706d0de7e4aSpeixiaokun val find_pte = pte.isLeaf() || ppn_af || pageFault 707d0de7e4aSpeixiaokun 708d0de7e4aSpeixiaokun val resp_valid = !idle && mem_addr_update && ((w_mem_resp && find_pte) || (s_pmp_check && accessFault)) 709d0de7e4aSpeixiaokun val id = Reg(UInt(log2Up(l2tlbParams.llptwsize).W)) 710eb4bf3f2Speixiaokun val source = RegEnable(io.req.bits.source, io.req.fire()) 711eb4bf3f2Speixiaokun 712d0de7e4aSpeixiaokun io.req.ready := idle 713eb4bf3f2Speixiaokun val resp = Wire(new HptwResp()) 714d0de7e4aSpeixiaokun resp.apply(pageFault && !accessFault && !ppn_af, accessFault || ppn_af, level, pte, vpn, hgatp.asid) 715d0de7e4aSpeixiaokun io.resp.valid := resp_valid 716d0de7e4aSpeixiaokun io.resp.bits.id := id 717d0de7e4aSpeixiaokun io.resp.bits.resp := resp 718eb4bf3f2Speixiaokun io.resp.bits.source := source 719d0de7e4aSpeixiaokun 720d0de7e4aSpeixiaokun io.pmp.req.valid := DontCare 721d0de7e4aSpeixiaokun io.pmp.req.bits.addr := mem_addr 722d0de7e4aSpeixiaokun io.pmp.req.bits.size := 3.U 723d0de7e4aSpeixiaokun io.pmp.req.bits.cmd := TlbCmd.read 724d0de7e4aSpeixiaokun 725d0de7e4aSpeixiaokun io.mem.req.valid := !s_mem_req && !io.mem.mask && !accessFault && s_pmp_check 726d0de7e4aSpeixiaokun io.mem.req.bits.addr := mem_addr 727d0de7e4aSpeixiaokun io.mem.req.bits.id := HptwReqId.U(bMemID.W) 728d0de7e4aSpeixiaokun 72982978df9Speixiaokun io.refill.req_info.vpn := vpn 730d0de7e4aSpeixiaokun io.refill.level := level 731eb4bf3f2Speixiaokun io.refill.req_info.source := source 732eb4bf3f2Speixiaokun io.refill.req_info.s2xlate := onlyStage2 733d0de7e4aSpeixiaokun when (idle){ 734d0de7e4aSpeixiaokun when(io.req.fire()){ 735d0de7e4aSpeixiaokun level := Mux(io.req.bits.l2Hit, 2.U, Mux(io.req.bits.l1Hit, 1.U, 0.U)) 736d0de7e4aSpeixiaokun idle := false.B 737d0de7e4aSpeixiaokun gpaddr := Cat(io.req.bits.gvpn, 0.U(offLen.W)) 738d0de7e4aSpeixiaokun accessFault := false.B 739d0de7e4aSpeixiaokun s_pmp_check := false.B 740d0de7e4aSpeixiaokun id := io.req.bits.id 741d0de7e4aSpeixiaokun l1Hit := io.req.bits.l1Hit 742d0de7e4aSpeixiaokun l2Hit := io.req.bits.l2Hit 743d0de7e4aSpeixiaokun } 744d0de7e4aSpeixiaokun } 745d0de7e4aSpeixiaokun 746d0de7e4aSpeixiaokun when(sent_to_pmp && !mem_addr_update){ 747d0de7e4aSpeixiaokun s_mem_req := false.B 748d0de7e4aSpeixiaokun s_pmp_check := true.B 749d0de7e4aSpeixiaokun } 750d0de7e4aSpeixiaokun 751d0de7e4aSpeixiaokun when(accessFault && !idle){ 752d0de7e4aSpeixiaokun s_pmp_check := true.B 753d0de7e4aSpeixiaokun s_mem_req := true.B 754d0de7e4aSpeixiaokun w_mem_resp := true.B 755d0de7e4aSpeixiaokun mem_addr_update := true.B 756d0de7e4aSpeixiaokun } 757d0de7e4aSpeixiaokun 758d0de7e4aSpeixiaokun when(io.mem.req.fire()){ 759d0de7e4aSpeixiaokun s_mem_req := true.B 760d0de7e4aSpeixiaokun w_mem_resp := false.B 761d0de7e4aSpeixiaokun } 762d0de7e4aSpeixiaokun 763d0de7e4aSpeixiaokun when(io.mem.resp.fire() && !w_mem_resp){ 764d0de7e4aSpeixiaokun w_mem_resp := true.B 765d0de7e4aSpeixiaokun mem_addr_update := true.B 766d0de7e4aSpeixiaokun } 767d0de7e4aSpeixiaokun 768d0de7e4aSpeixiaokun when(mem_addr_update){ 769d0de7e4aSpeixiaokun when(!(find_pte || accessFault)){ 770d0de7e4aSpeixiaokun level := levelNext 771d0de7e4aSpeixiaokun s_mem_req := false.B 772d0de7e4aSpeixiaokun mem_addr_update := false.B 773d0de7e4aSpeixiaokun }.elsewhen(resp_valid){ 774d0de7e4aSpeixiaokun when(io.resp.fire()){ 775d0de7e4aSpeixiaokun idle := true.B 776d0de7e4aSpeixiaokun mem_addr_update := false.B 777d0de7e4aSpeixiaokun accessFault := false.B 778d0de7e4aSpeixiaokun } 779d0de7e4aSpeixiaokun finish := true.B 780d0de7e4aSpeixiaokun } 781d0de7e4aSpeixiaokun } 782d0de7e4aSpeixiaokun}