xref: /XiangShan/src/main/scala/xiangshan/cache/mmu/PageTableCache.scala (revision a1d4b4bfaad30c6cc4e94d9602e3f65b9e9899d7)
16d5ddbceSLemover/***************************************************************************************
26d5ddbceSLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
46d5ddbceSLemover*
56d5ddbceSLemover* XiangShan is licensed under Mulan PSL v2.
66d5ddbceSLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
76d5ddbceSLemover* You may obtain a copy of Mulan PSL v2 at:
86d5ddbceSLemover*          http://license.coscl.org.cn/MulanPSL2
96d5ddbceSLemover*
106d5ddbceSLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
116d5ddbceSLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
126d5ddbceSLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
136d5ddbceSLemover*
146d5ddbceSLemover* See the Mulan PSL v2 for more details.
156d5ddbceSLemover***************************************************************************************/
166d5ddbceSLemover
176d5ddbceSLemoverpackage xiangshan.cache.mmu
186d5ddbceSLemover
198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters
206d5ddbceSLemoverimport chisel3._
216d5ddbceSLemoverimport chisel3.util._
226d5ddbceSLemoverimport xiangshan._
236d5ddbceSLemoverimport xiangshan.cache.{HasDCacheParameters, MemoryOpConstants}
246d5ddbceSLemoverimport utils._
253c02ee8fSwakafaimport utility._
266d5ddbceSLemoverimport freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
276d5ddbceSLemoverimport freechips.rocketchip.tilelink._
286d5ddbceSLemover
296d5ddbceSLemover/* ptw cache caches the page table of all the three layers
306d5ddbceSLemover * ptw cache resp at next cycle
316d5ddbceSLemover * the cache should not be blocked
326d5ddbceSLemover * when miss queue if full, just block req outside
336d5ddbceSLemover */
343889e11eSLemover
353889e11eSLemoverclass PageCachePerPespBundle(implicit p: Parameters) extends PtwBundle {
363889e11eSLemover  val hit = Bool()
373889e11eSLemover  val pre = Bool()
38d61cd5eeSpeixiaokun  val ppn = if (HasHExtension) UInt((vpnLen max ppnLen).W) else UInt(ppnLen.W)
393889e11eSLemover  val perm = new PtePermBundle()
403889e11eSLemover  val ecc = Bool()
413889e11eSLemover  val level = UInt(2.W)
428d8ac704SLemover  val v = Bool()
433889e11eSLemover
443889e11eSLemover  def apply(hit: Bool, pre: Bool, ppn: UInt, perm: PtePermBundle = 0.U.asTypeOf(new PtePermBundle()),
458d8ac704SLemover            ecc: Bool = false.B, level: UInt = 0.U, valid: Bool = true.B) {
463889e11eSLemover    this.hit := hit && !ecc
473889e11eSLemover    this.pre := pre
483889e11eSLemover    this.ppn := ppn
493889e11eSLemover    this.perm := perm
503889e11eSLemover    this.ecc := ecc && hit
513889e11eSLemover    this.level := level
528d8ac704SLemover    this.v := valid
533889e11eSLemover  }
543889e11eSLemover}
553889e11eSLemover
5663632028SHaoyuan Fengclass PageCacheMergePespBundle(implicit p: Parameters) extends PtwBundle {
5763632028SHaoyuan Feng  assert(tlbcontiguous == 8, "Only support tlbcontiguous = 8!")
5863632028SHaoyuan Feng  val hit = Bool()
5963632028SHaoyuan Feng  val pre = Bool()
60d61cd5eeSpeixiaokun  val ppn = Vec(tlbcontiguous, if(HasHExtension) UInt((vpnLen max ppnLen).W) else UInt(ppnLen.W))
6163632028SHaoyuan Feng  val perm = Vec(tlbcontiguous, new PtePermBundle())
6263632028SHaoyuan Feng  val ecc = Bool()
6363632028SHaoyuan Feng  val level = UInt(2.W)
6463632028SHaoyuan Feng  val v = Vec(tlbcontiguous, Bool())
6563632028SHaoyuan Feng
6663632028SHaoyuan Feng  def apply(hit: Bool, pre: Bool, ppn: Vec[UInt], perm: Vec[PtePermBundle] = Vec(tlbcontiguous, 0.U.asTypeOf(new PtePermBundle())),
6763632028SHaoyuan Feng            ecc: Bool = false.B, level: UInt = 0.U, valid: Vec[Bool] = Vec(tlbcontiguous, true.B)) {
6863632028SHaoyuan Feng    this.hit := hit && !ecc
6963632028SHaoyuan Feng    this.pre := pre
7063632028SHaoyuan Feng    this.ppn := ppn
7163632028SHaoyuan Feng    this.perm := perm
7263632028SHaoyuan Feng    this.ecc := ecc && hit
7363632028SHaoyuan Feng    this.level := level
7463632028SHaoyuan Feng    this.v := valid
7563632028SHaoyuan Feng  }
7663632028SHaoyuan Feng}
7763632028SHaoyuan Feng
783889e11eSLemoverclass PageCacheRespBundle(implicit p: Parameters) extends PtwBundle {
793889e11eSLemover  val l1 = new PageCachePerPespBundle
803889e11eSLemover  val l2 = new PageCachePerPespBundle
8163632028SHaoyuan Feng  val l3 = new PageCacheMergePespBundle
823889e11eSLemover  val sp = new PageCachePerPespBundle
833889e11eSLemover}
843889e11eSLemover
853889e11eSLemoverclass PtwCacheReq(implicit p: Parameters) extends PtwBundle {
863889e11eSLemover  val req_info = new L2TlbInnerBundle()
873889e11eSLemover  val isFirst = Bool()
881f4a7c0cSLemover  val bypassed = Vec(3, Bool())
89d0de7e4aSpeixiaokun  val isHptw = Bool()
90d0de7e4aSpeixiaokun  val hptwId = UInt(log2Up(l2tlbParams.llptwsize).W)
913889e11eSLemover}
923889e11eSLemover
933889e11eSLemoverclass PtwCacheIO()(implicit p: Parameters) extends MMUIOBaseBundle with HasPtwConst {
943889e11eSLemover  val req = Flipped(DecoupledIO(new PtwCacheReq()))
956d5ddbceSLemover  val resp = DecoupledIO(new Bundle {
9645f497a4Shappy-lx    val req_info = new L2TlbInnerBundle()
9794133605SLemover    val isFirst = Bool()
986d5ddbceSLemover    val hit = Bool()
99bc063562SLemover    val prefetch = Bool() // is the entry fetched by prefetch
1001f4a7c0cSLemover    val bypassed = Bool()
1016d5ddbceSLemover    val toFsm = new Bundle {
1026d5ddbceSLemover      val l1Hit = Bool()
1036d5ddbceSLemover      val l2Hit = Bool()
104d61cd5eeSpeixiaokun      val ppn = if(HasHExtension) UInt((vpnLen.max(ppnLen)).W) else UInt(ppnLen.W)
10530104977Speixiaokun      val stage1Hit = Bool() // find stage 1 pte in cache, but need to search stage 2 pte in cache at PTW
1066d5ddbceSLemover    }
10763632028SHaoyuan Feng    val toTlb = new PtwMergeResp()
108d0de7e4aSpeixiaokun    val isHptw = Bool()
109d0de7e4aSpeixiaokun    val toHptw = new Bundle {
110d0de7e4aSpeixiaokun      val l1Hit = Bool()
111d0de7e4aSpeixiaokun      val l2Hit = Bool()
112d0de7e4aSpeixiaokun      val ppn = UInt(ppnLen.W)
113d0de7e4aSpeixiaokun      val id = UInt(log2Up(l2tlbParams.llptwsize).W)
114d0de7e4aSpeixiaokun      val resp = new HptwResp() // used if hit
115d0de7e4aSpeixiaokun    }
1166d5ddbceSLemover  })
1176d5ddbceSLemover  val refill = Flipped(ValidIO(new Bundle {
1185854c1edSLemover    val ptes = UInt(blockBits.W)
1197797f035SbugGenerator    val levelOH = new Bundle {
1207797f035SbugGenerator      // NOTE: levelOH has (Level+1) bits, each stands for page cache entries
1217797f035SbugGenerator      val sp = Bool()
1227797f035SbugGenerator      val l3 = Bool()
1237797f035SbugGenerator      val l2 = Bool()
1247797f035SbugGenerator      val l1 = Bool()
1257797f035SbugGenerator      def apply(levelUInt: UInt, valid: Bool) = {
1267797f035SbugGenerator        sp := RegNext((levelUInt === 0.U || levelUInt === 1.U) && valid, false.B)
1277797f035SbugGenerator        l3 := RegNext((levelUInt === 2.U) & valid, false.B)
1287797f035SbugGenerator        l2 := RegNext((levelUInt === 1.U) & valid, false.B)
1297797f035SbugGenerator        l1 := RegNext((levelUInt === 0.U) & valid, false.B)
1307797f035SbugGenerator      }
1317797f035SbugGenerator    }
1327797f035SbugGenerator    // duplicate level and sel_pte for each page caches, for better fanout
1337797f035SbugGenerator    val req_info_dup = Vec(3, new L2TlbInnerBundle())
1347797f035SbugGenerator    val level_dup = Vec(3, UInt(log2Up(Level).W))
1357797f035SbugGenerator    val sel_pte_dup = Vec(3, UInt(XLEN.W))
1366d5ddbceSLemover  }))
1377797f035SbugGenerator  val sfence_dup = Vec(4, Input(new SfenceBundle()))
1387797f035SbugGenerator  val csr_dup = Vec(3, Input(new TlbCsrBundle()))
1396d5ddbceSLemover}
1406d5ddbceSLemover
1411ca0e4f3SYinan Xuclass PtwCache()(implicit p: Parameters) extends XSModule with HasPtwConst with HasPerfEvents {
1426d5ddbceSLemover  val io = IO(new PtwCacheIO)
1437196f5a2SLemover  val ecc = Code.fromString(l2tlbParams.ecc)
1447196f5a2SLemover  val l2EntryType = new PTWEntriesWithEcc(ecc, num = PtwL2SectorSize, tagLen = PtwL2TagLen, level = 1, hasPerm = false)
1457196f5a2SLemover  val l3EntryType = new PTWEntriesWithEcc(ecc, num = PtwL3SectorSize, tagLen = PtwL3TagLen, level = 2, hasPerm = true)
1467196f5a2SLemover
1476d5ddbceSLemover  // TODO: four caches make the codes dirty, think about how to deal with it
1486d5ddbceSLemover
1497797f035SbugGenerator  val sfence_dup = io.sfence_dup
1506d5ddbceSLemover  val refill = io.refill.bits
1517797f035SbugGenerator  val refill_prefetch_dup = io.refill.bits.req_info_dup.map(a => from_pre(a.source))
152d0de7e4aSpeixiaokun  val flush_dup = sfence_dup.zip(io.csr_dup).map(f => f._1.valid || f._2.satp.changed || f._2.vsatp.changed || f._2.hgatp.changed)
1537797f035SbugGenerator  val flush = flush_dup(0)
1546d5ddbceSLemover
1556d5ddbceSLemover  // when refill, refuce to accept new req
1565854c1edSLemover  val rwHarzad = if (sramSinglePort) io.refill.valid else false.B
1573889e11eSLemover
1583889e11eSLemover  // handle hand signal and req_info
1596c4dcc2dSLemover  // TODO: replace with FlushableQueue
1606c4dcc2dSLemover  val stageReq = Wire(Decoupled(new PtwCacheReq()))         // enq stage & read page cache valid
1616c4dcc2dSLemover  val stageDelay = Wire(Vec(2, Decoupled(new PtwCacheReq()))) // page cache resp
1626c4dcc2dSLemover  val stageCheck = Wire(Vec(2, Decoupled(new PtwCacheReq()))) // check hit & check ecc
1636c4dcc2dSLemover  val stageResp = Wire(Decoupled(new PtwCacheReq()))         // deq stage
1647797f035SbugGenerator
1657797f035SbugGenerator  val stageDelay_valid_1cycle = OneCycleValid(stageReq.fire, flush)      // catch ram data
1667797f035SbugGenerator  val stageCheck_valid_1cycle = OneCycleValid(stageDelay(1).fire, flush) // replace & perf counter
1677797f035SbugGenerator  val stageResp_valid_1cycle_dup = Wire(Vec(2, Bool()))
1687797f035SbugGenerator  stageResp_valid_1cycle_dup.map(_ := OneCycleValid(stageCheck(1).fire, flush))  // ecc flush
1697797f035SbugGenerator
1706c4dcc2dSLemover  stageReq <> io.req
1716c4dcc2dSLemover  PipelineConnect(stageReq, stageDelay(0), stageDelay(1).ready, flush, rwHarzad)
1727797f035SbugGenerator  InsideStageConnect(stageDelay(0), stageDelay(1), stageDelay_valid_1cycle)
1736c4dcc2dSLemover  PipelineConnect(stageDelay(1), stageCheck(0), stageCheck(1).ready, flush)
1747797f035SbugGenerator  InsideStageConnect(stageCheck(0), stageCheck(1), stageCheck_valid_1cycle)
1756c4dcc2dSLemover  PipelineConnect(stageCheck(1), stageResp, io.resp.ready, flush)
1766c4dcc2dSLemover  stageResp.ready := !stageResp.valid || io.resp.ready
1776d5ddbceSLemover
1786d5ddbceSLemover  // l1: level 0 non-leaf pte
1795854c1edSLemover  val l1 = Reg(Vec(l2tlbParams.l1Size, new PtwEntry(tagLen = PtwL1TagLen)))
1805854c1edSLemover  val l1v = RegInit(0.U(l2tlbParams.l1Size.W))
1815854c1edSLemover  val l1g = Reg(UInt(l2tlbParams.l1Size.W))
1821dd3e32dSHaoyuan Feng  val l1asids = l1.map(_.asid)
183d0de7e4aSpeixiaokun  val l1vmids = l1.map(_.vmid)
184d61cd5eeSpeixiaokun  val l1h = Reg(Vec(l2tlbParams.l1Size, UInt(2.W))) // 0 bit: s2xlate, 1 bit: stage 1 or stage 2
1856d5ddbceSLemover
1866d5ddbceSLemover  // l2: level 1 non-leaf pte
1876d5ddbceSLemover  val l2 = Module(new SRAMTemplate(
1887196f5a2SLemover    l2EntryType,
1895854c1edSLemover    set = l2tlbParams.l2nSets,
1905854c1edSLemover    way = l2tlbParams.l2nWays,
1915854c1edSLemover    singlePort = sramSinglePort
1926d5ddbceSLemover  ))
1935854c1edSLemover  val l2v = RegInit(0.U((l2tlbParams.l2nSets * l2tlbParams.l2nWays).W))
1945854c1edSLemover  val l2g = Reg(UInt((l2tlbParams.l2nSets * l2tlbParams.l2nWays).W))
195d0de7e4aSpeixiaokun  val l2h = Reg(Vec(l2tlbParams.l2nSets, Vec(l2tlbParams.l2nWays, UInt(2.W))))
1966d5ddbceSLemover  def getl2vSet(vpn: UInt) = {
1975854c1edSLemover    require(log2Up(l2tlbParams.l2nWays) == log2Down(l2tlbParams.l2nWays))
1986d5ddbceSLemover    val set = genPtwL2SetIdx(vpn)
1995854c1edSLemover    require(set.getWidth == log2Up(l2tlbParams.l2nSets))
2005854c1edSLemover    val l2vVec = l2v.asTypeOf(Vec(l2tlbParams.l2nSets, UInt(l2tlbParams.l2nWays.W)))
2016d5ddbceSLemover    l2vVec(set)
2026d5ddbceSLemover  }
203d0de7e4aSpeixiaokun  def getl2hSet(vpn: UInt) = {
20445f497a4Shappy-lx    require(log2Up(l2tlbParams.l2nWays) == log2Down(l2tlbParams.l2nWays))
20545f497a4Shappy-lx    val set = genPtwL2SetIdx(vpn)
20645f497a4Shappy-lx    require(set.getWidth == log2Up(l2tlbParams.l2nSets))
207d0de7e4aSpeixiaokun    l2h(set)
20845f497a4Shappy-lx  }
2096d5ddbceSLemover
210d0de7e4aSpeixiaokun
211d0de7e4aSpeixiaokun
2126d5ddbceSLemover  // l3: level 2 leaf pte of 4KB pages
2136d5ddbceSLemover  val l3 = Module(new SRAMTemplate(
2147196f5a2SLemover    l3EntryType,
2155854c1edSLemover    set = l2tlbParams.l3nSets,
2165854c1edSLemover    way = l2tlbParams.l3nWays,
2175854c1edSLemover    singlePort = sramSinglePort
2186d5ddbceSLemover  ))
2195854c1edSLemover  val l3v = RegInit(0.U((l2tlbParams.l3nSets * l2tlbParams.l3nWays).W))
2205854c1edSLemover  val l3g = Reg(UInt((l2tlbParams.l3nSets * l2tlbParams.l3nWays).W))
221d0de7e4aSpeixiaokun  val l3h = Reg(Vec(l2tlbParams.l3nSets, Vec(l2tlbParams.l3nWays, UInt(2.W))))
2226d5ddbceSLemover  def getl3vSet(vpn: UInt) = {
2235854c1edSLemover    require(log2Up(l2tlbParams.l3nWays) == log2Down(l2tlbParams.l3nWays))
2246d5ddbceSLemover    val set = genPtwL3SetIdx(vpn)
2255854c1edSLemover    require(set.getWidth == log2Up(l2tlbParams.l3nSets))
2265854c1edSLemover    val l3vVec = l3v.asTypeOf(Vec(l2tlbParams.l3nSets, UInt(l2tlbParams.l3nWays.W)))
2276d5ddbceSLemover    l3vVec(set)
2286d5ddbceSLemover  }
229d0de7e4aSpeixiaokun  def getl3hSet(vpn: UInt) = {
23045f497a4Shappy-lx    require(log2Up(l2tlbParams.l3nWays) == log2Down(l2tlbParams.l3nWays))
23145f497a4Shappy-lx    val set = genPtwL3SetIdx(vpn)
23245f497a4Shappy-lx    require(set.getWidth == log2Up(l2tlbParams.l3nSets))
233d0de7e4aSpeixiaokun    l3h(set)
23445f497a4Shappy-lx  }
2356d5ddbceSLemover
2366d5ddbceSLemover  // sp: level 0/1 leaf pte of 1GB/2MB super pages
2375854c1edSLemover  val sp = Reg(Vec(l2tlbParams.spSize, new PtwEntry(tagLen = SPTagLen, hasPerm = true, hasLevel = true)))
2385854c1edSLemover  val spv = RegInit(0.U(l2tlbParams.spSize.W))
2395854c1edSLemover  val spg = Reg(UInt(l2tlbParams.spSize.W))
2401dd3e32dSHaoyuan Feng  val spasids = sp.map(_.asid)
241d0de7e4aSpeixiaokun  val spvmids = sp.map(_.vmid)
242d61cd5eeSpeixiaokun  val sph = Reg(Vec(l2tlbParams.spSize, UInt(2.W)))
2436d5ddbceSLemover
2446d5ddbceSLemover  // Access Perf
2455854c1edSLemover  val l1AccessPerf = Wire(Vec(l2tlbParams.l1Size, Bool()))
2465854c1edSLemover  val l2AccessPerf = Wire(Vec(l2tlbParams.l2nWays, Bool()))
2475854c1edSLemover  val l3AccessPerf = Wire(Vec(l2tlbParams.l3nWays, Bool()))
2485854c1edSLemover  val spAccessPerf = Wire(Vec(l2tlbParams.spSize, Bool()))
2496d5ddbceSLemover  l1AccessPerf.map(_ := false.B)
2506d5ddbceSLemover  l2AccessPerf.map(_ := false.B)
2516d5ddbceSLemover  l3AccessPerf.map(_ := false.B)
2526d5ddbceSLemover  spAccessPerf.map(_ := false.B)
2536d5ddbceSLemover
2543889e11eSLemover
2551f4a7c0cSLemover
25682978df9Speixiaokun  def vpn_match(vpn1: UInt, vpn2: UInt, level: Int) = {
25782978df9Speixiaokun    (vpn1(vpnLen-1, vpnnLen*(2-level)+3) === vpn2(vpnLen-1, vpnnLen*(2-level)+3))
2581f4a7c0cSLemover  }
2591f4a7c0cSLemover  // NOTE: not actually bypassed, just check if hit, re-access the page cache
260d0de7e4aSpeixiaokun  def refill_bypass(vpn: UInt, level: Int, h_search: UInt) = {
261980ddf4cSpeixiaokun    val change_h = MuxLookup(h_search, noS2xlate, Seq(
262980ddf4cSpeixiaokun      allStage -> onlyStage1,
263980ddf4cSpeixiaokun      onlyStage1 -> onlyStage1,
264980ddf4cSpeixiaokun      onlyStage2 -> onlyStage2
265980ddf4cSpeixiaokun    ))
266d0de7e4aSpeixiaokun    val refill_vpn = io.refill.bits.req_info_dup(0).vpn
267980ddf4cSpeixiaokun    io.refill.valid && (level.U === io.refill.bits.level_dup(0)) && vpn_match(refill_vpn, vpn, level) && change_h === io.refill.bits.req_info_dup(0).s2xlate
2681f4a7c0cSLemover  }
2691f4a7c0cSLemover
27082978df9Speixiaokun  val vpn_search = stageReq.bits.req_info.vpn
27109280d15Speixiaokun  val h_search = MuxLookup(stageReq.bits.req_info.s2xlate, noS2xlate, Seq(
27209280d15Speixiaokun    allStage -> onlyStage1,
27309280d15Speixiaokun    onlyStage1 -> onlyStage1,
27409280d15Speixiaokun    onlyStage2 -> onlyStage2
27509280d15Speixiaokun  ))
2766d5ddbceSLemover  // l1
2775854c1edSLemover  val ptwl1replace = ReplacementPolicy.fromString(l2tlbParams.l1Replacer, l2tlbParams.l1Size)
278bc063562SLemover  val (l1Hit, l1HitPPN, l1Pre) = {
279d0de7e4aSpeixiaokun    val hitVecT = l1.zipWithIndex.map {
28082978df9Speixiaokun      case (e, i) => (e.hit(vpn_search, io.csr_dup(0).satp.asid, io.csr_dup(0).hgatp.asid, s2xlate = h_search =/= noS2xlate)
281d0de7e4aSpeixiaokun        && l1v(i) && h_search === l1h(i))
282d0de7e4aSpeixiaokun    }
2836c4dcc2dSLemover    val hitVec = hitVecT.map(RegEnable(_, stageReq.fire))
2841f4a7c0cSLemover
2851f4a7c0cSLemover    // stageDelay, but check for l1
2869c503409SLemover    val hitPPN = DataHoldBypass(ParallelPriorityMux(hitVec zip l1.map(_.ppn)), stageDelay_valid_1cycle)
2879c503409SLemover    val hitPre = DataHoldBypass(ParallelPriorityMux(hitVec zip l1.map(_.prefetch)), stageDelay_valid_1cycle)
2881f4a7c0cSLemover    val hit = DataHoldBypass(ParallelOR(hitVec), stageDelay_valid_1cycle)
2896d5ddbceSLemover
2906c4dcc2dSLemover    when (hit && stageDelay_valid_1cycle) { ptwl1replace.access(OHToUInt(hitVec)) }
2916d5ddbceSLemover
2926c4dcc2dSLemover    l1AccessPerf.zip(hitVec).map{ case (l, h) => l := h && stageDelay_valid_1cycle}
2935854c1edSLemover    for (i <- 0 until l2tlbParams.l1Size) {
294d61cd5eeSpeixiaokun      XSDebug(stageReq.fire, p"[l1] l1(${i.U}) ${l1(i)} hit:${l1(i).hit(vpn_search, Mux(h_search =/= noS2xlate, io.csr_dup(0).vsatp.asid, io.csr_dup(0).satp.asid), io.csr_dup(0).hgatp.asid, s2xlate = h_search =/= noS2xlate)}\n")
2956d5ddbceSLemover    }
2966c4dcc2dSLemover    XSDebug(stageReq.fire, p"[l1] l1v:${Binary(l1v)} hitVecT:${Binary(VecInit(hitVecT).asUInt)}\n")
2976c4dcc2dSLemover    XSDebug(stageDelay(0).valid, p"[l1] l1Hit:${hit} l1HitPPN:0x${Hexadecimal(hitPPN)} hitVec:${VecInit(hitVec).asUInt}\n")
2986d5ddbceSLemover
2996d5ddbceSLemover    VecInit(hitVecT).suggestName(s"l1_hitVecT")
3006d5ddbceSLemover    VecInit(hitVec).suggestName(s"l1_hitVec")
3016d5ddbceSLemover
3026c4dcc2dSLemover    // synchronize with other entries with RegEnable
3036c4dcc2dSLemover    (RegEnable(hit, stageDelay(1).fire),
3046c4dcc2dSLemover     RegEnable(hitPPN, stageDelay(1).fire),
3056c4dcc2dSLemover     RegEnable(hitPre, stageDelay(1).fire))
3066d5ddbceSLemover  }
3076d5ddbceSLemover
3086d5ddbceSLemover  // l2
3095854c1edSLemover  val ptwl2replace = ReplacementPolicy.fromString(l2tlbParams.l2Replacer,l2tlbParams.l2nWays,l2tlbParams.l2nSets)
310bc063562SLemover  val (l2Hit, l2HitPPN, l2Pre, l2eccError) = {
311d0de7e4aSpeixiaokun    val ridx = genPtwL2SetIdx(vpn_search)
3126c4dcc2dSLemover    l2.io.r.req.valid := stageReq.fire
3136d5ddbceSLemover    l2.io.r.req.bits.apply(setIdx = ridx)
314d0de7e4aSpeixiaokun    val vVec_req = getl2vSet(vpn_search)
315d0de7e4aSpeixiaokun    val hVec_req = getl2hSet(vpn_search)
3166c4dcc2dSLemover
3176c4dcc2dSLemover    // delay one cycle after sram read
31882978df9Speixiaokun    val delay_vpn = stageDelay(0).bits.req_info.vpn
319980ddf4cSpeixiaokun    val delay_h = MuxLookup(stageDelay(0).bits.req_info.s2xlate, noS2xlate, Seq(
320980ddf4cSpeixiaokun      allStage -> onlyStage1,
321980ddf4cSpeixiaokun      onlyStage1 -> onlyStage1,
322980ddf4cSpeixiaokun      onlyStage2 -> onlyStage2
323980ddf4cSpeixiaokun    ))
3246c4dcc2dSLemover    val data_resp = DataHoldBypass(l2.io.r.resp.data, stageDelay_valid_1cycle)
3257797f035SbugGenerator    val vVec_delay = RegEnable(vVec_req, stageReq.fire)
326d0de7e4aSpeixiaokun    val hVec_delay = RegEnable(hVec_req, stageReq.fire)
327d0de7e4aSpeixiaokun    val hitVec_delay = VecInit(data_resp.zip(vVec_delay.asBools).zip(hVec_delay).map { case ((wayData, v), h) =>
32882978df9Speixiaokun      wayData.entries.hit(delay_vpn, io.csr_dup(1).satp.asid, io.csr_dup(1).hgatp.asid, s2xlate = delay_h =/= noS2xlate) && v && (delay_h === h)})
3296c4dcc2dSLemover
3306c4dcc2dSLemover    // check hit and ecc
33182978df9Speixiaokun    val check_vpn = stageCheck(0).bits.req_info.vpn
3326c4dcc2dSLemover    val ramDatas = RegEnable(data_resp, stageDelay(1).fire)
333935edac4STang Haojin    val vVec = RegEnable(vVec_delay, stageDelay(1).fire).asBools
3346c4dcc2dSLemover
3357797f035SbugGenerator    val hitVec = RegEnable(hitVec_delay, stageDelay(1).fire)
3367196f5a2SLemover    val hitWayEntry = ParallelPriorityMux(hitVec zip ramDatas)
3377196f5a2SLemover    val hitWayData = hitWayEntry.entries
3386c4dcc2dSLemover    val hit = ParallelOR(hitVec)
339f3034303SHaoyuan Feng    val hitWay = ParallelPriorityMux(hitVec zip (0 until l2tlbParams.l2nWays).map(_.U(log2Up(l2tlbParams.l2nWays).W)))
3403889e11eSLemover    val eccError = hitWayEntry.decode()
3417196f5a2SLemover
3426d5ddbceSLemover    ridx.suggestName(s"l2_ridx")
3436d5ddbceSLemover    ramDatas.suggestName(s"l2_ramDatas")
3446d5ddbceSLemover    hitVec.suggestName(s"l2_hitVec")
3456d5ddbceSLemover    hitWayData.suggestName(s"l2_hitWayData")
3466d5ddbceSLemover    hitWay.suggestName(s"l2_hitWay")
3476d5ddbceSLemover
3486c4dcc2dSLemover    when (hit && stageCheck_valid_1cycle) { ptwl2replace.access(genPtwL2SetIdx(check_vpn), hitWay) }
3496d5ddbceSLemover
3506c4dcc2dSLemover    l2AccessPerf.zip(hitVec).map{ case (l, h) => l := h && stageCheck_valid_1cycle }
3516c4dcc2dSLemover    XSDebug(stageDelay_valid_1cycle, p"[l2] ridx:0x${Hexadecimal(ridx)}\n")
3525854c1edSLemover    for (i <- 0 until l2tlbParams.l2nWays) {
3536c4dcc2dSLemover      XSDebug(stageCheck_valid_1cycle, p"[l2] ramDatas(${i.U}) ${ramDatas(i)}  l2v:${vVec(i)}  hit:${hit}\n")
3546d5ddbceSLemover    }
3556c4dcc2dSLemover    XSDebug(stageCheck_valid_1cycle, p"[l2] l2Hit:${hit} l2HitPPN:0x${Hexadecimal(hitWayData.ppns(genPtwL2SectorIdx(check_vpn)))} hitVec:${Binary(hitVec.asUInt)} hitWay:${hitWay} vidx:${vVec}\n")
3566d5ddbceSLemover
3576c4dcc2dSLemover    (hit, hitWayData.ppns(genPtwL2SectorIdx(check_vpn)), hitWayData.prefetch, eccError)
3586d5ddbceSLemover  }
3596d5ddbceSLemover
3606d5ddbceSLemover  // l3
3615854c1edSLemover  val ptwl3replace = ReplacementPolicy.fromString(l2tlbParams.l3Replacer,l2tlbParams.l3nWays,l2tlbParams.l3nSets)
362bc063562SLemover  val (l3Hit, l3HitData, l3Pre, l3eccError) = {
363d0de7e4aSpeixiaokun    val ridx = genPtwL3SetIdx(vpn_search)
3646c4dcc2dSLemover    l3.io.r.req.valid := stageReq.fire
3656d5ddbceSLemover    l3.io.r.req.bits.apply(setIdx = ridx)
366d0de7e4aSpeixiaokun    val vVec_req = getl3vSet(vpn_search)
367d0de7e4aSpeixiaokun    val hVec_req = getl3hSet(vpn_search)
3686c4dcc2dSLemover
3696c4dcc2dSLemover    // delay one cycle after sram read
37082978df9Speixiaokun    val delay_vpn = stageDelay(0).bits.req_info.vpn
371980ddf4cSpeixiaokun    val delay_h = MuxLookup(stageDelay(0).bits.req_info.s2xlate, noS2xlate, Seq(
372980ddf4cSpeixiaokun      allStage -> onlyStage1,
373980ddf4cSpeixiaokun      onlyStage1 -> onlyStage1,
374980ddf4cSpeixiaokun      onlyStage2 -> onlyStage2
375980ddf4cSpeixiaokun    ))
3766c4dcc2dSLemover    val data_resp = DataHoldBypass(l3.io.r.resp.data, stageDelay_valid_1cycle)
3777797f035SbugGenerator    val vVec_delay = RegEnable(vVec_req, stageReq.fire)
378d0de7e4aSpeixiaokun    val hVec_delay = RegEnable(hVec_req, stageReq.fire)
379d0de7e4aSpeixiaokun    val hitVec_delay = VecInit(data_resp.zip(vVec_delay.asBools).zip(hVec_delay).map { case ((wayData, v), h) =>
38082978df9Speixiaokun      wayData.entries.hit(delay_vpn, io.csr_dup(2).satp.asid, io.csr_dup(2).hgatp.asid, s2xlate = delay_h =/= noS2xlate) && v && (delay_h === h)})
3816c4dcc2dSLemover
3826c4dcc2dSLemover    // check hit and ecc
38382978df9Speixiaokun    val check_vpn = stageCheck(0).bits.req_info.vpn
3846c4dcc2dSLemover    val ramDatas = RegEnable(data_resp, stageDelay(1).fire)
385935edac4STang Haojin    val vVec = RegEnable(vVec_delay, stageDelay(1).fire).asBools
3866c4dcc2dSLemover
3877797f035SbugGenerator    val hitVec = RegEnable(hitVec_delay, stageDelay(1).fire)
3887196f5a2SLemover    val hitWayEntry = ParallelPriorityMux(hitVec zip ramDatas)
3897196f5a2SLemover    val hitWayData = hitWayEntry.entries
3907196f5a2SLemover    val hitWayEcc = hitWayEntry.ecc
3916c4dcc2dSLemover    val hit = ParallelOR(hitVec)
392f3034303SHaoyuan Feng    val hitWay = ParallelPriorityMux(hitVec zip (0 until l2tlbParams.l3nWays).map(_.U(log2Up(l2tlbParams.l3nWays).W)))
3933889e11eSLemover    val eccError = hitWayEntry.decode()
3946d5ddbceSLemover
3956c4dcc2dSLemover    when (hit && stageCheck_valid_1cycle) { ptwl3replace.access(genPtwL3SetIdx(check_vpn), hitWay) }
3967196f5a2SLemover
3976c4dcc2dSLemover    l3AccessPerf.zip(hitVec).map{ case (l, h) => l := h && stageCheck_valid_1cycle }
3986c4dcc2dSLemover    XSDebug(stageReq.fire, p"[l3] ridx:0x${Hexadecimal(ridx)}\n")
3995854c1edSLemover    for (i <- 0 until l2tlbParams.l3nWays) {
4006c4dcc2dSLemover      XSDebug(stageCheck_valid_1cycle, p"[l3] ramDatas(${i.U}) ${ramDatas(i)}  l3v:${vVec(i)}  hit:${hitVec(i)}\n")
4016d5ddbceSLemover    }
4026c4dcc2dSLemover    XSDebug(stageCheck_valid_1cycle, p"[l3] l3Hit:${hit} l3HitData:${hitWayData} hitVec:${Binary(hitVec.asUInt)} hitWay:${hitWay} v:${vVec}\n")
4036d5ddbceSLemover
4046d5ddbceSLemover    ridx.suggestName(s"l3_ridx")
4056d5ddbceSLemover    ramDatas.suggestName(s"l3_ramDatas")
4066d5ddbceSLemover    hitVec.suggestName(s"l3_hitVec")
4076d5ddbceSLemover    hitWay.suggestName(s"l3_hitWay")
4086d5ddbceSLemover
4093889e11eSLemover    (hit, hitWayData, hitWayData.prefetch, eccError)
4106d5ddbceSLemover  }
41163632028SHaoyuan Feng  val l3HitPPN = l3HitData.ppns
41263632028SHaoyuan Feng  val l3HitPerm = l3HitData.perms.getOrElse(0.U.asTypeOf(Vec(PtwL3SectorSize, new PtePermBundle)))
41363632028SHaoyuan Feng  val l3HitValid = l3HitData.vs
4146d5ddbceSLemover
4156d5ddbceSLemover  // super page
4165854c1edSLemover  val spreplace = ReplacementPolicy.fromString(l2tlbParams.spReplacer, l2tlbParams.spSize)
4178d8ac704SLemover  val (spHit, spHitData, spPre, spValid) = {
41882978df9Speixiaokun    val hitVecT = sp.zipWithIndex.map { case (e, i) => e.hit(vpn_search, Mux(h_search =/= noS2xlate, io.csr_dup(0).vsatp.asid, io.csr_dup(0).satp.asid), io.csr_dup(0).hgatp.asid, s2xlate = h_search =/= noS2xlate) && spv(i) && (sph(i) === h_search) }
4196c4dcc2dSLemover    val hitVec = hitVecT.map(RegEnable(_, stageReq.fire))
4206d5ddbceSLemover    val hitData = ParallelPriorityMux(hitVec zip sp)
4216c4dcc2dSLemover    val hit = ParallelOR(hitVec)
4226d5ddbceSLemover
4236c4dcc2dSLemover    when (hit && stageDelay_valid_1cycle) { spreplace.access(OHToUInt(hitVec)) }
4246d5ddbceSLemover
4256c4dcc2dSLemover    spAccessPerf.zip(hitVec).map{ case (s, h) => s := h && stageDelay_valid_1cycle }
4265854c1edSLemover    for (i <- 0 until l2tlbParams.spSize) {
42782978df9Speixiaokun      XSDebug(stageReq.fire, p"[sp] sp(${i.U}) ${sp(i)} hit:${sp(i).hit(vpn_search, Mux(h_search =/= noS2xlate, io.csr_dup(0).vsatp.asid, io.csr_dup(0).satp.asid), io.csr_dup(0).hgatp.asid, s2xlate = h_search =/= noS2xlate)} spv:${spv(i)}\n")
4286d5ddbceSLemover    }
4296c4dcc2dSLemover    XSDebug(stageDelay_valid_1cycle, p"[sp] spHit:${hit} spHitData:${hitData} hitVec:${Binary(VecInit(hitVec).asUInt)}\n")
4306d5ddbceSLemover
4316d5ddbceSLemover    VecInit(hitVecT).suggestName(s"sp_hitVecT")
4326d5ddbceSLemover    VecInit(hitVec).suggestName(s"sp_hitVec")
4336d5ddbceSLemover
4346c4dcc2dSLemover    (RegEnable(hit, stageDelay(1).fire),
4356c4dcc2dSLemover     RegEnable(hitData, stageDelay(1).fire),
4366c4dcc2dSLemover     RegEnable(hitData.prefetch, stageDelay(1).fire),
437935edac4STang Haojin     RegEnable(hitData.v, stageDelay(1).fire))
4386d5ddbceSLemover  }
4396d5ddbceSLemover  val spHitPerm = spHitData.perm.getOrElse(0.U.asTypeOf(new PtePermBundle))
4406d5ddbceSLemover  val spHitLevel = spHitData.level.getOrElse(0.U)
4416d5ddbceSLemover
4426c4dcc2dSLemover  val check_res = Wire(new PageCacheRespBundle)
4436c4dcc2dSLemover  check_res.l1.apply(l1Hit, l1Pre, l1HitPPN)
4446c4dcc2dSLemover  check_res.l2.apply(l2Hit, l2Pre, l2HitPPN, ecc = l2eccError)
4451f4a7c0cSLemover  check_res.l3.apply(l3Hit, l3Pre, l3HitPPN, l3HitPerm, l3eccError, valid = l3HitValid)
4466c4dcc2dSLemover  check_res.sp.apply(spHit, spPre, spHitData.ppn, spHitPerm, false.B, spHitLevel, spValid)
4476d5ddbceSLemover
4486c4dcc2dSLemover  val resp_res = Reg(new PageCacheRespBundle)
4496c4dcc2dSLemover  when (stageCheck(1).fire) { resp_res := check_res }
4503889e11eSLemover
4511f4a7c0cSLemover  // stageResp bypass
4521f4a7c0cSLemover  val bypassed = Wire(Vec(3, Bool()))
4531f4a7c0cSLemover  bypassed.indices.foreach(i =>
4541f4a7c0cSLemover    bypassed(i) := stageResp.bits.bypassed(i) ||
45509280d15Speixiaokun      ValidHoldBypass(refill_bypass(vpn_search, i, stageResp.bits.req_info.s2xlate),
4561f4a7c0cSLemover        OneCycleValid(stageCheck(1).fire, false.B) || io.refill.valid)
4571f4a7c0cSLemover  )
4581f4a7c0cSLemover
45930104977Speixiaokun  val isAllStage = stageResp.bits.req_info.s2xlate === allStage
460c0991f6aSpeixiaokun  val isOnlyStage2 = stageResp.bits.req_info.s2xlate === onlyStage2
461980ddf4cSpeixiaokun  val stage1Hit = (resp_res.l3.hit || resp_res.sp.hit) && isAllStage
4626c4dcc2dSLemover  io.resp.bits.req_info   := stageResp.bits.req_info
4636c4dcc2dSLemover  io.resp.bits.isFirst  := stageResp.bits.isFirst
46430104977Speixiaokun  io.resp.bits.hit      := (resp_res.l3.hit || resp_res.sp.hit) && !isAllStage
465c0991f6aSpeixiaokun  io.resp.bits.bypassed := (bypassed(2) || (bypassed(1) && !resp_res.l2.hit) || (bypassed(0) && !resp_res.l1.hit)) && !isAllStage && !isOnlyStage2
4666c4dcc2dSLemover  io.resp.bits.prefetch := resp_res.l3.pre && resp_res.l3.hit || resp_res.sp.pre && resp_res.sp.hit
467c0991f6aSpeixiaokun  io.resp.bits.toFsm.l1Hit := resp_res.l1.hit && !stage1Hit && !isOnlyStage2
468c0991f6aSpeixiaokun  io.resp.bits.toFsm.l2Hit := resp_res.l2.hit && !stage1Hit && !isOnlyStage2
4696c4dcc2dSLemover  io.resp.bits.toFsm.ppn   := Mux(resp_res.l2.hit, resp_res.l2.ppn, resp_res.l1.ppn)
470980ddf4cSpeixiaokun  io.resp.bits.toFsm.stage1Hit := stage1Hit
471d0de7e4aSpeixiaokun
472d0de7e4aSpeixiaokun  io.resp.bits.isHptw := stageResp.bits.isHptw
473d0de7e4aSpeixiaokun  io.resp.bits.toHptw.id := stageResp.bits.hptwId
474d0de7e4aSpeixiaokun  io.resp.bits.toHptw.l1Hit := resp_res.l1.hit
475d0de7e4aSpeixiaokun  io.resp.bits.toHptw.l2Hit := resp_res.l2.hit
476d0de7e4aSpeixiaokun  io.resp.bits.toHptw.ppn := Mux(resp_res.l2.hit, resp_res.l2.ppn, resp_res.l1.ppn)
47782978df9Speixiaokun  val idx = stageResp.bits.req_info.vpn(2, 0)
47882978df9Speixiaokun  io.resp.bits.toHptw.resp.entry.tag := stageResp.bits.req_info.vpn
479eb4bf3f2Speixiaokun  io.resp.bits.toHptw.resp.entry.asid := DontCare
480d61cd5eeSpeixiaokun  io.resp.bits.toHptw.resp.entry.vmid.map(_ := io.csr_dup(0).hgatp.asid)
481d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.entry.level.map(_ := Mux(resp_res.l3.hit, 2.U, resp_res.sp.level))
482d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.entry.prefetch := from_pre(stageResp.bits.req_info.source)
483d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.entry.ppn := Mux(resp_res.l3.hit, resp_res.l3.ppn(idx), resp_res.sp.ppn)
484d61cd5eeSpeixiaokun  io.resp.bits.toHptw.resp.entry.perm.map(_ := Mux(resp_res.l3.hit, resp_res.l3.perm(idx), resp_res.sp.perm))
485d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.entry.v := Mux(resp_res.l3.hit, resp_res.l3.v(idx), resp_res.sp.v)
486d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.gpf := !io.resp.bits.toHptw.resp.entry.v
487d0de7e4aSpeixiaokun  io.resp.bits.toHptw.resp.gaf := false.B
488d0de7e4aSpeixiaokun
48982978df9Speixiaokun  io.resp.bits.toTlb.entry.map(_.tag := stageResp.bits.req_info.vpn(vpnLen - 1, 3))
490eb4bf3f2Speixiaokun  io.resp.bits.toTlb.entry.map(_.asid := Mux(stageResp.bits.req_info.hasS2xlate(), io.csr_dup(0).vsatp.asid, io.csr_dup(0).satp.asid)) // DontCare
491eb4bf3f2Speixiaokun  io.resp.bits.toTlb.entry.map(_.vmid.map(_ := io.csr_dup(0).hgatp.asid))
49263632028SHaoyuan Feng  io.resp.bits.toTlb.entry.map(_.level.map(_ := Mux(resp_res.l3.hit, 2.U, resp_res.sp.level)))
49363632028SHaoyuan Feng  io.resp.bits.toTlb.entry.map(_.prefetch := from_pre(stageResp.bits.req_info.source))
49463632028SHaoyuan Feng  for (i <- 0 until tlbcontiguous) {
49563632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).ppn := Mux(resp_res.l3.hit, resp_res.l3.ppn(i)(ppnLen - 1, sectortlbwidth), resp_res.sp.ppn(ppnLen - 1, sectortlbwidth))
49663632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).ppn_low := Mux(resp_res.l3.hit, resp_res.l3.ppn(i)(sectortlbwidth - 1, 0), resp_res.sp.ppn(sectortlbwidth - 1, 0))
49763632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).perm.map(_ := Mux(resp_res.l3.hit, resp_res.l3.perm(i), resp_res.sp.perm))
49863632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).v := Mux(resp_res.l3.hit, resp_res.l3.v(i), resp_res.sp.v)
49963632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).pf := !io.resp.bits.toTlb.entry(i).v
50063632028SHaoyuan Feng    io.resp.bits.toTlb.entry(i).af := false.B
50163632028SHaoyuan Feng  }
50263632028SHaoyuan Feng  io.resp.bits.toTlb.pteidx := UIntToOH(stageResp.bits.req_info.vpn(2, 0)).asBools
50363632028SHaoyuan Feng  io.resp.bits.toTlb.not_super := Mux(resp_res.l3.hit, true.B, false.B)
5046c4dcc2dSLemover  io.resp.valid := stageResp.valid
5056c4dcc2dSLemover  XSError(stageResp.valid && resp_res.l3.hit && resp_res.sp.hit, "normal page and super page both hit")
5061f4a7c0cSLemover  XSError(stageResp.valid && io.resp.bits.hit && bypassed(2), "page cache, bypassed but hit")
5076d5ddbceSLemover
5086d5ddbceSLemover  // refill Perf
5095854c1edSLemover  val l1RefillPerf = Wire(Vec(l2tlbParams.l1Size, Bool()))
5105854c1edSLemover  val l2RefillPerf = Wire(Vec(l2tlbParams.l2nWays, Bool()))
5115854c1edSLemover  val l3RefillPerf = Wire(Vec(l2tlbParams.l3nWays, Bool()))
5125854c1edSLemover  val spRefillPerf = Wire(Vec(l2tlbParams.spSize, Bool()))
5136d5ddbceSLemover  l1RefillPerf.map(_ := false.B)
5146d5ddbceSLemover  l2RefillPerf.map(_ := false.B)
5156d5ddbceSLemover  l3RefillPerf.map(_ := false.B)
5166d5ddbceSLemover  spRefillPerf.map(_ := false.B)
5176d5ddbceSLemover
5186d5ddbceSLemover  // refill
5196d5ddbceSLemover  l2.io.w.req <> DontCare
5206d5ddbceSLemover  l3.io.w.req <> DontCare
5216d5ddbceSLemover  l2.io.w.req.valid := false.B
5226d5ddbceSLemover  l3.io.w.req.valid := false.B
5236d5ddbceSLemover
5246d5ddbceSLemover  val memRdata = refill.ptes
5255854c1edSLemover  val memPtes = (0 until (l2tlbParams.blockBytes/(XLEN/8))).map(i => memRdata((i+1)*XLEN-1, i*XLEN).asTypeOf(new PteBundle))
5267797f035SbugGenerator  val memSelData = io.refill.bits.sel_pte_dup
5277797f035SbugGenerator  val memPte = memSelData.map(a => a.asTypeOf(new PteBundle))
528b848eea5SLemover
5296d5ddbceSLemover  // TODO: handle sfenceLatch outsize
5300d94d540SHaoyuan Feng  when (!flush_dup(0) && refill.levelOH.l1 && !memPte(0).isLeaf() && !memPte(0).isPf(refill.level_dup(0)) && !memPte(0).isAf()) {
5315854c1edSLemover    // val refillIdx = LFSR64()(log2Up(l2tlbParams.l1Size)-1,0) // TODO: may be LRU
5326d5ddbceSLemover    val refillIdx = replaceWrapper(l1v, ptwl1replace.way)
5336d5ddbceSLemover    refillIdx.suggestName(s"PtwL1RefillIdx")
5346d5ddbceSLemover    val rfOH = UIntToOH(refillIdx)
53545f497a4Shappy-lx    l1(refillIdx).refill(
53682978df9Speixiaokun      refill.req_info_dup(0).vpn,
537980ddf4cSpeixiaokun      Mux(refill.req_info_dup(0).s2xlate =/= noS2xlate, io.csr_dup(0).vsatp.asid, io.csr_dup(0).satp.asid),
538d0de7e4aSpeixiaokun      io.csr_dup(0).hgatp.asid,
5397797f035SbugGenerator      memSelData(0),
54045f497a4Shappy-lx      0.U,
5417797f035SbugGenerator      refill_prefetch_dup(0)
54245f497a4Shappy-lx    )
5436d5ddbceSLemover    ptwl1replace.access(refillIdx)
5446d5ddbceSLemover    l1v := l1v | rfOH
5457797f035SbugGenerator    l1g := (l1g & ~rfOH) | Mux(memPte(0).perm.g, rfOH, 0.U)
546d0de7e4aSpeixiaokun    l1h(refillIdx) := refill.req_info_dup(0).s2xlate
5476d5ddbceSLemover
5485854c1edSLemover    for (i <- 0 until l2tlbParams.l1Size) {
5496d5ddbceSLemover      l1RefillPerf(i) := i.U === refillIdx
5506d5ddbceSLemover    }
5516d5ddbceSLemover
5527797f035SbugGenerator    XSDebug(p"[l1 refill] refillIdx:${refillIdx} refillEntry:${l1(refillIdx).genPtwEntry(refill.req_info_dup(0).vpn, io.csr_dup(0).satp.asid, memSelData(0), 0.U, prefetch = refill_prefetch_dup(0))}\n")
5537797f035SbugGenerator    XSDebug(p"[l1 refill] l1v:${Binary(l1v)}->${Binary(l1v | rfOH)} l1g:${Binary(l1g)}->${Binary((l1g & ~rfOH) | Mux(memPte(0).perm.g, rfOH, 0.U))}\n")
5546d5ddbceSLemover
5556d5ddbceSLemover    refillIdx.suggestName(s"l1_refillIdx")
5566d5ddbceSLemover    rfOH.suggestName(s"l1_rfOH")
5576d5ddbceSLemover  }
5586d5ddbceSLemover
5590d94d540SHaoyuan Feng  when (!flush_dup(1) && refill.levelOH.l2 && !memPte(1).isLeaf() && !memPte(1).isPf(refill.level_dup(1)) && !memPte(1).isAf()) {
5607797f035SbugGenerator    val refillIdx = genPtwL2SetIdx(refill.req_info_dup(1).vpn)
5617797f035SbugGenerator    val victimWay = replaceWrapper(getl2vSet(refill.req_info_dup(1).vpn), ptwl2replace.way(refillIdx))
5626d5ddbceSLemover    val victimWayOH = UIntToOH(victimWay)
5636d5ddbceSLemover    val rfvOH = UIntToOH(Cat(refillIdx, victimWay))
5647196f5a2SLemover    val wdata = Wire(l2EntryType)
5653889e11eSLemover    wdata.gen(
56682978df9Speixiaokun      vpn = refill.req_info_dup(1).vpn,
567cca17e78Speixiaokun      asid = Mux(refill.req_info_dup(1).s2xlate =/= noS2xlate, io.csr_dup(1).vsatp.asid, io.csr_dup(1).satp.asid),
568d0de7e4aSpeixiaokun      vmid = io.csr_dup(1).hgatp.asid,
56945f497a4Shappy-lx      data = memRdata,
57045f497a4Shappy-lx      levelUInt = 1.U,
5717797f035SbugGenerator      refill_prefetch_dup(1)
57245f497a4Shappy-lx    )
5736d5ddbceSLemover    l2.io.w.apply(
5746d5ddbceSLemover      valid = true.B,
5756d5ddbceSLemover      setIdx = refillIdx,
5767196f5a2SLemover      data = wdata,
5776d5ddbceSLemover      waymask = victimWayOH
5786d5ddbceSLemover    )
5796d5ddbceSLemover    ptwl2replace.access(refillIdx, victimWay)
5806d5ddbceSLemover    l2v := l2v | rfvOH
5816d5ddbceSLemover    l2g := l2g & ~rfvOH | Mux(Cat(memPtes.map(_.perm.g)).andR, rfvOH, 0.U)
582980ddf4cSpeixiaokun    l2h(refillIdx)(victimWay) := refill.req_info_dup(1).s2xlate
5836d5ddbceSLemover
5845854c1edSLemover    for (i <- 0 until l2tlbParams.l2nWays) {
5856d5ddbceSLemover      l2RefillPerf(i) := i.U === victimWay
5866d5ddbceSLemover    }
5876d5ddbceSLemover
5886d5ddbceSLemover    XSDebug(p"[l2 refill] refillIdx:0x${Hexadecimal(refillIdx)} victimWay:${victimWay} victimWayOH:${Binary(victimWayOH)} rfvOH(in UInt):${Cat(refillIdx, victimWay)}\n")
58945f497a4Shappy-lx    XSDebug(p"[l2 refill] refilldata:0x${wdata}\n")
5906d5ddbceSLemover    XSDebug(p"[l2 refill] l2v:${Binary(l2v)} -> ${Binary(l2v | rfvOH)}\n")
5916d5ddbceSLemover    XSDebug(p"[l2 refill] l2g:${Binary(l2g)} -> ${Binary(l2g & ~rfvOH | Mux(Cat(memPtes.map(_.perm.g)).andR, rfvOH, 0.U))}\n")
5926d5ddbceSLemover
5936d5ddbceSLemover    refillIdx.suggestName(s"l2_refillIdx")
5946d5ddbceSLemover    victimWay.suggestName(s"l2_victimWay")
5956d5ddbceSLemover    victimWayOH.suggestName(s"l2_victimWayOH")
5966d5ddbceSLemover    rfvOH.suggestName(s"l2_rfvOH")
5976d5ddbceSLemover  }
5986d5ddbceSLemover
5990d94d540SHaoyuan Feng  when (!flush_dup(2) && refill.levelOH.l3 && !memPte(2).isAf()) {
6007797f035SbugGenerator    val refillIdx = genPtwL3SetIdx(refill.req_info_dup(2).vpn)
6017797f035SbugGenerator    val victimWay = replaceWrapper(getl3vSet(refill.req_info_dup(2).vpn), ptwl3replace.way(refillIdx))
6026d5ddbceSLemover    val victimWayOH = UIntToOH(victimWay)
6036d5ddbceSLemover    val rfvOH = UIntToOH(Cat(refillIdx, victimWay))
6047196f5a2SLemover    val wdata = Wire(l3EntryType)
6053889e11eSLemover    wdata.gen(
60682978df9Speixiaokun      vpn =  refill.req_info_dup(2).vpn,
607cca17e78Speixiaokun      asid = Mux(refill.req_info_dup(2).s2xlate =/= noS2xlate, io.csr_dup(2).vsatp.asid, io.csr_dup(2).satp.asid),
608d0de7e4aSpeixiaokun      vmid = io.csr_dup(2).hgatp.asid,
60945f497a4Shappy-lx      data = memRdata,
61045f497a4Shappy-lx      levelUInt = 2.U,
6117797f035SbugGenerator      refill_prefetch_dup(2)
61245f497a4Shappy-lx    )
6136d5ddbceSLemover    l3.io.w.apply(
6146d5ddbceSLemover      valid = true.B,
6156d5ddbceSLemover      setIdx = refillIdx,
6167196f5a2SLemover      data = wdata,
6176d5ddbceSLemover      waymask = victimWayOH
6186d5ddbceSLemover    )
6196d5ddbceSLemover    ptwl3replace.access(refillIdx, victimWay)
6206d5ddbceSLemover    l3v := l3v | rfvOH
6216d5ddbceSLemover    l3g := l3g & ~rfvOH | Mux(Cat(memPtes.map(_.perm.g)).andR, rfvOH, 0.U)
622d0de7e4aSpeixiaokun    l3h(refillIdx)(victimWay) := refill.req_info_dup(2).s2xlate
6236d5ddbceSLemover
6245854c1edSLemover    for (i <- 0 until l2tlbParams.l3nWays) {
6256d5ddbceSLemover      l3RefillPerf(i) := i.U === victimWay
6266d5ddbceSLemover    }
6276d5ddbceSLemover
6286d5ddbceSLemover    XSDebug(p"[l3 refill] refillIdx:0x${Hexadecimal(refillIdx)} victimWay:${victimWay} victimWayOH:${Binary(victimWayOH)} rfvOH(in UInt):${Cat(refillIdx, victimWay)}\n")
62945f497a4Shappy-lx    XSDebug(p"[l3 refill] refilldata:0x${wdata}\n")
6306d5ddbceSLemover    XSDebug(p"[l3 refill] l3v:${Binary(l3v)} -> ${Binary(l3v | rfvOH)}\n")
6316d5ddbceSLemover    XSDebug(p"[l3 refill] l3g:${Binary(l3g)} -> ${Binary(l3g & ~rfvOH | Mux(Cat(memPtes.map(_.perm.g)).andR, rfvOH, 0.U))}\n")
6326d5ddbceSLemover
6336d5ddbceSLemover    refillIdx.suggestName(s"l3_refillIdx")
6346d5ddbceSLemover    victimWay.suggestName(s"l3_victimWay")
6356d5ddbceSLemover    victimWayOH.suggestName(s"l3_victimWayOH")
6366d5ddbceSLemover    rfvOH.suggestName(s"l3_rfvOH")
6376d5ddbceSLemover  }
6387797f035SbugGenerator
6398d8ac704SLemover
6408d8ac704SLemover  // misc entries: super & invalid
6410d94d540SHaoyuan Feng  when (!flush_dup(0) && refill.levelOH.sp && (memPte(0).isLeaf() || memPte(0).isPf(refill.level_dup(0))) && !memPte(0).isAf()) {
6425854c1edSLemover    val refillIdx = spreplace.way// LFSR64()(log2Up(l2tlbParams.spSize)-1,0) // TODO: may be LRU
6436d5ddbceSLemover    val rfOH = UIntToOH(refillIdx)
64445f497a4Shappy-lx    sp(refillIdx).refill(
6457797f035SbugGenerator      refill.req_info_dup(0).vpn,
6467797f035SbugGenerator      io.csr_dup(0).satp.asid,
647d0de7e4aSpeixiaokun      io.csr_dup(0).hgatp.asid,
6487797f035SbugGenerator      memSelData(0),
6497797f035SbugGenerator      refill.level_dup(2),
6507797f035SbugGenerator      refill_prefetch_dup(0),
6517797f035SbugGenerator      !memPte(0).isPf(refill.level_dup(0)),
65245f497a4Shappy-lx    )
6536d5ddbceSLemover    spreplace.access(refillIdx)
6546d5ddbceSLemover    spv := spv | rfOH
6557797f035SbugGenerator    spg := spg & ~rfOH | Mux(memPte(0).perm.g, rfOH, 0.U)
656d0de7e4aSpeixiaokun    sph(refillIdx) := refill.req_info_dup(0).s2xlate
6576d5ddbceSLemover
6585854c1edSLemover    for (i <- 0 until l2tlbParams.spSize) {
6596d5ddbceSLemover      spRefillPerf(i) := i.U === refillIdx
6606d5ddbceSLemover    }
6616d5ddbceSLemover
6627797f035SbugGenerator    XSDebug(p"[sp refill] refillIdx:${refillIdx} refillEntry:${sp(refillIdx).genPtwEntry(refill.req_info_dup(0).vpn, io.csr_dup(0).satp.asid, memSelData(0), refill.level_dup(0), refill_prefetch_dup(0))}\n")
6637797f035SbugGenerator    XSDebug(p"[sp refill] spv:${Binary(spv)}->${Binary(spv | rfOH)} spg:${Binary(spg)}->${Binary(spg & ~rfOH | Mux(memPte(0).perm.g, rfOH, 0.U))}\n")
6646d5ddbceSLemover
6656d5ddbceSLemover    refillIdx.suggestName(s"sp_refillIdx")
6666d5ddbceSLemover    rfOH.suggestName(s"sp_rfOH")
6676d5ddbceSLemover  }
6686d5ddbceSLemover
6697797f035SbugGenerator  val l2eccFlush = resp_res.l2.ecc && stageResp_valid_1cycle_dup(0) // RegNext(l2eccError, init = false.B)
6707797f035SbugGenerator  val l3eccFlush = resp_res.l3.ecc && stageResp_valid_1cycle_dup(1) // RegNext(l3eccError, init = false.B)
6716c4dcc2dSLemover  val eccVpn = stageResp.bits.req_info.vpn
6727196f5a2SLemover
6736c4dcc2dSLemover  XSError(l2eccFlush, "l2tlb.cache.l2 ecc error. Should not happen at sim stage")
6746c4dcc2dSLemover  XSError(l3eccFlush, "l2tlb.cache.l3 ecc error. Should not happen at sim stage")
6757196f5a2SLemover  when (l2eccFlush) {
6767196f5a2SLemover    val flushSetIdxOH = UIntToOH(genPtwL2SetIdx(eccVpn))
6777196f5a2SLemover    val flushMask = VecInit(flushSetIdxOH.asBools.map { a => Fill(l2tlbParams.l2nWays, a.asUInt) }).asUInt
6787196f5a2SLemover    l2v := l2v & ~flushMask
6797196f5a2SLemover    l2g := l2g & ~flushMask
6807196f5a2SLemover  }
6817196f5a2SLemover
6827196f5a2SLemover  when (l3eccFlush) {
6837196f5a2SLemover    val flushSetIdxOH = UIntToOH(genPtwL3SetIdx(eccVpn))
6847196f5a2SLemover    val flushMask = VecInit(flushSetIdxOH.asBools.map { a => Fill(l2tlbParams.l3nWays, a.asUInt) }).asUInt
6857196f5a2SLemover    l3v := l3v & ~flushMask
6867196f5a2SLemover    l3g := l3g & ~flushMask
6877196f5a2SLemover  }
6887196f5a2SLemover
689*a1d4b4bfSpeixiaokun  // sfence for l3
690d0de7e4aSpeixiaokun  val sfence_valid_l3 = sfence_dup(3).valid && !sfence_dup(3).bits.hg && !sfence_dup(3).bits.hv
691*a1d4b4bfSpeixiaokun  when (sfence_valid_l3) {
692*a1d4b4bfSpeixiaokun    val l3hhit = VecInit(l3h.flatMap(_.map(_ === onlyStage1 && io.csr_dup(0).priv.virt || !io.csr_dup(0).priv.virt))).asUInt
6937797f035SbugGenerator    val sfence_vpn = sfence_dup(3).bits.addr(sfence_dup(3).bits.addr.getWidth-1, offLen)
6947797f035SbugGenerator    when (sfence_dup(3).bits.rs1/*va*/) {
6957797f035SbugGenerator      when (sfence_dup(3).bits.rs2) {
6967797f035SbugGenerator        // all va && all asid
697*a1d4b4bfSpeixiaokun        l3v := l3v & ~l3hhit
6987797f035SbugGenerator      } .otherwise {
6997797f035SbugGenerator        // all va && specific asid except global
700*a1d4b4bfSpeixiaokun        l3v := l3v & l3g & ~l3hhit
7017797f035SbugGenerator      }
7027797f035SbugGenerator    } .otherwise {
7037797f035SbugGenerator      // val flushMask = UIntToOH(genTlbL2Idx(sfence.bits.addr(sfence.bits.addr.getWidth-1, offLen)))
7047797f035SbugGenerator      val flushSetIdxOH = UIntToOH(genPtwL3SetIdx(sfence_vpn))
7057797f035SbugGenerator      // val flushMask = VecInit(flushSetIdxOH.asBools.map(Fill(l2tlbParams.l3nWays, _.asUInt))).asUInt
7067797f035SbugGenerator      val flushMask = VecInit(flushSetIdxOH.asBools.map { a => Fill(l2tlbParams.l3nWays, a.asUInt) }).asUInt
7077797f035SbugGenerator      flushSetIdxOH.suggestName(s"sfence_nrs1_flushSetIdxOH")
7087797f035SbugGenerator      flushMask.suggestName(s"sfence_nrs1_flushMask")
7097797f035SbugGenerator
7107797f035SbugGenerator      when (sfence_dup(3).bits.rs2) {
7117797f035SbugGenerator        // specific leaf of addr && all asid
712*a1d4b4bfSpeixiaokun        l3v := l3v & ~flushMask & ~l3hhit
7137797f035SbugGenerator      } .otherwise {
7147797f035SbugGenerator        // specific leaf of addr && specific asid
715*a1d4b4bfSpeixiaokun        l3v := l3v & (~flushMask | l3g | ~l3hhit)
7167797f035SbugGenerator      }
7177797f035SbugGenerator    }
7187797f035SbugGenerator  }
7197797f035SbugGenerator
720*a1d4b4bfSpeixiaokun  // sfence for virtualization and hfencev, simple implementation for l3
721d0de7e4aSpeixiaokun  val hfencev_valid_l3 = sfence_dup(3).valid && sfence_dup(3).bits.hv
722*a1d4b4bfSpeixiaokun  when(hfencev_valid_l3) {
723cca17e78Speixiaokun    val flushMask = VecInit(l3h.flatMap(_.map(_  === onlyStage1))).asUInt
724d0de7e4aSpeixiaokun    l3v := l3v & ~flushMask // all VS-stage l3 pte
725d0de7e4aSpeixiaokun  }
726d0de7e4aSpeixiaokun
727d0de7e4aSpeixiaokun  // hfenceg, simple implementation for l3
728d0de7e4aSpeixiaokun  val hfenceg_valid_l3 = sfence_dup(3).valid && sfence_dup(3).bits.hg
729d0de7e4aSpeixiaokun  when(hfenceg_valid_l3) {
730cca17e78Speixiaokun    val flushMask = VecInit(l3h.flatMap(_.map(_ === onlyStage2))).asUInt
731d0de7e4aSpeixiaokun    l3v := l3v & ~flushMask // all G-stage l3 pte
732d0de7e4aSpeixiaokun  }
733d0de7e4aSpeixiaokun
734d0de7e4aSpeixiaokun
735d0de7e4aSpeixiaokun  val l1asidhit = VecInit(l1asids.map(_ === sfence_dup(0).bits.id)).asUInt
736d0de7e4aSpeixiaokun  val spasidhit = VecInit(spasids.map(_ === sfence_dup(0).bits.id)).asUInt
737d0de7e4aSpeixiaokun  val sfence_valid = sfence_dup(0).valid && !sfence_dup(0).bits.hg && !sfence_dup(0).bits.hv
738d0de7e4aSpeixiaokun  when (sfence_valid) {
739cca17e78Speixiaokun    val l1vmidhit = VecInit(l1vmids.map(_.getOrElse(0.U) === io.csr_dup(0).hgatp.asid)).asUInt
740cca17e78Speixiaokun    val spvmidhit = VecInit(spvmids.map(_.getOrElse(0.U) === io.csr_dup(0).hgatp.asid)).asUInt
741*a1d4b4bfSpeixiaokun    val l1hhit = VecInit(l1h.map(_ === onlyStage1 && io.csr_dup(0).priv.virt || !io.csr_dup(0).priv.virt)).asUInt
742*a1d4b4bfSpeixiaokun    val sphhit = VecInit(sph.map(_ === onlyStage1 && io.csr_dup(0).priv.virt || !io.csr_dup(0).priv.virt)).asUInt
743*a1d4b4bfSpeixiaokun    val l2hhit = VecInit(l2h.flatMap(_.map(_ === onlyStage1 && io.csr_dup(0).priv.virt || !io.csr_dup(0).priv.virt))).asUInt
7447797f035SbugGenerator    val sfence_vpn = sfence_dup(0).bits.addr(sfence_dup(0).bits.addr.getWidth-1, offLen)
745d0de7e4aSpeixiaokun    val l2h_set = getl2hSet(sfence_vpn)
7467797f035SbugGenerator
7477797f035SbugGenerator    when (sfence_dup(0).bits.rs1/*va*/) {
7487797f035SbugGenerator      when (sfence_dup(0).bits.rs2) {
7496d5ddbceSLemover        // all va && all asid
750d0de7e4aSpeixiaokun        l2v := l2v & ~l2hhit
7510214776eSpeixiaokun        l1v := l1v & ~(l1hhit & VecInit(UIntToOH(l1vmidhit).asBools.map{a => io.csr_dup(0).priv.virt && a || !io.csr_dup(0).priv.virt}).asUInt)
7520214776eSpeixiaokun        spv := spv & ~(l2hhit & VecInit(UIntToOH(spvmidhit).asBools.map{a => io.csr_dup(0).priv.virt && a || !io.csr_dup(0).priv.virt}).asUInt)
7536d5ddbceSLemover      } .otherwise {
7546d5ddbceSLemover        // all va && specific asid except global
755d0de7e4aSpeixiaokun        l2v := l2v & (l2g | ~l2hhit)
7560214776eSpeixiaokun        l1v := l1v & ~(~l1g & l1hhit & l1asidhit & VecInit(UIntToOH(l1vmidhit).asBools.map{a => io.csr_dup(0).priv.virt && a || !io.csr_dup(0).priv.virt}).asUInt)
7570214776eSpeixiaokun        spv := spv & ~(~spg & sphhit & spasidhit & VecInit(UIntToOH(spvmidhit).asBools.map{a => io.csr_dup(0).priv.virt && a || !io.csr_dup(0).priv.virt}).asUInt)
7586d5ddbceSLemover      }
7596d5ddbceSLemover    } .otherwise {
7607797f035SbugGenerator      when (sfence_dup(0).bits.rs2) {
7616d5ddbceSLemover        // specific leaf of addr && all asid
76282978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(sfence_vpn, sfence_dup(0).bits.id, io.csr_dup(0).hgatp.asid, ignoreAsid = true, s2xlate = io.csr_dup(0).priv.virt))).asUInt)
7636d5ddbceSLemover      } .otherwise {
7646d5ddbceSLemover        // specific leaf of addr && specific asid
76582978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(sfence_vpn, sfence_dup(0).bits.id, io.csr_dup(0).hgatp.asid, s2xlate = io.csr_dup(0).priv.virt))).asUInt | spg)
766d0de7e4aSpeixiaokun      }
767d0de7e4aSpeixiaokun    }
768d0de7e4aSpeixiaokun  }
769d0de7e4aSpeixiaokun
770d0de7e4aSpeixiaokun  val hfencev_valid = sfence_dup(0).valid && sfence_dup(0).bits.hv
771d0de7e4aSpeixiaokun  when (hfencev_valid) {
772cca17e78Speixiaokun    val l1vmidhit = VecInit(l1vmids.map(_.getOrElse(0.U) === io.csr_dup(0).hgatp.asid)).asUInt
773cca17e78Speixiaokun    val spvmidhit = VecInit(spvmids.map(_.getOrElse(0.U) === io.csr_dup(0).hgatp.asid)).asUInt
774cca17e78Speixiaokun    val l1hhit = VecInit(l1h.map(_ === onlyStage1)).asUInt
775cca17e78Speixiaokun    val sphhit = VecInit(sph.map(_ === onlyStage1)).asUInt
776cca17e78Speixiaokun    val l2hhit = VecInit(l2h.flatMap(_.map(_ === onlyStage1))).asUInt
777d0de7e4aSpeixiaokun    val hfencev_vpn = sfence_dup(0).bits.addr(sfence_dup(0).bits.addr.getWidth-1, offLen)
778d0de7e4aSpeixiaokun    when(sfence_dup(0).bits.rs1) {
779d0de7e4aSpeixiaokun      when(sfence_dup(0).bits.rs2) {
780d0de7e4aSpeixiaokun        l2v := l2v & ~l2hhit
781d0de7e4aSpeixiaokun        l1v := l1v & ~(l1hhit & l1vmidhit)
782d0de7e4aSpeixiaokun        spv := spv & ~(l2hhit & spvmidhit)
783d0de7e4aSpeixiaokun      }.otherwise {
784d0de7e4aSpeixiaokun        l2v := l2v & (l2g | ~l2hhit)
785d0de7e4aSpeixiaokun        l1v := l1v & ~(~l1g & l1hhit & l1asidhit & l1vmidhit)
786d0de7e4aSpeixiaokun        spv := spv & ~(~spg & sphhit & spasidhit & spvmidhit)
787d0de7e4aSpeixiaokun      }
788d0de7e4aSpeixiaokun    }.otherwise {
789d0de7e4aSpeixiaokun      when(sfence_dup(0).bits.rs2) {
79082978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(hfencev_vpn, sfence_dup(0).bits.id, io.csr_dup(0).hgatp.asid, ignoreAsid = true, s2xlate = true.B))).asUInt)
791d0de7e4aSpeixiaokun      }.otherwise {
79282978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(hfencev_vpn, sfence_dup(0).bits.id, io.csr_dup(0).hgatp.asid, s2xlate = true.B))).asUInt | spg)
793d0de7e4aSpeixiaokun      }
794d0de7e4aSpeixiaokun    }
795d0de7e4aSpeixiaokun  }
796d0de7e4aSpeixiaokun
797d0de7e4aSpeixiaokun
798d0de7e4aSpeixiaokun  val hfenceg_valid = sfence_dup(0).valid && sfence_dup(0).bits.hg
799d0de7e4aSpeixiaokun  when(hfenceg_valid) {
800cca17e78Speixiaokun    val l1vmidhit = VecInit(l1vmids.map(_.getOrElse(0.U) === sfence_dup(0).bits.id)).asUInt
801cca17e78Speixiaokun    val spvmidhit = VecInit(spvmids.map(_.getOrElse(0.U) === sfence_dup(0).bits.id)).asUInt
802cca17e78Speixiaokun    val l1hhit = VecInit(l1h.map(_ === onlyStage2)).asUInt
803cca17e78Speixiaokun    val sphhit = VecInit(sph.map(_ === onlyStage2)).asUInt
804cca17e78Speixiaokun    val l2hhit = VecInit(l2h.flatMap(_.map(_ === onlyStage2))).asUInt
805d0de7e4aSpeixiaokun    val hfenceg_gvpn = sfence_dup(0).bits.addr(sfence_dup(0).bits.addr.getWidth - 1, offLen)
806d0de7e4aSpeixiaokun    when(sfence_dup(0).bits.rs1) {
807d0de7e4aSpeixiaokun      when(sfence_dup(0).bits.rs2) {
808d0de7e4aSpeixiaokun        l2v := l2v & ~l2hhit
809d0de7e4aSpeixiaokun        l1v := l1v & ~l1hhit
810d0de7e4aSpeixiaokun        spv := spv & ~sphhit
811d0de7e4aSpeixiaokun      }.otherwise {
812d0de7e4aSpeixiaokun        l2v := l2v & ~l2hhit
813d0de7e4aSpeixiaokun        l1v := l1v & ~(l1hhit & l1vmidhit)
814d0de7e4aSpeixiaokun        spv := spv & ~(sphhit & spvmidhit)
815d0de7e4aSpeixiaokun      }
816d0de7e4aSpeixiaokun    }.otherwise {
817d0de7e4aSpeixiaokun      when(sfence_dup(0).bits.rs2) {
81882978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(hfenceg_gvpn, 0.U, sfence_dup(0).bits.id, ignoreAsid = true, s2xlate = true.B))).asUInt)
819d0de7e4aSpeixiaokun      }.otherwise {
82082978df9Speixiaokun        spv := spv & (~VecInit(sp.map(_.hit(hfenceg_gvpn, 0.U, sfence_dup(0).bits.id, ignoreAsid = true, s2xlate = false.B))).asUInt)
8216d5ddbceSLemover      }
8226d5ddbceSLemover    }
8236d5ddbceSLemover  }
8246d5ddbceSLemover
8257797f035SbugGenerator  def InsideStageConnect(in: DecoupledIO[PtwCacheReq], out: DecoupledIO[PtwCacheReq], inFire: Bool): Unit = {
8262c86e165SZhangZifei    in.ready := !in.valid || out.ready
8272c86e165SZhangZifei    out.valid := in.valid
8282c86e165SZhangZifei    out.bits := in.bits
8291f4a7c0cSLemover    out.bits.bypassed.zip(in.bits.bypassed).zipWithIndex.map{ case (b, i) =>
8307797f035SbugGenerator      val bypassed_reg = Reg(Bool())
831d0de7e4aSpeixiaokun      val bypassed_wire = refill_bypass(in.bits.req_info.vpn, i, in.bits.req_info.s2xlate) && io.refill.valid
8327797f035SbugGenerator      when (inFire) { bypassed_reg := bypassed_wire }
8337797f035SbugGenerator      .elsewhen (io.refill.valid) { bypassed_reg := bypassed_reg || bypassed_wire }
8347797f035SbugGenerator
8357797f035SbugGenerator      b._1 := b._2 || (bypassed_wire || (bypassed_reg && !inFire))
8361f4a7c0cSLemover    }
8372c86e165SZhangZifei  }
8382c86e165SZhangZifei
8396d5ddbceSLemover  // Perf Count
8406c4dcc2dSLemover  val resp_l3 = resp_res.l3.hit
8416c4dcc2dSLemover  val resp_sp = resp_res.sp.hit
8426c4dcc2dSLemover  val resp_l1_pre = resp_res.l1.pre
8436c4dcc2dSLemover  val resp_l2_pre = resp_res.l2.pre
8446c4dcc2dSLemover  val resp_l3_pre = resp_res.l3.pre
8456c4dcc2dSLemover  val resp_sp_pre = resp_res.sp.pre
846935edac4STang Haojin  val base_valid_access_0 = !from_pre(io.resp.bits.req_info.source) && io.resp.fire
847bc063562SLemover  XSPerfAccumulate("access", base_valid_access_0)
848bc063562SLemover  XSPerfAccumulate("l1_hit", base_valid_access_0 && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
849bc063562SLemover  XSPerfAccumulate("l2_hit", base_valid_access_0 && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
850bc063562SLemover  XSPerfAccumulate("l3_hit", base_valid_access_0 && resp_l3)
851bc063562SLemover  XSPerfAccumulate("sp_hit", base_valid_access_0 && resp_sp)
852bc063562SLemover  XSPerfAccumulate("pte_hit",base_valid_access_0 && io.resp.bits.hit)
853bc063562SLemover
854bc063562SLemover  XSPerfAccumulate("l1_hit_pre", base_valid_access_0 && resp_l1_pre && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
855bc063562SLemover  XSPerfAccumulate("l2_hit_pre", base_valid_access_0 && resp_l2_pre && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
856bc063562SLemover  XSPerfAccumulate("l3_hit_pre", base_valid_access_0 && resp_l3_pre && resp_l3)
857bc063562SLemover  XSPerfAccumulate("sp_hit_pre", base_valid_access_0 && resp_sp_pre && resp_sp)
858bc063562SLemover  XSPerfAccumulate("pte_hit_pre",base_valid_access_0 && (resp_l3_pre && resp_l3 || resp_sp_pre && resp_sp) && io.resp.bits.hit)
859bc063562SLemover
860935edac4STang Haojin  val base_valid_access_1 = from_pre(io.resp.bits.req_info.source) && io.resp.fire
861bc063562SLemover  XSPerfAccumulate("pre_access", base_valid_access_1)
862bc063562SLemover  XSPerfAccumulate("pre_l1_hit", base_valid_access_1 && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
863bc063562SLemover  XSPerfAccumulate("pre_l2_hit", base_valid_access_1 && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
864bc063562SLemover  XSPerfAccumulate("pre_l3_hit", base_valid_access_1 && resp_l3)
865bc063562SLemover  XSPerfAccumulate("pre_sp_hit", base_valid_access_1 && resp_sp)
866bc063562SLemover  XSPerfAccumulate("pre_pte_hit",base_valid_access_1 && io.resp.bits.hit)
867bc063562SLemover
868bc063562SLemover  XSPerfAccumulate("pre_l1_hit_pre", base_valid_access_1 && resp_l1_pre && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
869bc063562SLemover  XSPerfAccumulate("pre_l2_hit_pre", base_valid_access_1 && resp_l2_pre && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
870bc063562SLemover  XSPerfAccumulate("pre_l3_hit_pre", base_valid_access_1 && resp_l3_pre && resp_l3)
871bc063562SLemover  XSPerfAccumulate("pre_sp_hit_pre", base_valid_access_1 && resp_sp_pre && resp_sp)
872bc063562SLemover  XSPerfAccumulate("pre_pte_hit_pre",base_valid_access_1 && (resp_l3_pre && resp_l3 || resp_sp_pre && resp_sp) && io.resp.bits.hit)
873bc063562SLemover
874935edac4STang Haojin  val base_valid_access_2 = stageResp.bits.isFirst && !from_pre(io.resp.bits.req_info.source) && io.resp.fire
875bc063562SLemover  XSPerfAccumulate("access_first", base_valid_access_2)
876bc063562SLemover  XSPerfAccumulate("l1_hit_first", base_valid_access_2 && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
877bc063562SLemover  XSPerfAccumulate("l2_hit_first", base_valid_access_2 && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
878bc063562SLemover  XSPerfAccumulate("l3_hit_first", base_valid_access_2 && resp_l3)
879bc063562SLemover  XSPerfAccumulate("sp_hit_first", base_valid_access_2 && resp_sp)
880bc063562SLemover  XSPerfAccumulate("pte_hit_first",base_valid_access_2 && io.resp.bits.hit)
881bc063562SLemover
882bc063562SLemover  XSPerfAccumulate("l1_hit_pre_first", base_valid_access_2 && resp_l1_pre && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
883bc063562SLemover  XSPerfAccumulate("l2_hit_pre_first", base_valid_access_2 && resp_l2_pre && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
884bc063562SLemover  XSPerfAccumulate("l3_hit_pre_first", base_valid_access_2 && resp_l3_pre && resp_l3)
885bc063562SLemover  XSPerfAccumulate("sp_hit_pre_first", base_valid_access_2 && resp_sp_pre && resp_sp)
886bc063562SLemover  XSPerfAccumulate("pte_hit_pre_first",base_valid_access_2 && (resp_l3_pre && resp_l3 || resp_sp_pre && resp_sp) && io.resp.bits.hit)
887bc063562SLemover
888935edac4STang Haojin  val base_valid_access_3 = stageResp.bits.isFirst && from_pre(io.resp.bits.req_info.source) && io.resp.fire
889bc063562SLemover  XSPerfAccumulate("pre_access_first", base_valid_access_3)
890bc063562SLemover  XSPerfAccumulate("pre_l1_hit_first", base_valid_access_3 && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
891bc063562SLemover  XSPerfAccumulate("pre_l2_hit_first", base_valid_access_3 && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
892bc063562SLemover  XSPerfAccumulate("pre_l3_hit_first", base_valid_access_3 && resp_l3)
893bc063562SLemover  XSPerfAccumulate("pre_sp_hit_first", base_valid_access_3 && resp_sp)
894bc063562SLemover  XSPerfAccumulate("pre_pte_hit_first", base_valid_access_3 && io.resp.bits.hit)
895bc063562SLemover
896bc063562SLemover  XSPerfAccumulate("pre_l1_hit_pre_first", base_valid_access_3 && resp_l1_pre && io.resp.bits.toFsm.l1Hit && !io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
897bc063562SLemover  XSPerfAccumulate("pre_l2_hit_pre_first", base_valid_access_3 && resp_l2_pre && io.resp.bits.toFsm.l2Hit && !io.resp.bits.hit)
898bc063562SLemover  XSPerfAccumulate("pre_l3_hit_pre_first", base_valid_access_3 && resp_l3_pre && resp_l3)
899bc063562SLemover  XSPerfAccumulate("pre_sp_hit_pre_first", base_valid_access_3 && resp_sp_pre && resp_sp)
900bc063562SLemover  XSPerfAccumulate("pre_pte_hit_pre_first",base_valid_access_3 && (resp_l3_pre && resp_l3 || resp_sp_pre && resp_sp) && io.resp.bits.hit)
901bc063562SLemover
9026d5ddbceSLemover  XSPerfAccumulate("rwHarzad", io.req.valid && !io.req.ready)
9036d5ddbceSLemover  XSPerfAccumulate("out_blocked", io.resp.valid && !io.resp.ready)
9046d5ddbceSLemover  l1AccessPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L1AccessIndex${i}", l) }
9056d5ddbceSLemover  l2AccessPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L2AccessIndex${i}", l) }
9066d5ddbceSLemover  l3AccessPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L3AccessIndex${i}", l) }
9076d5ddbceSLemover  spAccessPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"SPAccessIndex${i}", l) }
9086d5ddbceSLemover  l1RefillPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L1RefillIndex${i}", l) }
9096d5ddbceSLemover  l2RefillPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L2RefillIndex${i}", l) }
9106d5ddbceSLemover  l3RefillPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"L3RefillIndex${i}", l) }
9116d5ddbceSLemover  spRefillPerf.zipWithIndex.map{ case (l, i) => XSPerfAccumulate(s"SPRefillIndex${i}", l) }
9126d5ddbceSLemover
913bc063562SLemover  XSPerfAccumulate("l1Refill", Cat(l1RefillPerf).orR)
914bc063562SLemover  XSPerfAccumulate("l2Refill", Cat(l2RefillPerf).orR)
915bc063562SLemover  XSPerfAccumulate("l3Refill", Cat(l3RefillPerf).orR)
916bc063562SLemover  XSPerfAccumulate("spRefill", Cat(spRefillPerf).orR)
9177797f035SbugGenerator  XSPerfAccumulate("l1Refill_pre", Cat(l1RefillPerf).orR && refill_prefetch_dup(0))
9187797f035SbugGenerator  XSPerfAccumulate("l2Refill_pre", Cat(l2RefillPerf).orR && refill_prefetch_dup(0))
9197797f035SbugGenerator  XSPerfAccumulate("l3Refill_pre", Cat(l3RefillPerf).orR && refill_prefetch_dup(0))
9207797f035SbugGenerator  XSPerfAccumulate("spRefill_pre", Cat(spRefillPerf).orR && refill_prefetch_dup(0))
921bc063562SLemover
9226d5ddbceSLemover  // debug
9237797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] original v and g vector:\n")
9247797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] l1v:${Binary(l1v)}\n")
9257797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] l2v:${Binary(l2v)}\n")
9267797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] l3v:${Binary(l3v)}\n")
9277797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] l3g:${Binary(l3g)}\n")
9287797f035SbugGenerator  XSDebug(sfence_dup(0).valid, p"[sfence] spv:${Binary(spv)}\n")
9297797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] new v and g vector:\n")
9307797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] l1v:${Binary(l1v)}\n")
9317797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] l2v:${Binary(l2v)}\n")
9327797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] l3v:${Binary(l3v)}\n")
9337797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] l3g:${Binary(l3g)}\n")
9347797f035SbugGenerator  XSDebug(RegNext(sfence_dup(0).valid), p"[sfence] spv:${Binary(spv)}\n")
935cd365d4cSrvcoresjw
936cd365d4cSrvcoresjw  val perfEvents = Seq(
93756be8e20SYinan Xu    ("access           ", base_valid_access_0             ),
938cd365d4cSrvcoresjw    ("l1_hit           ", l1Hit                           ),
939cd365d4cSrvcoresjw    ("l2_hit           ", l2Hit                           ),
940cd365d4cSrvcoresjw    ("l3_hit           ", l3Hit                           ),
941cd365d4cSrvcoresjw    ("sp_hit           ", spHit                           ),
942cd365d4cSrvcoresjw    ("pte_hit          ", l3Hit || spHit                  ),
943cd365d4cSrvcoresjw    ("rwHarzad         ",  io.req.valid && !io.req.ready  ),
944cd365d4cSrvcoresjw    ("out_blocked      ",  io.resp.valid && !io.resp.ready),
945cd365d4cSrvcoresjw  )
9461ca0e4f3SYinan Xu  generatePerfEvent()
9476d5ddbceSLemover}
948