xref: /XiangShan/src/main/scala/xiangshan/cache/mmu/Repeater.scala (revision 45f497a4abde3fa5930268b418d634554b21b0b8)
16d5ddbceSLemover/***************************************************************************************
26d5ddbceSLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
46d5ddbceSLemover*
56d5ddbceSLemover* XiangShan is licensed under Mulan PSL v2.
66d5ddbceSLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
76d5ddbceSLemover* You may obtain a copy of Mulan PSL v2 at:
86d5ddbceSLemover*          http://license.coscl.org.cn/MulanPSL2
96d5ddbceSLemover*
106d5ddbceSLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
116d5ddbceSLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
126d5ddbceSLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
136d5ddbceSLemover*
146d5ddbceSLemover* See the Mulan PSL v2 for more details.
156d5ddbceSLemover***************************************************************************************/
166d5ddbceSLemover
176d5ddbceSLemoverpackage xiangshan.cache.mmu
186d5ddbceSLemover
196d5ddbceSLemoverimport chipsalliance.rocketchip.config.Parameters
206d5ddbceSLemoverimport chisel3._
216d5ddbceSLemoverimport chisel3.util._
226d5ddbceSLemoverimport xiangshan._
236d5ddbceSLemoverimport xiangshan.cache.{HasDCacheParameters, MemoryOpConstants}
246d5ddbceSLemoverimport utils._
256d5ddbceSLemoverimport freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
266d5ddbceSLemoverimport freechips.rocketchip.tilelink._
276d5ddbceSLemover
28*45f497a4Shappy-lxclass PTWReapterIO(Width: Int)(implicit p: Parameters) extends MMUIOBaseBundle {
296d5ddbceSLemover  val tlb = Flipped(new TlbPtwIO(Width))
306d5ddbceSLemover  val ptw = new TlbPtwIO
31*45f497a4Shappy-lx
32*45f497a4Shappy-lx  override def cloneType: this.type = (new PTWReapterIO(Width)).asInstanceOf[this.type]
33*45f497a4Shappy-lx}
34*45f497a4Shappy-lx
35*45f497a4Shappy-lxclass PTWRepeater(Width: Int = 1)(implicit p: Parameters) extends XSModule with HasPtwConst {
36*45f497a4Shappy-lx  val io = IO(new PTWReapterIO(Width))
37*45f497a4Shappy-lx
386d5ddbceSLemover  val req_in = if (Width == 1) {
396d5ddbceSLemover    io.tlb.req(0)
406d5ddbceSLemover  } else {
416d5ddbceSLemover    val arb = Module(new RRArbiter(io.tlb.req(0).bits.cloneType, Width))
426d5ddbceSLemover    arb.io.in <> io.tlb.req
436d5ddbceSLemover    arb.io.out
446d5ddbceSLemover  }
45*45f497a4Shappy-lx  val (tlb, ptw, flush) = (io.tlb, io.ptw, RegNext(io.sfence.valid || io.csr.satp.changed))
466d5ddbceSLemover  val req = RegEnable(req_in.bits, req_in.fire())
476d5ddbceSLemover  val resp = RegEnable(ptw.resp.bits, ptw.resp.fire())
48*45f497a4Shappy-lx  val haveOne = BoolStopWatch(req_in.fire(), tlb.resp.fire() || flush)
49*45f497a4Shappy-lx  val sent = BoolStopWatch(ptw.req(0).fire(), req_in.fire() || flush)
50*45f497a4Shappy-lx  val recv = BoolStopWatch(ptw.resp.fire(), req_in.fire() || flush)
516d5ddbceSLemover
526d5ddbceSLemover  req_in.ready := !haveOne
536d5ddbceSLemover  ptw.req(0).valid := haveOne && !sent
546d5ddbceSLemover  ptw.req(0).bits := req
556d5ddbceSLemover
566d5ddbceSLemover  tlb.resp.bits := resp
576d5ddbceSLemover  tlb.resp.valid := haveOne && recv
586d5ddbceSLemover  ptw.resp.ready := !recv
596d5ddbceSLemover
606d5ddbceSLemover  XSPerfAccumulate("req_count", ptw.req(0).fire())
61*45f497a4Shappy-lx  XSPerfAccumulate("tlb_req_cycle", BoolStopWatch(req_in.fire(), tlb.resp.fire() || flush))
62*45f497a4Shappy-lx  XSPerfAccumulate("ptw_req_cycle", BoolStopWatch(ptw.req(0).fire(), ptw.resp.fire() || flush))
636d5ddbceSLemover
64*45f497a4Shappy-lx  XSDebug(haveOne, p"haveOne:${haveOne} sent:${sent} recv:${recv} sfence:${flush} req:${req} resp:${resp}")
656d5ddbceSLemover  XSDebug(req_in.valid || io.tlb.resp.valid, p"tlb: ${tlb}\n")
666d5ddbceSLemover  XSDebug(io.ptw.req(0).valid || io.ptw.resp.valid, p"ptw: ${ptw}\n")
676d5ddbceSLemover  assert(!RegNext(recv && io.ptw.resp.valid, init = false.B), "re-receive ptw.resp")
689bd9cdfaSLemover  TimeOutAssert(sent && !recv, timeOutThreshold, "Repeater doesn't recv resp in time")
696d5ddbceSLemover}
706d5ddbceSLemover
716d5ddbceSLemover/* dtlb
726d5ddbceSLemover *
736d5ddbceSLemover */
74*45f497a4Shappy-lxclass PTWFilterIO(Width: Int)(implicit p: Parameters) extends MMUIOBaseBundle {
75a0301c0dSLemover  val tlb = Flipped(new BTlbPtwIO(Width))
76a0301c0dSLemover  val ptw = new TlbPtwIO()
776d5ddbceSLemover
78*45f497a4Shappy-lx  override def cloneType: this.type = (new PTWFilterIO(Width)).asInstanceOf[this.type]
79*45f497a4Shappy-lx}
80*45f497a4Shappy-lx
81*45f497a4Shappy-lxclass PTWFilter(Width: Int, Size: Int)(implicit p: Parameters) extends XSModule with HasPtwConst {
826d5ddbceSLemover  require(Size >= Width)
836d5ddbceSLemover
84*45f497a4Shappy-lx  val io = IO(new PTWFilterIO(Width))
85*45f497a4Shappy-lx
866d5ddbceSLemover  val v = RegInit(VecInit(Seq.fill(Size)(false.B)))
87a0301c0dSLemover  val ports = Reg(Vec(Size, Vec(Width, Bool()))) // record which port(s) the entry come from, may not able to cover all the ports
886d5ddbceSLemover  val vpn = Reg(Vec(Size, UInt(vpnLen.W)))
896d5ddbceSLemover  val enqPtr = RegInit(0.U(log2Up(Size).W)) // Enq
906d5ddbceSLemover  val issPtr = RegInit(0.U(log2Up(Size).W)) // Iss to Ptw
916d5ddbceSLemover  val deqPtr = RegInit(0.U(log2Up(Size).W)) // Deq
926d5ddbceSLemover  val mayFullDeq = RegInit(false.B)
936d5ddbceSLemover  val mayFullIss = RegInit(false.B)
946d5ddbceSLemover  val counter = RegInit(0.U(log2Up(Size+1).W))
956d5ddbceSLemover
96*45f497a4Shappy-lx  val flush = RegNext(io.sfence.valid || io.csr.satp.changed)
976d5ddbceSLemover  val ptwResp = RegEnable(io.ptw.resp.bits, io.ptw.resp.fire())
986d5ddbceSLemover  val ptwResp_valid = RegNext(io.ptw.resp.valid, init = false.B)
99a0301c0dSLemover  val tlb_req = io.tlb.req
100a0301c0dSLemover  val oldMatchVec = tlb_req.map(a => vpn.zip(v).map{case (pi, vi) => vi && a.valid && pi === a.bits.vpn })
101a0301c0dSLemover  val newMatchVec = tlb_req.map(a => tlb_req.map(b => b.valid && a.valid && b.bits.vpn === a.bits.vpn ))
102*45f497a4Shappy-lx  val ptwResp_newMatchVec = tlb_req.map(a => ptwResp_valid && ptwResp.entry.hit(a.bits.vpn, io.csr.satp.asid, allType = true) && a.valid) // TODO: may have long latency
103*45f497a4Shappy-lx  val ptwResp_oldMatchVec = vpn.zip(v).map{ case (pi, vi) => vi && ptwResp.entry.hit(pi, io.csr.satp.asid, allType = true) }
104a0301c0dSLemover  val update_ports = v.indices.map(i => oldMatchVec.map(j => j(i)))
105a0301c0dSLemover  val ports_init = (0 until Width).map(i => (1 << i).U(Width.W))
106a0301c0dSLemover  val filter_ports = (0 until Width).map(i => ParallelMux(newMatchVec(i).zip(ports_init).drop(i)))
107a0301c0dSLemover  val resp_vector = ParallelMux(ptwResp_oldMatchVec zip ports)
108a0301c0dSLemover  val resp_still_valid = ParallelOR(ptwResp_oldMatchVec).asBool
1096d5ddbceSLemover
110a0301c0dSLemover  def canMerge(index: Int) : Bool = {
111a0301c0dSLemover    ptwResp_newMatchVec(index) ||
112a0301c0dSLemover    Cat(oldMatchVec(index)).orR ||
113a0301c0dSLemover    Cat(newMatchVec(index).take(index)).orR
114a0301c0dSLemover  }
115a0301c0dSLemover
116a0301c0dSLemover  def filter_req() = {
117a0301c0dSLemover    val reqs =  tlb_req.indices.map{ i =>
118a0301c0dSLemover      val req = Wire(ValidIO(new PtwReq()))
119a0301c0dSLemover      val merge = canMerge(i)
120a0301c0dSLemover      req.bits := tlb_req(i).bits
121a0301c0dSLemover      req.valid := !merge && tlb_req(i).valid
122a0301c0dSLemover      req
123a0301c0dSLemover    }
124a0301c0dSLemover    reqs
125a0301c0dSLemover  }
126a0301c0dSLemover
127a0301c0dSLemover  val reqs = filter_req()
128a0301c0dSLemover  val req_ports = filter_ports
1296d5ddbceSLemover  var enqPtr_next = WireInit(deqPtr)
1306d5ddbceSLemover  val isFull = enqPtr === deqPtr && mayFullDeq
1316d5ddbceSLemover  val isEmptyDeq = enqPtr === deqPtr && !mayFullDeq
1326d5ddbceSLemover  val isEmptyIss = enqPtr === issPtr && !mayFullIss
1336d5ddbceSLemover  val accumEnqNum = (0 until Width).map(i => PopCount(reqs.take(i).map(_.valid)))
1346d5ddbceSLemover  val enqPtrVec = VecInit((0 until Width).map(i => enqPtr + accumEnqNum(i)))
1356d5ddbceSLemover  val enqNum = PopCount(reqs.map(_.valid))
1366d5ddbceSLemover  val canEnqueue = counter +& enqNum <= Size.U
1376d5ddbceSLemover
1386d5ddbceSLemover  io.tlb.req.map(_.ready := true.B) // NOTE: just drop un-fire reqs
139a0301c0dSLemover  io.tlb.resp.valid := ptwResp_valid && resp_still_valid
140a0301c0dSLemover  io.tlb.resp.bits.data := ptwResp
141a0301c0dSLemover  io.tlb.resp.bits.vector := resp_vector
142*45f497a4Shappy-lx  io.ptw.req(0).valid := v(issPtr) && !isEmptyIss && !(ptwResp_valid && ptwResp.entry.hit(io.ptw.req(0).bits.vpn, io.csr.satp.asid, ignoreAsid = true))
1436d5ddbceSLemover  io.ptw.req(0).bits.vpn := vpn(issPtr)
1446d5ddbceSLemover  io.ptw.resp.ready := true.B
1456d5ddbceSLemover
1466d5ddbceSLemover  reqs.zipWithIndex.map{
1476d5ddbceSLemover    case (req, i) =>
1486d5ddbceSLemover      when (req.valid && canEnqueue) {
1496d5ddbceSLemover        v(enqPtrVec(i)) := true.B
1506d5ddbceSLemover        vpn(enqPtrVec(i)) := req.bits.vpn
151a0301c0dSLemover        ports(enqPtrVec(i)) := req_ports(i).asBools
152a0301c0dSLemover      }
153a0301c0dSLemover  }
154a0301c0dSLemover  for (i <- ports.indices) {
155a0301c0dSLemover    when (v(i)) {
156a0301c0dSLemover      ports(i) := ports(i).zip(update_ports(i)).map(a => a._1 || a._2)
1576d5ddbceSLemover    }
1586d5ddbceSLemover  }
1596d5ddbceSLemover
1606d5ddbceSLemover  val do_enq = canEnqueue && Cat(reqs.map(_.valid)).orR
1616d5ddbceSLemover  val do_deq = (!v(deqPtr) && !isEmptyDeq)
1626d5ddbceSLemover  val do_iss = io.ptw.req(0).fire() || (!v(issPtr) && !isEmptyIss)
1636d5ddbceSLemover  when (do_enq) {
1646d5ddbceSLemover    enqPtr := enqPtr + enqNum
1656d5ddbceSLemover  }
1666d5ddbceSLemover  when (do_deq) {
1676d5ddbceSLemover    deqPtr := deqPtr + 1.U
1686d5ddbceSLemover  }
1696d5ddbceSLemover  when (do_iss) {
1706d5ddbceSLemover    issPtr := issPtr + 1.U
1716d5ddbceSLemover  }
1726d5ddbceSLemover  when (do_enq =/= do_deq) {
1736d5ddbceSLemover    mayFullDeq := do_enq
1746d5ddbceSLemover  }
1756d5ddbceSLemover  when (do_enq =/= do_iss) {
1766d5ddbceSLemover    mayFullIss := do_enq
1776d5ddbceSLemover  }
1786d5ddbceSLemover
1796d5ddbceSLemover  when (ptwResp_valid) {
180a0301c0dSLemover    v.zip(ptwResp_oldMatchVec).map{ case (vi, mi) => when (mi) { vi := false.B }}
1816d5ddbceSLemover  }
1826d5ddbceSLemover
1836d5ddbceSLemover  counter := counter - do_deq + Mux(do_enq, enqNum, 0.U)
1846d5ddbceSLemover  assert(counter <= Size.U, "counter should be less than Size")
1856d5ddbceSLemover  when (counter === 0.U) {
1866d5ddbceSLemover    assert(!io.ptw.req(0).fire(), "when counter is 0, should not req")
1876d5ddbceSLemover    assert(isEmptyDeq && isEmptyIss, "when counter is 0, should be empty")
1886d5ddbceSLemover  }
1896d5ddbceSLemover  when (counter === Size.U) {
1906d5ddbceSLemover    assert(mayFullDeq, "when counter is Size, should be full")
1916d5ddbceSLemover  }
1926d5ddbceSLemover
193*45f497a4Shappy-lx  when (flush) {
1946d5ddbceSLemover    v.map(_ := false.B)
1956d5ddbceSLemover    deqPtr := 0.U
1966d5ddbceSLemover    enqPtr := 0.U
1976d5ddbceSLemover    issPtr := 0.U
1986d5ddbceSLemover    ptwResp_valid := false.B
1996d5ddbceSLemover    mayFullDeq := false.B
2006d5ddbceSLemover    mayFullIss := false.B
2016d5ddbceSLemover    counter := 0.U
2026d5ddbceSLemover  }
2036d5ddbceSLemover
2046d5ddbceSLemover  // perf
2056d5ddbceSLemover  val inflight_counter = RegInit(0.U(log2Up(Size + 1).W))
2066d5ddbceSLemover  when (io.ptw.req(0).fire() =/= io.ptw.resp.fire()) {
2076d5ddbceSLemover    inflight_counter := Mux(io.ptw.req(0).fire(), inflight_counter + 1.U, inflight_counter - 1.U)
2086d5ddbceSLemover  }
209*45f497a4Shappy-lx  when (flush) {
2106d5ddbceSLemover    inflight_counter := 0.U
2116d5ddbceSLemover  }
2126d5ddbceSLemover  XSPerfAccumulate("tlb_req_count", PopCount(Cat(io.tlb.req.map(_.valid))))
2136d5ddbceSLemover  XSPerfAccumulate("tlb_req_count_filtered", Mux(do_enq, accumEnqNum(Width - 1), 0.U))
2146d5ddbceSLemover  XSPerfAccumulate("ptw_req_count", io.ptw.req(0).fire())
2156d5ddbceSLemover  XSPerfAccumulate("ptw_req_cycle", inflight_counter)
2166d5ddbceSLemover  XSPerfAccumulate("tlb_resp_count", io.tlb.resp.fire())
2176d5ddbceSLemover  XSPerfAccumulate("ptw_resp_count", io.ptw.resp.fire())
2186d5ddbceSLemover  XSPerfAccumulate("inflight_cycle", !isEmptyDeq)
2196d5ddbceSLemover  for (i <- 0 until Size + 1) {
2206d5ddbceSLemover    XSPerfAccumulate(s"counter${i}", counter === i.U)
2216d5ddbceSLemover  }
2229bd9cdfaSLemover
2239bd9cdfaSLemover  for (i <- 0 until Size) {
2249bd9cdfaSLemover    TimeOutAssert(v(i), timeOutThreshold, s"Filter ${i} doesn't recv resp in time")
2259bd9cdfaSLemover  }
2266d5ddbceSLemover}
227