xref: /XiangShan/src/main/scala/xiangshan/frontend/icache/ICacheMissUnit.scala (revision 00240ba60853d0c9a5dc31089dee22d7fe1d7afd)
11d8f4dcbSJay/***************************************************************************************
21d8f4dcbSJay* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
31d8f4dcbSJay* Copyright (c) 2020-2021 Peng Cheng Laboratory
41d8f4dcbSJay*
51d8f4dcbSJay* XiangShan is licensed under Mulan PSL v2.
61d8f4dcbSJay* You can use this software according to the terms and conditions of the Mulan PSL v2.
71d8f4dcbSJay* You may obtain a copy of Mulan PSL v2 at:
81d8f4dcbSJay*          http://license.coscl.org.cn/MulanPSL2
91d8f4dcbSJay*
101d8f4dcbSJay* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
111d8f4dcbSJay* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
121d8f4dcbSJay* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
131d8f4dcbSJay*
141d8f4dcbSJay* See the Mulan PSL v2 for more details.
151d8f4dcbSJay***************************************************************************************/
161d8f4dcbSJay
171d8f4dcbSJaypackage xiangshan.frontend.icache
181d8f4dcbSJay
191d8f4dcbSJayimport chipsalliance.rocketchip.config.Parameters
201d8f4dcbSJayimport chisel3._
211d8f4dcbSJayimport chisel3.util._
221d8f4dcbSJayimport freechips.rocketchip.diplomacy.IdRange
231d8f4dcbSJayimport freechips.rocketchip.tilelink.ClientStates._
241d8f4dcbSJayimport freechips.rocketchip.tilelink.TLPermissions._
251d8f4dcbSJayimport freechips.rocketchip.tilelink._
261d8f4dcbSJayimport xiangshan._
271d8f4dcbSJayimport huancun.{AliasKey, DirtyKey}
281d8f4dcbSJayimport xiangshan.cache._
291d8f4dcbSJayimport utils._
301d8f4dcbSJay
311d8f4dcbSJay
321d8f4dcbSJayabstract class ICacheMissUnitModule(implicit p: Parameters) extends XSModule
331d8f4dcbSJay  with HasICacheParameters
341d8f4dcbSJay
351d8f4dcbSJayabstract class ICacheMissUnitBundle(implicit p: Parameters) extends XSBundle
361d8f4dcbSJay  with HasICacheParameters
371d8f4dcbSJay
381d8f4dcbSJayclass ICacheMissReq(implicit p: Parameters) extends ICacheBundle
391d8f4dcbSJay{
401d8f4dcbSJay    val paddr      = UInt(PAddrBits.W)
411d8f4dcbSJay    val vaddr      = UInt(VAddrBits.W)
421d8f4dcbSJay    val waymask   = UInt(nWays.W)
431d8f4dcbSJay    val coh       = new ClientMetadata
441d8f4dcbSJay
451d8f4dcbSJay    def getVirSetIdx = get_idx(vaddr)
461d8f4dcbSJay    def getPhyTag    = get_phy_tag(paddr)
471d8f4dcbSJay}
481d8f4dcbSJay
491d8f4dcbSJay
501d8f4dcbSJayclass ICacheMissResp(implicit p: Parameters) extends ICacheBundle
511d8f4dcbSJay{
521d8f4dcbSJay    val data     = UInt(blockBits.W)
5358dbdfc2SJay    val corrupt  = Bool()
541d8f4dcbSJay}
551d8f4dcbSJay
561d8f4dcbSJayclass ICacheMissBundle(implicit p: Parameters) extends ICacheBundle{
571d8f4dcbSJay    val req       =   Vec(2, Flipped(DecoupledIO(new ICacheMissReq)))
581d8f4dcbSJay    val resp      =   Vec(2,ValidIO(new ICacheMissResp))
591d8f4dcbSJay    val flush     =   Input(Bool())
601d8f4dcbSJay}
611d8f4dcbSJay
621d8f4dcbSJay
631d8f4dcbSJayclass ICacheMissEntry(edge: TLEdgeOut, id: Int)(implicit p: Parameters) extends ICacheMissUnitModule
641d8f4dcbSJay  with MemoryOpConstants
651d8f4dcbSJay{
661d8f4dcbSJay  val io = IO(new Bundle {
677052722fSJay    val id = Input(UInt(log2Ceil(PortNumber).W))
681d8f4dcbSJay
691d8f4dcbSJay    val req = Flipped(DecoupledIO(new ICacheMissReq))
701d8f4dcbSJay    val resp = ValidIO(new ICacheMissResp)
711d8f4dcbSJay
721d8f4dcbSJay    //tilelink channel
731d8f4dcbSJay    val mem_acquire = DecoupledIO(new TLBundleA(edge.bundle))
741d8f4dcbSJay    val mem_grant = Flipped(DecoupledIO(new TLBundleD(edge.bundle)))
751d8f4dcbSJay    val mem_finish = DecoupledIO(new TLBundleE(edge.bundle))
761d8f4dcbSJay
771d8f4dcbSJay    val meta_write = DecoupledIO(new ICacheMetaWriteBundle)
781d8f4dcbSJay    val data_write = DecoupledIO(new ICacheDataWriteBundle)
791d8f4dcbSJay
802a25dbb4SJay    val release_req    =  DecoupledIO(new ReplacePipeReq)
812a25dbb4SJay    val release_resp   =  Flipped(ValidIO(UInt(ReplaceIdWid.W)))
822a25dbb4SJay    val victimInfor    =  Output(new ICacheVictimInfor())
837052722fSJay
84*00240ba6SJay    val toPrefetch    = ValidIO(UInt(PAddrBits.W))
85*00240ba6SJay
861d8f4dcbSJay  })
871d8f4dcbSJay
881d8f4dcbSJay  /** default value for control signals */
891d8f4dcbSJay  io.resp := DontCare
901d8f4dcbSJay  io.mem_acquire.bits := DontCare
911d8f4dcbSJay  io.mem_grant.ready := true.B
921d8f4dcbSJay  io.meta_write.bits := DontCare
931d8f4dcbSJay  io.data_write.bits := DontCare
941d8f4dcbSJay
952a25dbb4SJay  val s_idle  :: s_send_mem_aquire :: s_wait_mem_grant :: s_write_back :: s_send_grant_ack :: s_send_replace :: s_wait_replace :: s_wait_resp :: Nil = Enum(8)
961d8f4dcbSJay  val state = RegInit(s_idle)
971d8f4dcbSJay  /** control logic transformation */
981d8f4dcbSJay  //request register
991d8f4dcbSJay  val req = Reg(new ICacheMissReq)
1001d8f4dcbSJay  val req_idx = req.getVirSetIdx //virtual index
1011d8f4dcbSJay  val req_tag = req.getPhyTag //physical tag
1021d8f4dcbSJay  val req_waymask = req.waymask
1037052722fSJay  val release_id  = Cat(MainPipeKey.U, id.U)
10458dbdfc2SJay  val req_corrupt = RegInit(false.B)
1051d8f4dcbSJay
1062a25dbb4SJay  io.victimInfor.valid := state === s_send_replace || state === s_wait_replace || state === s_wait_resp
1072a25dbb4SJay  io.victimInfor.vidx  := req_idx
1081d8f4dcbSJay
1091d8f4dcbSJay  val (_, _, refill_done, refill_address_inc) = edge.addr_inc(io.mem_grant)
1101d8f4dcbSJay
1111d8f4dcbSJay  //cacheline register
1121d8f4dcbSJay  val readBeatCnt = Reg(UInt(log2Up(refillCycles).W))
1131d8f4dcbSJay  val respDataReg = Reg(Vec(refillCycles, UInt(beatBits.W)))
1141d8f4dcbSJay
1151d8f4dcbSJay  //initial
1161d8f4dcbSJay  io.resp.bits := DontCare
1171d8f4dcbSJay  io.mem_acquire.bits := DontCare
1181d8f4dcbSJay  io.mem_grant.ready := true.B
1191d8f4dcbSJay  io.meta_write.bits := DontCare
1201d8f4dcbSJay  io.data_write.bits := DontCare
1211d8f4dcbSJay
1222a25dbb4SJay  io.release_req.bits.paddr := req.paddr
1232a25dbb4SJay  io.release_req.bits.vaddr := req.vaddr
1242a25dbb4SJay  io.release_req.bits.voluntary := true.B
1252a25dbb4SJay  io.release_req.bits.waymask   := req.waymask
1260bebd829SJay  io.release_req.bits.needData   := false.B
1272a25dbb4SJay  io.release_req.bits.id   := release_id
1282a25dbb4SJay  io.release_req.bits.param := DontCare //release will not care tilelink param
1291d8f4dcbSJay
1301d8f4dcbSJay  io.req.ready := (state === s_idle)
1312a25dbb4SJay  io.mem_acquire.valid := (state === s_send_mem_aquire)
1322a25dbb4SJay  io.release_req.valid := (state === s_send_replace)
1331d8f4dcbSJay
134*00240ba6SJay  io.toPrefetch.valid := (state =/= s_idle)
135*00240ba6SJay  io.toPrefetch.bits  :=  addrAlign(req.paddr, blockBytes, PAddrBits)
136*00240ba6SJay
1371d8f4dcbSJay  val grantack = RegEnable(edge.GrantAck(io.mem_grant.bits), io.mem_grant.fire())
1381d8f4dcbSJay  val grant_param = Reg(UInt(TLPermissions.bdWidth.W))
1391d8f4dcbSJay  val is_dirty = RegInit(false.B)
1401d8f4dcbSJay  val is_grant = RegEnable(edge.isRequest(io.mem_grant.bits), io.mem_grant.fire())
1411d8f4dcbSJay
1421d8f4dcbSJay  //state change
1431d8f4dcbSJay  switch(state) {
1441d8f4dcbSJay    is(s_idle) {
1451d8f4dcbSJay      when(io.req.fire()) {
1461d8f4dcbSJay        readBeatCnt := 0.U
1471d8f4dcbSJay        state := s_send_mem_aquire
1481d8f4dcbSJay        req := io.req.bits
1491d8f4dcbSJay      }
1501d8f4dcbSJay    }
1511d8f4dcbSJay
1521d8f4dcbSJay    // memory request
1531d8f4dcbSJay    is(s_send_mem_aquire) {
1541d8f4dcbSJay      when(io.mem_acquire.fire()) {
1551d8f4dcbSJay        state := s_wait_mem_grant
1561d8f4dcbSJay      }
1571d8f4dcbSJay    }
1581d8f4dcbSJay
1591d8f4dcbSJay    is(s_wait_mem_grant) {
1601d8f4dcbSJay      when(edge.hasData(io.mem_grant.bits)) {
1611d8f4dcbSJay        when(io.mem_grant.fire()) {
1621d8f4dcbSJay          readBeatCnt := readBeatCnt + 1.U
1631d8f4dcbSJay          respDataReg(readBeatCnt) := io.mem_grant.bits.data
16458dbdfc2SJay          req_corrupt := io.mem_grant.bits.corrupt
1651d8f4dcbSJay          grant_param := io.mem_grant.bits.param
1661d8f4dcbSJay          is_dirty    := io.mem_grant.bits.echo.lift(DirtyKey).getOrElse(false.B)
1671d8f4dcbSJay          when(readBeatCnt === (refillCycles - 1).U) {
1681d8f4dcbSJay            assert(refill_done, "refill not done!")
1692a25dbb4SJay            state := s_send_grant_ack
1701d8f4dcbSJay          }
1711d8f4dcbSJay        }
1721d8f4dcbSJay      }
1731d8f4dcbSJay    }
1741d8f4dcbSJay
1751d8f4dcbSJay    is(s_send_grant_ack) {
1761d8f4dcbSJay      when(io.mem_finish.fire()) {
1776cc2baa1SJay        state := s_send_replace
1781d8f4dcbSJay      }
1791d8f4dcbSJay    }
1801d8f4dcbSJay
1812a25dbb4SJay    is(s_send_replace){
1822a25dbb4SJay      when(io.release_req.fire()){
1832a25dbb4SJay        state := s_wait_replace
1842a25dbb4SJay      }
1852a25dbb4SJay    }
1862a25dbb4SJay
1872a25dbb4SJay    is(s_wait_replace){
1882a25dbb4SJay      when(io.release_resp.valid && io.release_resp.bits === release_id){
1892a25dbb4SJay        state := s_write_back
1902a25dbb4SJay      }
1912a25dbb4SJay    }
1922a25dbb4SJay
1932a25dbb4SJay    is(s_write_back) {
1942a25dbb4SJay      state := Mux(io.meta_write.fire() && io.data_write.fire(), s_wait_resp, s_write_back)
1952a25dbb4SJay    }
1962a25dbb4SJay
1971d8f4dcbSJay    is(s_wait_resp) {
1981d8f4dcbSJay      io.resp.bits.data := respDataReg.asUInt
19958dbdfc2SJay      io.resp.bits.corrupt := req_corrupt
2001d8f4dcbSJay      when(io.resp.fire()) {
2011d8f4dcbSJay        state := s_idle
2021d8f4dcbSJay      }
2031d8f4dcbSJay    }
2041d8f4dcbSJay  }
2051d8f4dcbSJay
2061d8f4dcbSJay  /** refill write and meta write */
2071d8f4dcbSJay  val missCoh    = ClientMetadata(Nothing)
2081d8f4dcbSJay  val grow_param = missCoh.onAccess(M_XRD)._2
2091d8f4dcbSJay  val acquireBlock = edge.AcquireBlock(
2101d8f4dcbSJay    fromSource = io.id,
2111d8f4dcbSJay    toAddress = addrAlign(req.paddr, blockBytes, PAddrBits),
2121d8f4dcbSJay    lgSize = (log2Up(cacheParams.blockBytes)).U,
2131d8f4dcbSJay    growPermissions = grow_param
2141d8f4dcbSJay  )._2
2151d8f4dcbSJay  io.mem_acquire.bits := acquireBlock
2161d8f4dcbSJay  // resolve cache alias by L2
2171d8f4dcbSJay  io.mem_acquire.bits.user.lift(AliasKey).foreach(_ := req.vaddr(13, 12))
2181d8f4dcbSJay  require(nSets <= 256) // icache size should not be more than 128KB
2191d8f4dcbSJay
2201d8f4dcbSJay  /** Grant ACK */
2211d8f4dcbSJay  io.mem_finish.valid := (state === s_send_grant_ack) && is_grant
2221d8f4dcbSJay  io.mem_finish.bits := grantack
2231d8f4dcbSJay
2241d8f4dcbSJay  //resp to ifu
2251d8f4dcbSJay  io.resp.valid := state === s_wait_resp
2262a25dbb4SJay  /** update coh meta */
2272a25dbb4SJay  def missCohGen(param: UInt, dirty: Bool): UInt = {
2282a25dbb4SJay    MuxLookup(Cat(param, dirty), Nothing, Seq(
2292a25dbb4SJay      Cat(toB, false.B) -> Branch,
2302a25dbb4SJay      Cat(toB, true.B)  -> Branch,
2312a25dbb4SJay      Cat(toT, false.B) -> Trunk,
2322a25dbb4SJay      Cat(toT, true.B)  -> Dirty))
2332a25dbb4SJay  }
2342a25dbb4SJay
2352a25dbb4SJay  val miss_new_coh = ClientMetadata(missCohGen(grant_param, is_dirty))
2362a25dbb4SJay
2372a25dbb4SJay  io.meta_write.valid := (state === s_write_back)
2382a25dbb4SJay  io.meta_write.bits.generate(tag = req_tag, coh = miss_new_coh, idx = req_idx, waymask = req_waymask, bankIdx = req_idx(0))
2392a25dbb4SJay
2402a25dbb4SJay  io.data_write.valid := (state === s_write_back)
2412a25dbb4SJay  io.data_write.bits.generate(data = respDataReg.asUInt, idx = req_idx, waymask = req_waymask, bankIdx = req_idx(0))
2421d8f4dcbSJay
2431d8f4dcbSJay  XSPerfAccumulate(
2441d8f4dcbSJay    "entryPenalty" + Integer.toString(id, 10),
2451d8f4dcbSJay    BoolStopWatch(
2461d8f4dcbSJay      start = io.req.fire(),
2471d8f4dcbSJay      stop = io.resp.valid,
2481d8f4dcbSJay      startHighPriority = true)
2491d8f4dcbSJay  )
2501d8f4dcbSJay  XSPerfAccumulate("entryReq" + Integer.toString(id, 10), io.req.fire())
2511d8f4dcbSJay
2521d8f4dcbSJay}
2531d8f4dcbSJay
2541d8f4dcbSJay
2551d8f4dcbSJayclass ICacheMissUnit(edge: TLEdgeOut)(implicit p: Parameters) extends ICacheMissUnitModule
2561d8f4dcbSJay{
2571d8f4dcbSJay  val io = IO(new Bundle{
2581d8f4dcbSJay    val req         = Vec(2, Flipped(DecoupledIO(new ICacheMissReq)))
2591d8f4dcbSJay    val resp        = Vec(2, ValidIO(new ICacheMissResp))
2601d8f4dcbSJay
2611d8f4dcbSJay    val mem_acquire = DecoupledIO(new TLBundleA(edge.bundle))
2621d8f4dcbSJay    val mem_grant   = Flipped(DecoupledIO(new TLBundleD(edge.bundle)))
2631d8f4dcbSJay    val mem_finish  = DecoupledIO(new TLBundleE(edge.bundle))
2641d8f4dcbSJay
2651d8f4dcbSJay    val meta_write  = DecoupledIO(new ICacheMetaWriteBundle)
2661d8f4dcbSJay    val data_write  = DecoupledIO(new ICacheDataWriteBundle)
2671d8f4dcbSJay
2682a25dbb4SJay    val release_req    =  DecoupledIO(new ReplacePipeReq)
2692a25dbb4SJay    val release_resp   =  Flipped(ValidIO(UInt(ReplaceIdWid.W)))
2701d8f4dcbSJay
2712a25dbb4SJay    val victimInfor = Vec(PortNumber, Output(new ICacheVictimInfor()))
2722a25dbb4SJay
2737052722fSJay    val prefetch_req          =  Flipped(DecoupledIO(new PIQReq))
274*00240ba6SJay    val prefetch_check        =  Vec(PortNumber,ValidIO(UInt(PAddrBits.W)))
275*00240ba6SJay
2767052722fSJay
2771d8f4dcbSJay  })
2781d8f4dcbSJay  // assign default values to output signals
2791d8f4dcbSJay  io.mem_grant.ready := false.B
2801d8f4dcbSJay
2811d8f4dcbSJay  val meta_write_arb = Module(new Arbiter(new ICacheMetaWriteBundle,  PortNumber))
2821d8f4dcbSJay  val refill_arb     = Module(new Arbiter(new ICacheDataWriteBundle,  PortNumber))
2832a25dbb4SJay  val release_arb    = Module(new Arbiter(new ReplacePipeReq,  PortNumber))
2841d8f4dcbSJay
2851d8f4dcbSJay  io.mem_grant.ready := true.B
2861d8f4dcbSJay
2872a25dbb4SJay  val entries = (0 until PortNumber) map { i =>
2881d8f4dcbSJay    val entry = Module(new ICacheMissEntry(edge, i))
2891d8f4dcbSJay
2901d8f4dcbSJay    entry.io.id := i.U
2911d8f4dcbSJay
2921d8f4dcbSJay    // entry req
2931d8f4dcbSJay    entry.io.req.valid := io.req(i).valid
2941d8f4dcbSJay    entry.io.req.bits  := io.req(i).bits
2951d8f4dcbSJay    io.req(i).ready    := entry.io.req.ready
2961d8f4dcbSJay
2971d8f4dcbSJay    // entry resp
2981d8f4dcbSJay    meta_write_arb.io.in(i)     <>  entry.io.meta_write
2991d8f4dcbSJay    refill_arb.io.in(i)         <>  entry.io.data_write
3002a25dbb4SJay    release_arb.io.in(i)        <>  entry.io.release_req
3011d8f4dcbSJay
3021d8f4dcbSJay    entry.io.mem_grant.valid := false.B
3031d8f4dcbSJay    entry.io.mem_grant.bits  := DontCare
3041d8f4dcbSJay    when (io.mem_grant.bits.source === i.U) {
3051d8f4dcbSJay      entry.io.mem_grant <> io.mem_grant
3061d8f4dcbSJay    }
3071d8f4dcbSJay
3081d8f4dcbSJay    io.resp(i) <> entry.io.resp
3091d8f4dcbSJay
3102a25dbb4SJay    io.victimInfor(i) := entry.io.victimInfor
311*00240ba6SJay    io.prefetch_check(i) <> entry.io.toPrefetch
3122a25dbb4SJay
3132a25dbb4SJay    entry.io.release_resp <> io.release_resp
3142a25dbb4SJay
3151d8f4dcbSJay    XSPerfAccumulate(
3161d8f4dcbSJay      "entryPenalty" + Integer.toString(i, 10),
3171d8f4dcbSJay      BoolStopWatch(
3181d8f4dcbSJay        start = entry.io.req.fire(),
3191d8f4dcbSJay        stop = entry.io.resp.fire(),
3201d8f4dcbSJay        startHighPriority = true)
3211d8f4dcbSJay    )
3221d8f4dcbSJay    XSPerfAccumulate("entryReq" + Integer.toString(i, 10), entry.io.req.fire())
3231d8f4dcbSJay
3241d8f4dcbSJay    entry
3251d8f4dcbSJay  }
3261d8f4dcbSJay
3277052722fSJay  val alloc = Wire(UInt(log2Ceil(nPrefetchEntries).W))
3287052722fSJay
329de7689fcSJay  val prefEntries = (PortNumber until PortNumber + nPrefetchEntries) map { i =>
3307052722fSJay    val prefetchEntry = Module(new IPrefetchEntry(edge, PortNumber))
3317052722fSJay
3327052722fSJay    prefetchEntry.io.mem_hint_ack.valid := false.B
3337052722fSJay    prefetchEntry.io.mem_hint_ack.bits := DontCare
3347052722fSJay
3357052722fSJay    when(io.mem_grant.bits.source === PortNumber.U) {
3367052722fSJay      prefetchEntry.io.mem_hint_ack <> io.mem_grant
3377052722fSJay    }
3387052722fSJay
339de7689fcSJay    prefetchEntry.io.req.valid := io.prefetch_req.valid && ((i-PortNumber).U === alloc)
3407052722fSJay    prefetchEntry.io.req.bits  := io.prefetch_req.bits
3417052722fSJay
3427052722fSJay    prefetchEntry.io.id := i.U
3437052722fSJay
3447052722fSJay    prefetchEntry
3457052722fSJay  }
3467052722fSJay
3477052722fSJay  alloc := PriorityEncoder(prefEntries.map(_.io.req.ready))
3487052722fSJay  io.prefetch_req.ready := ParallelOR(prefEntries.map(_.io.req.ready))
3497052722fSJay  val tl_a_chanel = entries.map(_.io.mem_acquire) ++ prefEntries.map(_.io.mem_hint)
3507052722fSJay  TLArbiter.lowest(edge, io.mem_acquire, tl_a_chanel:_*)
3517052722fSJay
3521d8f4dcbSJay  TLArbiter.lowest(edge, io.mem_finish,  entries.map(_.io.mem_finish):_*)
3531d8f4dcbSJay
3541d8f4dcbSJay  io.meta_write     <> meta_write_arb.io.out
3551d8f4dcbSJay  io.data_write     <> refill_arb.io.out
3562a25dbb4SJay  io.release_req        <> release_arb.io.out
3571d8f4dcbSJay
3581d8f4dcbSJay  (0 until nWays).map{ w =>
3591d8f4dcbSJay    XSPerfAccumulate("line_0_refill_way_" + Integer.toString(w, 10),  entries(0).io.meta_write.valid && OHToUInt(entries(0).io.meta_write.bits.waymask)  === w.U)
3601d8f4dcbSJay    XSPerfAccumulate("line_1_refill_way_" + Integer.toString(w, 10),  entries(1).io.meta_write.valid && OHToUInt(entries(1).io.meta_write.bits.waymask)  === w.U)
3611d8f4dcbSJay  }
3621d8f4dcbSJay
3631d8f4dcbSJay}
3641d8f4dcbSJay
3651d8f4dcbSJay
3661d8f4dcbSJay
367