1/*************************************************************************************** 2* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3* Copyright (c) 2020-2021 Peng Cheng Laboratory 4* 5* XiangShan is licensed under Mulan PSL v2. 6* You can use this software according to the terms and conditions of the Mulan PSL v2. 7* You may obtain a copy of Mulan PSL v2 at: 8* http://license.coscl.org.cn/MulanPSL2 9* 10* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13* 14* See the Mulan PSL v2 for more details. 15***************************************************************************************/ 16 17package xiangshan.frontend.icache 18 19import chipsalliance.rocketchip.config.Parameters 20import chisel3._ 21import chisel3.util.{DecoupledIO, _} 22import freechips.rocketchip.diplomacy.{IdRange, LazyModule, LazyModuleImp, TransferSizes} 23import freechips.rocketchip.tilelink._ 24import freechips.rocketchip.util.BundleFieldBase 25import coupledL2.{AliasField, DirtyField, PrefetchField} 26import xiangshan._ 27import xiangshan.frontend._ 28import xiangshan.cache._ 29import utils._ 30import utility._ 31import xiangshan.backend.fu.PMPReqBundle 32import xiangshan.cache.mmu.{TlbRequestIO, TlbReq} 33import difftest._ 34 35case class ICacheParameters( 36 nSets: Int = 256, 37 nWays: Int = 8, 38 rowBits: Int = 64, 39 nTLBEntries: Int = 32, 40 tagECC: Option[String] = None, 41 dataECC: Option[String] = None, 42 replacer: Option[String] = Some("random"), 43 nMissEntries: Int = 2, 44 nReleaseEntries: Int = 1, 45 nProbeEntries: Int = 2, 46 nPrefetchEntries: Int = 12, 47 nPrefBufferEntries: Int = 64, 48 prefetchPipeNum: Int = 2, 49 hasPrefetch: Boolean = true, 50 nMMIOs: Int = 1, 51 blockBytes: Int = 64 52)extends L1CacheParameters { 53 54 val setBytes = nSets * blockBytes 55 val aliasBitsOpt = DCacheParameters().aliasBitsOpt //if(setBytes > pageSize) Some(log2Ceil(setBytes / pageSize)) else None 56 val reqFields: Seq[BundleFieldBase] = Seq( 57 PrefetchField() 58 ) ++ aliasBitsOpt.map(AliasField) 59 val echoFields: Seq[BundleFieldBase] = Nil 60 def tagCode: Code = Code.fromString(tagECC) 61 def dataCode: Code = Code.fromString(dataECC) 62 def replacement = ReplacementPolicy.fromString(replacer,nWays,nSets) 63} 64 65trait HasICacheParameters extends HasL1CacheParameters with HasInstrMMIOConst with HasIFUConst{ 66 val cacheParams = icacheParameters 67 val dataCodeUnit = 16 68 val dataCodeUnitNum = blockBits/dataCodeUnit 69 70 def highestIdxBit = log2Ceil(nSets) - 1 71 def encDataUnitBits = cacheParams.dataCode.width(dataCodeUnit) 72 def dataCodeBits = encDataUnitBits - dataCodeUnit 73 def dataCodeEntryBits = dataCodeBits * dataCodeUnitNum 74 75 val ICacheSets = cacheParams.nSets 76 val ICacheWays = cacheParams.nWays 77 78 val ICacheSameVPAddrLength = 12 79 val ReplaceIdWid = 5 80 81 val ICacheWordOffset = 0 82 val ICacheSetOffset = ICacheWordOffset + log2Up(blockBytes) 83 val ICacheAboveIndexOffset = ICacheSetOffset + log2Up(ICacheSets) 84 val ICacheTagOffset = ICacheAboveIndexOffset min ICacheSameVPAddrLength 85 86 def PortNumber = 2 87 88 def partWayNum = 4 89 def pWay = nWays/partWayNum 90 91 def nPrefetchEntries = cacheParams.nPrefetchEntries 92 def totalMSHRNum = PortNumber + nPrefetchEntries 93 def nIPFBufferSize = cacheParams.nPrefBufferEntries 94 def maxIPFMoveConf = 1 // temporary use small value to cause more "move" operation 95 def prefetchPipeNum = ICacheParameters().prefetchPipeNum 96 97 def getBits(num: Int) = log2Ceil(num).W 98 99 100 def generatePipeControl(lastFire: Bool, thisFire: Bool, thisFlush: Bool, lastFlush: Bool): Bool = { 101 val valid = RegInit(false.B) 102 when(thisFlush) {valid := false.B} 103 .elsewhen(lastFire && !lastFlush) {valid := true.B} 104 .elsewhen(thisFire) {valid := false.B} 105 valid 106 } 107 108 def ResultHoldBypass[T<:Data](data: T, valid: Bool): T = { 109 Mux(valid, data, RegEnable(data, valid)) 110 } 111 112 def holdReleaseLatch(valid: Bool, release: Bool, flush: Bool): Bool ={ 113 val bit = RegInit(false.B) 114 when(flush) { bit := false.B } 115 .elsewhen(valid && !release) { bit := true.B } 116 .elsewhen(release) { bit := false.B } 117 bit || valid 118 } 119 120 def blockCounter(block: Bool, flush: Bool, threshold: Int): Bool = { 121 val counter = RegInit(0.U(log2Up(threshold + 1).W)) 122 when (block) { counter := counter + 1.U } 123 when (flush) { counter := 0.U} 124 counter > threshold.U 125 } 126 127 require(isPow2(nSets), s"nSets($nSets) must be pow2") 128 require(isPow2(nWays), s"nWays($nWays) must be pow2") 129} 130 131abstract class ICacheBundle(implicit p: Parameters) extends XSBundle 132 with HasICacheParameters 133 134abstract class ICacheModule(implicit p: Parameters) extends XSModule 135 with HasICacheParameters 136 137abstract class ICacheArray(implicit p: Parameters) extends XSModule 138 with HasICacheParameters 139 140class ICacheMetadata(implicit p: Parameters) extends ICacheBundle { 141 val tag = UInt(tagBits.W) 142} 143 144object ICacheMetadata { 145 def apply(tag: Bits)(implicit p: Parameters) = { 146 val meta = Wire(new ICacheMetadata) 147 meta.tag := tag 148 meta 149 } 150} 151 152 153class ICacheMetaArray()(implicit p: Parameters) extends ICacheArray 154{ 155 def onReset = ICacheMetadata(0.U) 156 val metaBits = onReset.getWidth 157 val metaEntryBits = cacheParams.tagCode.width(metaBits) 158 159 val io=IO{new Bundle{ 160 val write = Flipped(DecoupledIO(new ICacheMetaWriteBundle)) 161 val read = Flipped(DecoupledIO(new ICacheReadBundle)) 162 val readResp = Output(new ICacheMetaRespBundle) 163 val cacheOp = Flipped(new L1CacheInnerOpIO) // customized cache op port 164 val fencei = Input(Bool()) 165 }} 166 167 io.read.ready := !io.write.valid 168 169 val port_0_read_0 = io.read.valid && !io.read.bits.vSetIdx(0)(0) 170 val port_0_read_1 = io.read.valid && io.read.bits.vSetIdx(0)(0) 171 val port_1_read_1 = io.read.valid && io.read.bits.vSetIdx(1)(0) && io.read.bits.isDoubleLine 172 val port_1_read_0 = io.read.valid && !io.read.bits.vSetIdx(1)(0) && io.read.bits.isDoubleLine 173 174 val port_0_read_0_reg = RegEnable(next = port_0_read_0, enable = io.read.fire()) 175 val port_0_read_1_reg = RegEnable(next = port_0_read_1, enable = io.read.fire()) 176 val port_1_read_1_reg = RegEnable(next = port_1_read_1, enable = io.read.fire()) 177 val port_1_read_0_reg = RegEnable(next = port_1_read_0, enable = io.read.fire()) 178 179 val bank_0_idx = Mux(port_0_read_0, io.read.bits.vSetIdx(0), io.read.bits.vSetIdx(1)) 180 val bank_1_idx = Mux(port_0_read_1, io.read.bits.vSetIdx(0), io.read.bits.vSetIdx(1)) 181 val bank_idx = Seq(bank_0_idx, bank_1_idx) 182 183 val write_bank_0 = io.write.valid && !io.write.bits.bankIdx 184 val write_bank_1 = io.write.valid && io.write.bits.bankIdx 185 186 val write_meta_bits = Wire(UInt(metaEntryBits.W)) 187 188 val tagArrays = (0 until 2) map { bank => 189 val tagArray = Module(new SRAMTemplate( 190 UInt(metaEntryBits.W), 191 set=nSets/2, 192 way=nWays, 193 shouldReset = true, 194 holdRead = true, 195 singlePort = true 196 )) 197 198 //meta connection 199 if(bank == 0) { 200 tagArray.io.r.req.valid := port_0_read_0 || port_1_read_0 201 tagArray.io.r.req.bits.apply(setIdx=bank_0_idx(highestIdxBit,1)) 202 tagArray.io.w.req.valid := write_bank_0 203 tagArray.io.w.req.bits.apply(data=write_meta_bits, setIdx=io.write.bits.virIdx(highestIdxBit,1), waymask=io.write.bits.waymask) 204 } 205 else { 206 tagArray.io.r.req.valid := port_0_read_1 || port_1_read_1 207 tagArray.io.r.req.bits.apply(setIdx=bank_1_idx(highestIdxBit,1)) 208 tagArray.io.w.req.valid := write_bank_1 209 tagArray.io.w.req.bits.apply(data=write_meta_bits, setIdx=io.write.bits.virIdx(highestIdxBit,1), waymask=io.write.bits.waymask) 210 } 211 212 tagArray 213 } 214 215 val read_set_idx_next = RegEnable(next = io.read.bits.vSetIdx, enable = io.read.fire) 216 val valid_array = RegInit(VecInit(Seq.fill(nWays)(0.U(nSets.W)))) 217 val valid_metas = Wire(Vec(PortNumber, Vec(nWays, Bool()))) 218 // valid read 219 (0 until PortNumber).foreach( i => 220 (0 until nWays).foreach( way => 221 valid_metas(i)(way) := valid_array(way)(read_set_idx_next(i)) 222 )) 223 io.readResp.entryValid := valid_metas 224 225 io.read.ready := !io.write.valid && !io.fencei && tagArrays.map(_.io.r.req.ready).reduce(_&&_) 226 227 //Parity Decode 228 val read_metas = Wire(Vec(2,Vec(nWays,new ICacheMetadata()))) 229 for((tagArray,i) <- tagArrays.zipWithIndex){ 230 val read_meta_bits = tagArray.io.r.resp.asTypeOf(Vec(nWays,UInt(metaEntryBits.W))) 231 val read_meta_decoded = read_meta_bits.map{ way_bits => cacheParams.tagCode.decode(way_bits)} 232 val read_meta_wrong = read_meta_decoded.map{ way_bits_decoded => way_bits_decoded.error} 233 val read_meta_corrected = VecInit(read_meta_decoded.map{ way_bits_decoded => way_bits_decoded.corrected}) 234 read_metas(i) := read_meta_corrected.asTypeOf(Vec(nWays,new ICacheMetadata())) 235 (0 until nWays).map{ w => io.readResp.errors(i)(w) := RegNext(read_meta_wrong(w)) && RegNext(RegNext(io.read.fire))} 236 } 237 238 //Parity Encode 239 val write = io.write.bits 240 write_meta_bits := cacheParams.tagCode.encode(ICacheMetadata(tag = write.phyTag).asUInt) 241 242 // valid write 243 val way_num = OHToUInt(io.write.bits.waymask) 244 when (io.write.valid) { 245 valid_array(way_num) := valid_array(way_num).bitSet(io.write.bits.virIdx, true.B) 246 } 247 248 XSPerfAccumulate("meta_refill_num", io.write.valid) 249 250 io.readResp.metaData <> DontCare 251 when(port_0_read_0_reg){ 252 io.readResp.metaData(0) := read_metas(0) 253 }.elsewhen(port_0_read_1_reg){ 254 io.readResp.metaData(0) := read_metas(1) 255 } 256 257 when(port_1_read_0_reg){ 258 io.readResp.metaData(1) := read_metas(0) 259 }.elsewhen(port_1_read_1_reg){ 260 io.readResp.metaData(1) := read_metas(1) 261 } 262 263 264 io.write.ready := true.B // TODO : has bug ? should be !io.cacheOp.req.valid 265 // deal with customized cache op 266 require(nWays <= 32) 267 io.cacheOp.resp.bits := DontCare 268 val cacheOpShouldResp = WireInit(false.B) 269 when(io.cacheOp.req.valid){ 270 when( 271 CacheInstrucion.isReadTag(io.cacheOp.req.bits.opCode) || 272 CacheInstrucion.isReadTagECC(io.cacheOp.req.bits.opCode) 273 ){ 274 for (i <- 0 until 2) { 275 tagArrays(i).io.r.req.valid := true.B 276 tagArrays(i).io.r.req.bits.apply(setIdx = io.cacheOp.req.bits.index) 277 } 278 cacheOpShouldResp := true.B 279 } 280 when(CacheInstrucion.isWriteTag(io.cacheOp.req.bits.opCode)){ 281 for (i <- 0 until 2) { 282 tagArrays(i).io.w.req.valid := true.B 283 tagArrays(i).io.w.req.bits.apply( 284 data = io.cacheOp.req.bits.write_tag_low, 285 setIdx = io.cacheOp.req.bits.index, 286 waymask = UIntToOH(io.cacheOp.req.bits.wayNum(4, 0)) 287 ) 288 } 289 cacheOpShouldResp := true.B 290 } 291 // TODO 292 // when(CacheInstrucion.isWriteTagECC(io.cacheOp.req.bits.opCode)){ 293 // for (i <- 0 until readPorts) { 294 // array(i).io.ecc_write.valid := true.B 295 // array(i).io.ecc_write.bits.idx := io.cacheOp.req.bits.index 296 // array(i).io.ecc_write.bits.way_en := UIntToOH(io.cacheOp.req.bits.wayNum(4, 0)) 297 // array(i).io.ecc_write.bits.ecc := io.cacheOp.req.bits.write_tag_ecc 298 // } 299 // cacheOpShouldResp := true.B 300 // } 301 } 302 io.cacheOp.resp.valid := RegNext(io.cacheOp.req.valid && cacheOpShouldResp) 303 io.cacheOp.resp.bits.read_tag_low := Mux(io.cacheOp.resp.valid, 304 tagArrays(0).io.r.resp.asTypeOf(Vec(nWays, UInt(tagBits.W)))(io.cacheOp.req.bits.wayNum), 305 0.U 306 ) 307 io.cacheOp.resp.bits.read_tag_ecc := DontCare // TODO 308 // TODO: deal with duplicated array 309 310 // fencei logic : reset valid_array 311 when (io.fencei) { 312 (0 until nWays).foreach( way => 313 valid_array(way) := 0.U 314 ) 315 } 316} 317 318 319 320class ICacheDataArray(implicit p: Parameters) extends ICacheArray 321{ 322 323 def getECCFromEncUnit(encUnit: UInt) = { 324 require(encUnit.getWidth == encDataUnitBits) 325 if (encDataUnitBits == dataCodeUnit) { 326 0.U.asTypeOf(UInt(1.W)) 327 } else { 328 encUnit(encDataUnitBits - 1, dataCodeUnit) 329 } 330 } 331 332 def getECCFromBlock(cacheblock: UInt) = { 333 // require(cacheblock.getWidth == blockBits) 334 VecInit((0 until dataCodeUnitNum).map { w => 335 val unit = cacheblock(dataCodeUnit * (w + 1) - 1, dataCodeUnit * w) 336 getECCFromEncUnit(cacheParams.dataCode.encode(unit)) 337 }) 338 } 339 340 val io=IO{new Bundle{ 341 val write = Flipped(DecoupledIO(new ICacheDataWriteBundle)) 342 val read = Flipped(DecoupledIO(Vec(partWayNum, new ICacheReadBundle))) 343 val readResp = Output(new ICacheDataRespBundle) 344 val cacheOp = Flipped(new L1CacheInnerOpIO) // customized cache op port 345 }} 346 347 val write_data_bits = Wire(UInt(blockBits.W)) 348 349 val port_0_read_0_reg = RegEnable(next = io.read.valid && io.read.bits.head.port_0_read_0, enable = io.read.fire()) 350 val port_0_read_1_reg = RegEnable(next = io.read.valid && io.read.bits.head.port_0_read_1, enable = io.read.fire()) 351 val port_1_read_1_reg = RegEnable(next = io.read.valid && io.read.bits.head.port_1_read_1, enable = io.read.fire()) 352 val port_1_read_0_reg = RegEnable(next = io.read.valid && io.read.bits.head.port_1_read_0, enable = io.read.fire()) 353 354 val bank_0_idx_vec = io.read.bits.map(copy => Mux(io.read.valid && copy.port_0_read_0, copy.vSetIdx(0), copy.vSetIdx(1))) 355 val bank_1_idx_vec = io.read.bits.map(copy => Mux(io.read.valid && copy.port_0_read_1, copy.vSetIdx(0), copy.vSetIdx(1))) 356 357 val dataArrays = (0 until partWayNum).map{ i => 358 val dataArray = Module(new ICachePartWayArray( 359 UInt(blockBits.W), 360 pWay, 361 )) 362 363 dataArray.io.read.req(0).valid := io.read.bits(i).read_bank_0 && io.read.valid 364 dataArray.io.read.req(0).bits.ridx := bank_0_idx_vec(i)(highestIdxBit,1) 365 dataArray.io.read.req(1).valid := io.read.bits(i).read_bank_1 && io.read.valid 366 dataArray.io.read.req(1).bits.ridx := bank_1_idx_vec(i)(highestIdxBit,1) 367 368 369 dataArray.io.write.valid := io.write.valid 370 dataArray.io.write.bits.wdata := write_data_bits 371 dataArray.io.write.bits.widx := io.write.bits.virIdx(highestIdxBit,1) 372 dataArray.io.write.bits.wbankidx := io.write.bits.bankIdx 373 dataArray.io.write.bits.wmask := io.write.bits.waymask.asTypeOf(Vec(partWayNum, Vec(pWay, Bool())))(i) 374 375 dataArray 376 } 377 378 val read_datas = Wire(Vec(2,Vec(nWays,UInt(blockBits.W) ))) 379 380 (0 until PortNumber).map { port => 381 (0 until nWays).map { w => 382 read_datas(port)(w) := dataArrays(w / pWay).io.read.resp.rdata(port).asTypeOf(Vec(pWay, UInt(blockBits.W)))(w % pWay) 383 } 384 } 385 386 io.readResp.datas(0) := Mux( port_0_read_1_reg, read_datas(1) , read_datas(0)) 387 io.readResp.datas(1) := Mux( port_1_read_0_reg, read_datas(0) , read_datas(1)) 388 389 390 val write_data_code = Wire(UInt(dataCodeEntryBits.W)) 391 val write_bank_0 = WireInit(io.write.valid && !io.write.bits.bankIdx) 392 val write_bank_1 = WireInit(io.write.valid && io.write.bits.bankIdx) 393 394 val bank_0_idx = bank_0_idx_vec.last 395 val bank_1_idx = bank_1_idx_vec.last 396 397 val codeArrays = (0 until 2) map { i => 398 val codeArray = Module(new SRAMTemplate( 399 UInt(dataCodeEntryBits.W), 400 set=nSets/2, 401 way=nWays, 402 shouldReset = true, 403 holdRead = true, 404 singlePort = true 405 )) 406 407 if(i == 0) { 408 codeArray.io.r.req.valid := io.read.valid && io.read.bits.last.read_bank_0 409 codeArray.io.r.req.bits.apply(setIdx=bank_0_idx(highestIdxBit,1)) 410 codeArray.io.w.req.valid := write_bank_0 411 codeArray.io.w.req.bits.apply(data=write_data_code, setIdx=io.write.bits.virIdx(highestIdxBit,1), waymask=io.write.bits.waymask) 412 } 413 else { 414 codeArray.io.r.req.valid := io.read.valid && io.read.bits.last.read_bank_1 415 codeArray.io.r.req.bits.apply(setIdx=bank_1_idx(highestIdxBit,1)) 416 codeArray.io.w.req.valid := write_bank_1 417 codeArray.io.w.req.bits.apply(data=write_data_code, setIdx=io.write.bits.virIdx(highestIdxBit,1), waymask=io.write.bits.waymask) 418 } 419 420 codeArray 421 } 422 423 io.read.ready := !io.write.valid && 424 dataArrays.map(_.io.read.req.map(_.ready).reduce(_&&_)).reduce(_&&_) && 425 codeArrays.map(_.io.r.req.ready).reduce(_ && _) 426 427 //Parity Decode 428 val read_codes = Wire(Vec(2,Vec(nWays,UInt(dataCodeEntryBits.W) ))) 429 for(((dataArray,codeArray),i) <- dataArrays.zip(codeArrays).zipWithIndex){ 430 read_codes(i) := codeArray.io.r.resp.asTypeOf(Vec(nWays,UInt(dataCodeEntryBits.W))) 431 } 432 433 //Parity Encode 434 val write = io.write.bits 435 val write_data = WireInit(write.data) 436 write_data_code := getECCFromBlock(write_data).asUInt 437 write_data_bits := write_data 438 439 io.readResp.codes(0) := Mux( port_0_read_1_reg, read_codes(1) , read_codes(0)) 440 io.readResp.codes(1) := Mux( port_1_read_0_reg, read_codes(0) , read_codes(1)) 441 442 io.write.ready := true.B 443 444 // deal with customized cache op 445 require(nWays <= 32) 446 io.cacheOp.resp.bits := DontCare 447 io.cacheOp.resp.valid := false.B 448 val cacheOpShouldResp = WireInit(false.B) 449 val dataresp = Wire(Vec(nWays,UInt(blockBits.W) )) 450 dataresp := DontCare 451 when(io.cacheOp.req.valid){ 452 when( 453 CacheInstrucion.isReadData(io.cacheOp.req.bits.opCode) 454 ){ 455 for (i <- 0 until partWayNum) { 456 dataArrays(i).io.read.req.zipWithIndex.map{ case(port,i) => 457 if(i ==0) port.valid := !io.cacheOp.req.bits.bank_num(0) 458 else port.valid := io.cacheOp.req.bits.bank_num(0) 459 port.bits.ridx := io.cacheOp.req.bits.index(highestIdxBit,1) 460 } 461 } 462 cacheOpShouldResp := dataArrays.head.io.read.req.map(_.fire()).reduce(_||_) 463 dataresp :=Mux(io.cacheOp.req.bits.bank_num(0).asBool, read_datas(1), read_datas(0)) 464 } 465 when(CacheInstrucion.isWriteData(io.cacheOp.req.bits.opCode)){ 466 for (i <- 0 until partWayNum) { 467 dataArrays(i).io.write.valid := true.B 468 dataArrays(i).io.write.bits.wdata := io.cacheOp.req.bits.write_data_vec.asTypeOf(write_data.cloneType) 469 dataArrays(i).io.write.bits.wbankidx := io.cacheOp.req.bits.bank_num(0) 470 dataArrays(i).io.write.bits.widx := io.cacheOp.req.bits.index(highestIdxBit,1) 471 dataArrays(i).io.write.bits.wmask := UIntToOH(io.cacheOp.req.bits.wayNum(4, 0)).asTypeOf(Vec(partWayNum, Vec(pWay, Bool())))(i) 472 } 473 cacheOpShouldResp := true.B 474 } 475 } 476 477 io.cacheOp.resp.valid := RegNext(cacheOpShouldResp) 478 val numICacheLineWords = blockBits / 64 479 require(blockBits >= 64 && isPow2(blockBits)) 480 for (wordIndex <- 0 until numICacheLineWords) { 481 io.cacheOp.resp.bits.read_data_vec(wordIndex) := dataresp(io.cacheOp.req.bits.wayNum(4, 0))(64*(wordIndex+1)-1, 64*wordIndex) 482 } 483 484} 485 486 487class ICacheIO(implicit p: Parameters) extends ICacheBundle 488{ 489 val hartId = Input(UInt(8.W)) 490 val prefetch = Flipped(new FtqPrefechBundle) 491 val stop = Input(Bool()) 492 val fetch = new ICacheMainPipeBundle 493 val toIFU = Output(Bool()) 494 val pmp = Vec(PortNumber + prefetchPipeNum, new ICachePMPBundle) 495 val itlb = Vec(PortNumber + prefetchPipeNum, new TlbRequestIO) 496 val perfInfo = Output(new ICachePerfInfo) 497 val error = new L1CacheErrorInfo 498 /* Cache Instruction */ 499 val csr = new L1CacheToCsrIO 500 /* CSR control signal */ 501 val csr_pf_enable = Input(Bool()) 502 val csr_parity_enable = Input(Bool()) 503 val fencei = Input(Bool()) 504} 505 506class ICache()(implicit p: Parameters) extends LazyModule with HasICacheParameters { 507 508 val clientParameters = TLMasterPortParameters.v1( 509 Seq(TLMasterParameters.v1( 510 name = "icache", 511 sourceId = IdRange(0, cacheParams.nMissEntries + cacheParams.nPrefetchEntries), 512 )), 513 requestFields = cacheParams.reqFields, 514 echoFields = cacheParams.echoFields 515 ) 516 517 val clientNode = TLClientNode(Seq(clientParameters)) 518 519 lazy val module = new ICacheImp(this) 520} 521 522class ICacheImp(outer: ICache) extends LazyModuleImp(outer) with HasICacheParameters with HasPerfEvents { 523 val io = IO(new ICacheIO) 524 525 println("ICache:") 526 println(" ICacheSets: " + cacheParams.nSets) 527 println(" ICacheWays: " + cacheParams.nWays) 528 println(" ICacheBanks: " + PortNumber) 529 println(" hasPrefetch: " + cacheParams.hasPrefetch) 530 if(cacheParams.hasPrefetch){ 531 println(" nPrefetchEntries: " + cacheParams.nPrefetchEntries) 532 println(" nPrefetchBufferEntries: " + cacheParams.nPrefBufferEntries) 533 println(" prefetchPipeNum: " + cacheParams.prefetchPipeNum) 534 } 535 536 val (bus, edge) = outer.clientNode.out.head 537 538 val metaArray = Module(new ICacheMetaArray) 539 val bankedMetaArray = Module(new ICacheBankedMetaArray(prefetchPipeNum + 1)) // need add 1 port for IPF filter 540 val dataArray = Module(new ICacheDataArray) 541 val mainPipe = Module(new ICacheMainPipe) 542 val missUnit = Module(new ICacheMissUnit(edge)) 543 val prefetchPipes = (0 until prefetchPipeNum).map( i => Module(new IPrefetchPipe)) 544 val ipfBuffer = Module(new PrefetchBuffer) 545 546 val meta_read_arb = Module(new Arbiter(new ICacheReadBundle, 1)) 547 val data_read_arb = Module(new Arbiter(Vec(partWayNum, new ICacheReadBundle), 1)) 548 val meta_write_arb = Module(new Arbiter(new ICacheMetaWriteBundle(), 2)) 549 val data_write_arb = Module(new Arbiter(new ICacheDataWriteBundle(), 2)) 550 val prefetch_req_arb = Module(new Arbiter(new PIQReq, prefetchPipeNum)) 551 552 mainPipe.io.hartId := io.hartId 553 ipfBuffer.io.hartId := io.hartId 554 mainPipe.io.PIQ <> missUnit.io.to_main_pipe 555 ipfBuffer.io.read <> mainPipe.io.iprefetchBuf 556 meta_write_arb.io.in(1) <> ipfBuffer.io.move.meta_write 557 data_write_arb.io.in(1) <> ipfBuffer.io.move.data_write 558 mainPipe.io.IPFBufMove <> ipfBuffer.io.replace 559 (0 until prefetchPipeNum).foreach(i => ipfBuffer.io.filter_read(i) <> prefetchPipes(i).io.IPFBufferRead) 560 (0 until prefetchPipeNum).foreach(i => mainPipe.io.missSlotInfo <> prefetchPipes(i).io.mainPipeMissSlotInfo) 561 mainPipe.io.mainPipeMissInfo <> ipfBuffer.io.mainpipe_missinfo 562 563 ipfBuffer.io.write <> missUnit.io.piq_write_ipbuffer 564 565 meta_read_arb.io.in(0) <> mainPipe.io.metaArray.toIMeta 566 metaArray.io.read <> meta_read_arb.io.out 567 bankedMetaArray.io.read(0) <> ipfBuffer.io.meta_filter_read_req 568 (0 until prefetchPipeNum).foreach(i => bankedMetaArray.io.read(i + 1) <> prefetchPipes(i).io.toIMeta) 569 570 mainPipe.io.metaArray.fromIMeta <> metaArray.io.readResp 571 ipfBuffer.io.meta_filter_read_resp <> bankedMetaArray.io.readResp(0) 572 (0 until prefetchPipeNum).foreach(i => bankedMetaArray.io.readResp(i + 1) <> prefetchPipes(i).io.fromIMeta) 573 574 data_read_arb.io.in(0) <> mainPipe.io.dataArray.toIData 575 dataArray.io.read <> data_read_arb.io.out 576 mainPipe.io.dataArray.fromIData <> dataArray.io.readResp 577 578 mainPipe.io.respStall := io.stop 579 io.perfInfo := mainPipe.io.perfInfo 580 581 meta_write_arb.io.in(0) <> missUnit.io.meta_write 582 data_write_arb.io.in(0) <> missUnit.io.data_write 583 584 metaArray.io.write <> meta_write_arb.io.out 585 bankedMetaArray.io.write <> meta_write_arb.io.out 586 587 dataArray.io.write <> data_write_arb.io.out 588 589 mainPipe.io.csr_parity_enable := io.csr_parity_enable 590 591 if(cacheParams.hasPrefetch){ 592 // TODO : perf enhance 593 val prefetchPipe_ready_vec = WireInit(VecInit(Seq.fill(prefetchPipeNum)(false.B))) 594 val alloc = RegInit(0.U(log2Up(prefetchPipeNum).W)) 595 alloc := alloc + io.prefetch.req.fire 596 (0 until prefetchPipeNum).foreach(i => { 597 prefetchPipes(i).io.fromFtq.req.valid := io.prefetch.req.valid && i.U === alloc 598 prefetchPipes(i).io.fromFtq.req.bits := io.prefetch.req.bits 599 prefetchPipe_ready_vec(i) := prefetchPipes(i).io.fromFtq.req.ready && i.U === alloc 600 }) 601 io.prefetch.req.ready := prefetchPipe_ready_vec.reduce(_||_) 602 when(!io.csr_pf_enable){ 603 (0 until prefetchPipeNum).foreach(i => { 604 prefetchPipes(i).io.fromFtq.req.valid := false.B 605 }) 606 io.prefetch.req.ready := true.B 607 } 608 } else { 609 (0 until prefetchPipeNum).foreach(i => prefetchPipes(i).io.fromFtq <> DontCare) 610 } 611 612 io.pmp(0) <> mainPipe.io.pmp(0) 613 io.pmp(1) <> mainPipe.io.pmp(1) 614 (0 until prefetchPipeNum).foreach(i => io.pmp(2 + i) <> prefetchPipes(i).io.pmp) 615 (0 until prefetchPipeNum).foreach(i => { 616 prefetchPipes(i).io.prefetchEnable := mainPipe.io.prefetchEnable 617 prefetchPipes(i).io.prefetchDisable := mainPipe.io.prefetchDisable 618 }) 619 620 621 //notify IFU that Icache pipeline is available 622 io.toIFU := mainPipe.io.fetch.req.ready 623 624 625 io.itlb(0) <> mainPipe.io.itlb(0) 626 io.itlb(1) <> mainPipe.io.itlb(1) 627 (0 until prefetchPipeNum).foreach(i => io.itlb(2 + i) <> prefetchPipes(i).io.iTLBInter) 628 629 630 io.fetch.resp <> mainPipe.io.fetch.resp 631 632 for(i <- 0 until PortNumber){ 633 missUnit.io.req(i) <> mainPipe.io.mshr(i).toMSHR 634 mainPipe.io.mshr(i).fromMSHR <> missUnit.io.resp(i) 635 } 636 637 (0 until prefetchPipeNum).foreach(i => prefetch_req_arb.io.in(i) <> prefetchPipes(i).io.toMissUnit.enqReq) 638 missUnit.io.prefetch_req <> prefetch_req_arb.io.out 639 missUnit.io.hartId := io.hartId 640 (0 until prefetchPipeNum).foreach(i => { 641 prefetchPipes(i).io.fromMSHR <> missUnit.io.mshr_info 642 prefetchPipes(i).io.fencei := false.B 643 prefetchPipes(i).io.freePIQEntry := missUnit.io.freePIQEntry 644 }) 645 646 bus.b.ready := false.B 647 bus.c.valid := false.B 648 bus.c.bits := DontCare 649 bus.e.valid := false.B 650 bus.e.bits := DontCare 651 652 bus.a <> missUnit.io.mem_acquire 653 654 // connect bus d 655 missUnit.io.mem_grant.valid := false.B 656 missUnit.io.mem_grant.bits := DontCare 657 658 //Parity error port 659 val errors = mainPipe.io.errors 660 io.error <> RegNext(Mux1H(errors.map(e => e.valid -> e))) 661 662 663 mainPipe.io.fetch.req <> io.fetch.req 664 bus.d.ready := false.B 665 missUnit.io.mem_grant <> bus.d 666 667 // fencei connect 668 metaArray.io.fencei := io.fencei 669 bankedMetaArray.io.fencei := io.fencei 670 ipfBuffer.io.fencei := io.fencei 671 missUnit.io.fencei := io.fencei 672 673 674 val perfEvents = Seq( 675 ("icache_miss_cnt ", false.B), 676 ("icache_miss_penty", BoolStopWatch(start = false.B, stop = false.B || false.B, startHighPriority = true)), 677 ) 678 generatePerfEvent() 679 680 // Customized csr cache op support 681 val cacheOpDecoder = Module(new CSRCacheOpDecoder("icache", CacheInstrucion.COP_ID_ICACHE)) 682 cacheOpDecoder.io.csr <> io.csr 683 dataArray.io.cacheOp.req := cacheOpDecoder.io.cache.req 684 metaArray.io.cacheOp.req := cacheOpDecoder.io.cache.req 685 bankedMetaArray.io.cacheOp.req := cacheOpDecoder.io.cache.req 686 cacheOpDecoder.io.cache.resp.valid := 687 dataArray.io.cacheOp.resp.valid || 688 metaArray.io.cacheOp.resp.valid 689 cacheOpDecoder.io.cache.resp.bits := Mux1H(List( 690 dataArray.io.cacheOp.resp.valid -> dataArray.io.cacheOp.resp.bits, 691 metaArray.io.cacheOp.resp.valid -> metaArray.io.cacheOp.resp.bits, 692 )) 693 cacheOpDecoder.io.error := io.error 694 assert(!((dataArray.io.cacheOp.resp.valid +& metaArray.io.cacheOp.resp.valid) > 1.U)) 695 696} 697 698class ICachePartWayReadBundle[T <: Data](gen: T, pWay: Int)(implicit p: Parameters) 699 extends ICacheBundle 700{ 701 val req = Flipped(Vec(PortNumber, Decoupled(new Bundle{ 702 val ridx = UInt((log2Ceil(nSets) - 1).W) 703 }))) 704 val resp = Output(new Bundle{ 705 val rdata = Vec(PortNumber,Vec(pWay, gen)) 706 }) 707} 708 709class ICacheWriteBundle[T <: Data](gen: T, pWay: Int)(implicit p: Parameters) 710 extends ICacheBundle 711{ 712 val wdata = gen 713 val widx = UInt((log2Ceil(nSets) - 1).W) 714 val wbankidx = Bool() 715 val wmask = Vec(pWay, Bool()) 716} 717 718class ICachePartWayArray[T <: Data](gen: T, pWay: Int)(implicit p: Parameters) extends ICacheArray 719{ 720 721 //including part way data 722 val io = IO{new Bundle { 723 val read = new ICachePartWayReadBundle(gen,pWay) 724 val write = Flipped(ValidIO(new ICacheWriteBundle(gen, pWay))) 725 }} 726 727 io.read.req.map(_.ready := !io.write.valid) 728 729 val srams = (0 until PortNumber) map { bank => 730 val sramBank = Module(new SRAMTemplate( 731 gen, 732 set=nSets/2, 733 way=pWay, 734 shouldReset = true, 735 holdRead = true, 736 singlePort = true 737 )) 738 739 sramBank.io.r.req.valid := io.read.req(bank).valid 740 sramBank.io.r.req.bits.apply(setIdx= io.read.req(bank).bits.ridx) 741 742 if(bank == 0) sramBank.io.w.req.valid := io.write.valid && !io.write.bits.wbankidx 743 else sramBank.io.w.req.valid := io.write.valid && io.write.bits.wbankidx 744 sramBank.io.w.req.bits.apply(data=io.write.bits.wdata, setIdx=io.write.bits.widx, waymask=io.write.bits.wmask.asUInt()) 745 746 sramBank 747 } 748 749 io.read.req.map(_.ready := !io.write.valid && srams.map(_.io.r.req.ready).reduce(_&&_)) 750 751 io.read.resp.rdata := VecInit(srams.map(bank => bank.io.r.resp.asTypeOf(Vec(pWay,gen)))) 752 753} 754