1c7658a75SYinan Xupackage xiangshan.mem 2c7658a75SYinan Xu 3c7658a75SYinan Xuimport chisel3._ 4c7658a75SYinan Xuimport chisel3.util._ 5c7658a75SYinan Xuimport utils._ 6c7658a75SYinan Xuimport xiangshan._ 7c7658a75SYinan Xuimport xiangshan.cache._ 8c7658a75SYinan Xuimport xiangshan.cache.{DCacheWordIO, DCacheLineIO, TlbRequestIO, MemoryOpConstants} 9c7658a75SYinan Xuimport xiangshan.backend.LSUOpType 10c7658a75SYinan Xuimport xiangshan.mem._ 11c7658a75SYinan Xuimport xiangshan.backend.roq.RoqPtr 12c7658a75SYinan Xu 13c7658a75SYinan Xuclass ExceptionAddrIO extends XSBundle { 14c7658a75SYinan Xu val lsIdx = Input(new LSIdx) 15c7658a75SYinan Xu val isStore = Input(Bool()) 16c7658a75SYinan Xu val vaddr = Output(UInt(VAddrBits.W)) 17c7658a75SYinan Xu} 18c7658a75SYinan Xu 19c7658a75SYinan Xu 200bd67ba5SYinan Xuclass LsqEntry extends XSBundle { 21c7658a75SYinan Xu val vaddr = UInt(VAddrBits.W) // TODO: need opt 22c7658a75SYinan Xu val paddr = UInt(PAddrBits.W) 23c7658a75SYinan Xu val op = UInt(6.W) 24c7658a75SYinan Xu val mask = UInt(8.W) 25c7658a75SYinan Xu val data = UInt(XLEN.W) 26c7658a75SYinan Xu val exception = UInt(16.W) // TODO: opt size 27c7658a75SYinan Xu val mmio = Bool() 28c7658a75SYinan Xu val fwdMask = Vec(8, Bool()) 29c7658a75SYinan Xu val fwdData = Vec(8, UInt(8.W)) 30c7658a75SYinan Xu} 31c7658a75SYinan Xu 32*eb8f00f4SWilliam Wang 33*eb8f00f4SWilliam Wangclass LSQueueData(size: Int, nchannel: Int) extends XSModule with HasDCacheParameters with HasCircularQueuePtrHelper { 34*eb8f00f4SWilliam Wang val io = IO(new Bundle() { 35*eb8f00f4SWilliam Wang val wb = Vec(nchannel, new Bundle() { 36*eb8f00f4SWilliam Wang val wen = Input(Bool()) 37*eb8f00f4SWilliam Wang val index = Input(UInt(log2Up(size).W)) 38*eb8f00f4SWilliam Wang val wdata = Input(new LsRoqEntry) 39*eb8f00f4SWilliam Wang }) 40*eb8f00f4SWilliam Wang val uncache = new Bundle() { 41*eb8f00f4SWilliam Wang val wen = Input(Bool()) 42*eb8f00f4SWilliam Wang val index = Input(UInt(log2Up(size).W)) 43*eb8f00f4SWilliam Wang val wdata = Input(UInt(XLEN.W)) 44*eb8f00f4SWilliam Wang } 45*eb8f00f4SWilliam Wang val refill = new Bundle() { 46*eb8f00f4SWilliam Wang val wen = Input(Vec(size, Bool())) 47*eb8f00f4SWilliam Wang val dcache = Input(new DCacheLineResp) 48*eb8f00f4SWilliam Wang } 49*eb8f00f4SWilliam Wang val needForward = Input(Vec(nchannel, Vec(2, UInt(size.W)))) 50*eb8f00f4SWilliam Wang val forward = Vec(nchannel, Flipped(new LoadForwardQueryIO)) 51*eb8f00f4SWilliam Wang val rdata = Output(Vec(size, new LsRoqEntry)) 52*eb8f00f4SWilliam Wang 53*eb8f00f4SWilliam Wang // val debug = new Bundle() { 54*eb8f00f4SWilliam Wang // val debug_data = Vec(LoadQueueSize, new LsRoqEntry) 55*eb8f00f4SWilliam Wang // } 56*eb8f00f4SWilliam Wang 57*eb8f00f4SWilliam Wang def wbWrite(channel: Int, index: UInt, wdata: LsRoqEntry): Unit = { 58*eb8f00f4SWilliam Wang require(channel < nchannel && channel >= 0) 59*eb8f00f4SWilliam Wang // need extra "this.wb(channel).wen := true.B" 60*eb8f00f4SWilliam Wang this.wb(channel).index := index 61*eb8f00f4SWilliam Wang this.wb(channel).wdata := wdata 62*eb8f00f4SWilliam Wang } 63*eb8f00f4SWilliam Wang 64*eb8f00f4SWilliam Wang def uncacheWrite(index: UInt, wdata: UInt): Unit = { 65*eb8f00f4SWilliam Wang // need extra "this.uncache.wen := true.B" 66*eb8f00f4SWilliam Wang this.uncache.index := index 67*eb8f00f4SWilliam Wang this.uncache.wdata := wdata 68*eb8f00f4SWilliam Wang } 69*eb8f00f4SWilliam Wang 70*eb8f00f4SWilliam Wang def forwardQuery(channel: Int, paddr: UInt, needForward1: Data, needForward2: Data): Unit = { 71*eb8f00f4SWilliam Wang this.needForward(channel)(0) := needForward1 72*eb8f00f4SWilliam Wang this.needForward(channel)(1) := needForward2 73*eb8f00f4SWilliam Wang this.forward(channel).paddr := paddr 74*eb8f00f4SWilliam Wang } 75*eb8f00f4SWilliam Wang 76*eb8f00f4SWilliam Wang // def refillWrite(ldIdx: Int): Unit = { 77*eb8f00f4SWilliam Wang // } 78*eb8f00f4SWilliam Wang // use "this.refill.wen(ldIdx) := true.B" instead 79*eb8f00f4SWilliam Wang }) 80*eb8f00f4SWilliam Wang 81*eb8f00f4SWilliam Wang io := DontCare 82*eb8f00f4SWilliam Wang 83*eb8f00f4SWilliam Wang val data = Reg(Vec(size, new LsRoqEntry)) 84*eb8f00f4SWilliam Wang 85*eb8f00f4SWilliam Wang // writeback to lq/sq 86*eb8f00f4SWilliam Wang (0 until 2).map(i => { 87*eb8f00f4SWilliam Wang when(io.wb(i).wen){ 88*eb8f00f4SWilliam Wang data(io.wb(i).index) := io.wb(i).wdata 89*eb8f00f4SWilliam Wang } 90*eb8f00f4SWilliam Wang }) 91*eb8f00f4SWilliam Wang 92*eb8f00f4SWilliam Wang when(io.uncache.wen){ 93*eb8f00f4SWilliam Wang data(io.uncache.index).data := io.uncache.wdata 94*eb8f00f4SWilliam Wang } 95*eb8f00f4SWilliam Wang 96*eb8f00f4SWilliam Wang // refill missed load 97*eb8f00f4SWilliam Wang def mergeRefillData(refill: UInt, fwd: UInt, fwdMask: UInt): UInt = { 98*eb8f00f4SWilliam Wang val res = Wire(Vec(8, UInt(8.W))) 99*eb8f00f4SWilliam Wang (0 until 8).foreach(i => { 100*eb8f00f4SWilliam Wang res(i) := Mux(fwdMask(i), fwd(8 * (i + 1) - 1, 8 * i), refill(8 * (i + 1) - 1, 8 * i)) 101*eb8f00f4SWilliam Wang }) 102*eb8f00f4SWilliam Wang res.asUInt 103*eb8f00f4SWilliam Wang } 104*eb8f00f4SWilliam Wang 105*eb8f00f4SWilliam Wang // split dcache result into words 106*eb8f00f4SWilliam Wang val words = VecInit((0 until blockWords) map { i => 107*eb8f00f4SWilliam Wang io.refill.dcache.data(DataBits * (i + 1) - 1, DataBits * i) 108*eb8f00f4SWilliam Wang }) 109*eb8f00f4SWilliam Wang 110*eb8f00f4SWilliam Wang 111*eb8f00f4SWilliam Wang (0 until size).map(i => { 112*eb8f00f4SWilliam Wang when(io.refill.wen(i) ){ 113*eb8f00f4SWilliam Wang val refillData = words(get_word(data(i).paddr)) 114*eb8f00f4SWilliam Wang data(i).data := mergeRefillData(refillData, data(i).fwdData.asUInt, data(i).fwdMask.asUInt) 115*eb8f00f4SWilliam Wang XSDebug("miss resp: pos %d addr %x data %x + %x(%b)\n", i.U, data(i).paddr, refillData, data(i).fwdData.asUInt, data(i).fwdMask.asUInt) 116*eb8f00f4SWilliam Wang } 117*eb8f00f4SWilliam Wang }) 118*eb8f00f4SWilliam Wang 119*eb8f00f4SWilliam Wang // forwarding 120*eb8f00f4SWilliam Wang // Compare ringBufferTail (deqPtr) and forward.sqIdx, we have two cases: 121*eb8f00f4SWilliam Wang // (1) if they have the same flag, we need to check range(tail, sqIdx) 122*eb8f00f4SWilliam Wang // (2) if they have different flags, we need to check range(tail, LoadQueueSize) and range(0, sqIdx) 123*eb8f00f4SWilliam Wang // Forward1: Mux(same_flag, range(tail, sqIdx), range(tail, LoadQueueSize)) 124*eb8f00f4SWilliam Wang // Forward2: Mux(same_flag, 0.U, range(0, sqIdx) ) 125*eb8f00f4SWilliam Wang // i.e. forward1 is the target entries with the same flag bits and forward2 otherwise 126*eb8f00f4SWilliam Wang 127*eb8f00f4SWilliam Wang // entry with larger index should have higher priority since it's data is younger 128*eb8f00f4SWilliam Wang (0 until nchannel).map(i => { 129*eb8f00f4SWilliam Wang 130*eb8f00f4SWilliam Wang val forwardMask1 = WireInit(VecInit(Seq.fill(8)(false.B))) 131*eb8f00f4SWilliam Wang val forwardData1 = WireInit(VecInit(Seq.fill(8)(0.U(8.W)))) 132*eb8f00f4SWilliam Wang val forwardMask2 = WireInit(VecInit(Seq.fill(8)(false.B))) 133*eb8f00f4SWilliam Wang val forwardData2 = WireInit(VecInit(Seq.fill(8)(0.U(8.W)))) 134*eb8f00f4SWilliam Wang 135*eb8f00f4SWilliam Wang for (j <- 0 until size) { 136*eb8f00f4SWilliam Wang val needCheck = io.forward(i).paddr(PAddrBits - 1, 3) === data(j).paddr(PAddrBits - 1, 3) 137*eb8f00f4SWilliam Wang (0 until XLEN / 8).foreach(k => { 138*eb8f00f4SWilliam Wang when (needCheck && data(j).mask(k)) { 139*eb8f00f4SWilliam Wang when (io.needForward(i)(0)(j)) { 140*eb8f00f4SWilliam Wang forwardMask1(k) := true.B 141*eb8f00f4SWilliam Wang forwardData1(k) := data(j).data(8 * (k + 1) - 1, 8 * k) 142*eb8f00f4SWilliam Wang } 143*eb8f00f4SWilliam Wang when (io.needForward(i)(1)(j)) { 144*eb8f00f4SWilliam Wang forwardMask2(k) := true.B 145*eb8f00f4SWilliam Wang forwardData2(k) := data(j).data(8 * (k + 1) - 1, 8 * k) 146*eb8f00f4SWilliam Wang } 147*eb8f00f4SWilliam Wang XSDebug(io.needForward(i)(0)(j) || io.needForward(i)(1)(j), 148*eb8f00f4SWilliam Wang p"forwarding $k-th byte ${Hexadecimal(data(j).data(8 * (k + 1) - 1, 8 * k))} " + 149*eb8f00f4SWilliam Wang p"from ptr $j\n") 150*eb8f00f4SWilliam Wang } 151*eb8f00f4SWilliam Wang }) 152*eb8f00f4SWilliam Wang } 153*eb8f00f4SWilliam Wang 154*eb8f00f4SWilliam Wang // merge forward lookup results 155*eb8f00f4SWilliam Wang // forward2 is younger than forward1 and should have higher priority 156*eb8f00f4SWilliam Wang (0 until XLEN / 8).map(k => { 157*eb8f00f4SWilliam Wang io.forward(i).forwardMask(k) := forwardMask1(k) || forwardMask2(k) 158*eb8f00f4SWilliam Wang io.forward(i).forwardData(k) := Mux(forwardMask2(k), forwardData2(k), forwardData1(k)) 159*eb8f00f4SWilliam Wang }) 160*eb8f00f4SWilliam Wang }) 161*eb8f00f4SWilliam Wang 162*eb8f00f4SWilliam Wang // data read 163*eb8f00f4SWilliam Wang io.rdata := data 164*eb8f00f4SWilliam Wang // io.debug.debug_data := data 165*eb8f00f4SWilliam Wang} 166*eb8f00f4SWilliam Wang 167c7658a75SYinan Xu// inflight miss block reqs 168c7658a75SYinan Xuclass InflightBlockInfo extends XSBundle { 169c7658a75SYinan Xu val block_addr = UInt(PAddrBits.W) 170c7658a75SYinan Xu val valid = Bool() 171c7658a75SYinan Xu} 172c7658a75SYinan Xu 173c7658a75SYinan Xu// Load / Store Queue Wrapper for XiangShan Out of Order LSU 174c7658a75SYinan Xuclass LsqWrappper extends XSModule with HasDCacheParameters { 175c7658a75SYinan Xu val io = IO(new Bundle() { 176c7658a75SYinan Xu val dp1Req = Vec(RenameWidth, Flipped(DecoupledIO(new MicroOp))) 177c7658a75SYinan Xu val lsIdxs = Output(Vec(RenameWidth, new LSIdx)) 178c7658a75SYinan Xu val brqRedirect = Input(Valid(new Redirect)) 179c7658a75SYinan Xu val loadIn = Vec(LoadPipelineWidth, Flipped(Valid(new LsPipelineBundle))) 180c7658a75SYinan Xu val storeIn = Vec(StorePipelineWidth, Flipped(Valid(new LsPipelineBundle))) 181c7658a75SYinan Xu val sbuffer = Vec(StorePipelineWidth, Decoupled(new DCacheWordReq)) 182c7658a75SYinan Xu val ldout = Vec(2, DecoupledIO(new ExuOutput)) // writeback store 183c7658a75SYinan Xu val stout = Vec(2, DecoupledIO(new ExuOutput)) // writeback store 184c7658a75SYinan Xu val forward = Vec(LoadPipelineWidth, Flipped(new LoadForwardQueryIO)) 185c7658a75SYinan Xu val commits = Flipped(Vec(CommitWidth, Valid(new RoqCommit))) 186c7658a75SYinan Xu val rollback = Output(Valid(new Redirect)) 187c7658a75SYinan Xu val dcache = new DCacheLineIO 188c7658a75SYinan Xu val uncache = new DCacheWordIO 189c7658a75SYinan Xu val roqDeqPtr = Input(new RoqPtr) 190c7658a75SYinan Xu val oldestStore = Output(Valid(new RoqPtr)) 191c7658a75SYinan Xu val exceptionAddr = new ExceptionAddrIO 192c7658a75SYinan Xu }) 193c7658a75SYinan Xu 194c7658a75SYinan Xu val loadQueue = Module(new LoadQueue) 195c7658a75SYinan Xu val storeQueue = Module(new StoreQueue) 196c7658a75SYinan Xu 197c7658a75SYinan Xu // load queue wiring 198c7658a75SYinan Xu loadQueue.io.dp1Req <> io.dp1Req 199c7658a75SYinan Xu loadQueue.io.brqRedirect <> io.brqRedirect 200c7658a75SYinan Xu loadQueue.io.loadIn <> io.loadIn 201c7658a75SYinan Xu loadQueue.io.storeIn <> io.storeIn 202c7658a75SYinan Xu loadQueue.io.ldout <> io.ldout 203c7658a75SYinan Xu loadQueue.io.commits <> io.commits 204c7658a75SYinan Xu loadQueue.io.rollback <> io.rollback 205c7658a75SYinan Xu loadQueue.io.dcache <> io.dcache 206c7658a75SYinan Xu loadQueue.io.roqDeqPtr <> io.roqDeqPtr 207c7658a75SYinan Xu loadQueue.io.exceptionAddr.lsIdx := io.exceptionAddr.lsIdx 208c7658a75SYinan Xu loadQueue.io.exceptionAddr.isStore := DontCare 209c7658a75SYinan Xu 210c7658a75SYinan Xu // store queue wiring 211c7658a75SYinan Xu // storeQueue.io <> DontCare 212c7658a75SYinan Xu storeQueue.io.dp1Req <> io.dp1Req 213c7658a75SYinan Xu storeQueue.io.brqRedirect <> io.brqRedirect 214c7658a75SYinan Xu storeQueue.io.storeIn <> io.storeIn 215c7658a75SYinan Xu storeQueue.io.sbuffer <> io.sbuffer 216c7658a75SYinan Xu storeQueue.io.stout <> io.stout 217c7658a75SYinan Xu storeQueue.io.commits <> io.commits 218c7658a75SYinan Xu storeQueue.io.roqDeqPtr <> io.roqDeqPtr 219c7658a75SYinan Xu storeQueue.io.oldestStore <> io.oldestStore 220c7658a75SYinan Xu storeQueue.io.exceptionAddr.lsIdx := io.exceptionAddr.lsIdx 221c7658a75SYinan Xu storeQueue.io.exceptionAddr.isStore := DontCare 222c7658a75SYinan Xu 223c7658a75SYinan Xu loadQueue.io.forward <> io.forward 224c7658a75SYinan Xu storeQueue.io.forward <> io.forward // overlap forwardMask & forwardData, DO NOT CHANGE SEQUENCE 225c7658a75SYinan Xu 226c7658a75SYinan Xu io.exceptionAddr.vaddr := Mux(io.exceptionAddr.isStore, storeQueue.io.exceptionAddr.vaddr, loadQueue.io.exceptionAddr.vaddr) 227c7658a75SYinan Xu 228c7658a75SYinan Xu // naive uncache arbiter 229c7658a75SYinan Xu val s_idle :: s_load :: s_store :: Nil = Enum(3) 230c7658a75SYinan Xu val uncacheState = RegInit(s_idle) 231c7658a75SYinan Xu 232c7658a75SYinan Xu switch(uncacheState){ 233c7658a75SYinan Xu is(s_idle){ 234c7658a75SYinan Xu when(io.uncache.req.fire()){ 235c7658a75SYinan Xu uncacheState := Mux(loadQueue.io.uncache.req.valid, s_load, s_store) 236c7658a75SYinan Xu } 237c7658a75SYinan Xu } 238c7658a75SYinan Xu is(s_load){ 239c7658a75SYinan Xu when(io.uncache.resp.fire()){ 240c7658a75SYinan Xu uncacheState := s_idle 241c7658a75SYinan Xu } 242c7658a75SYinan Xu } 243c7658a75SYinan Xu is(s_store){ 244c7658a75SYinan Xu when(io.uncache.resp.fire()){ 245c7658a75SYinan Xu uncacheState := s_idle 246c7658a75SYinan Xu } 247c7658a75SYinan Xu } 248c7658a75SYinan Xu } 249c7658a75SYinan Xu 250c7658a75SYinan Xu loadQueue.io.uncache := DontCare 251c7658a75SYinan Xu storeQueue.io.uncache := DontCare 252c7658a75SYinan Xu loadQueue.io.uncache.resp.valid := false.B 253c7658a75SYinan Xu storeQueue.io.uncache.resp.valid := false.B 254c7658a75SYinan Xu when(loadQueue.io.uncache.req.valid){ 255c7658a75SYinan Xu io.uncache.req <> loadQueue.io.uncache.req 256c7658a75SYinan Xu }.otherwise{ 257c7658a75SYinan Xu io.uncache.req <> storeQueue.io.uncache.req 258c7658a75SYinan Xu } 259c7658a75SYinan Xu when(uncacheState === s_load){ 260c7658a75SYinan Xu io.uncache.resp <> loadQueue.io.uncache.resp 261c7658a75SYinan Xu }.otherwise{ 262c7658a75SYinan Xu io.uncache.resp <> storeQueue.io.uncache.resp 263c7658a75SYinan Xu } 264c7658a75SYinan Xu 265c7658a75SYinan Xu assert(!(loadQueue.io.uncache.req.valid && storeQueue.io.uncache.req.valid)) 266c7658a75SYinan Xu assert(!(loadQueue.io.uncache.resp.valid && storeQueue.io.uncache.resp.valid)) 267c7658a75SYinan Xu assert(!((loadQueue.io.uncache.resp.valid || storeQueue.io.uncache.resp.valid) && uncacheState === s_idle)) 268c7658a75SYinan Xu 269c7658a75SYinan Xu // fix valid, allocate lq / sq index 270c7658a75SYinan Xu (0 until RenameWidth).map(i => { 271c7658a75SYinan Xu val isStore = CommitType.lsInstIsStore(io.dp1Req(i).bits.ctrl.commitType) 272*eb8f00f4SWilliam Wang loadQueue.io.dp1Req(i).valid := !isStore && io.dp1Req(i).valid 273*eb8f00f4SWilliam Wang storeQueue.io.dp1Req(i).valid := isStore && io.dp1Req(i).valid 274c7658a75SYinan Xu loadQueue.io.lqIdxs(i) <> io.lsIdxs(i).lqIdx 275c7658a75SYinan Xu storeQueue.io.sqIdxs(i) <> io.lsIdxs(i).sqIdx 276*eb8f00f4SWilliam Wang loadQueue.io.lqReady <> storeQueue.io.lqReady 277*eb8f00f4SWilliam Wang loadQueue.io.sqReady <> storeQueue.io.sqReady 278*eb8f00f4SWilliam Wang io.lsIdxs(i).lsroqIdx := DontCare 279c7658a75SYinan Xu io.dp1Req(i).ready := storeQueue.io.dp1Req(i).ready && loadQueue.io.dp1Req(i).ready 280c7658a75SYinan Xu }) 281c7658a75SYinan Xu } 282*eb8f00f4SWilliam Wang} 283