xref: /XiangShan/src/main/scala/xiangshan/mem/lsqueue/LSQWrapper.scala (revision eb8f00f495e15db4736a081008ef42b091d7d463)
1c7658a75SYinan Xupackage xiangshan.mem
2c7658a75SYinan Xu
3c7658a75SYinan Xuimport chisel3._
4c7658a75SYinan Xuimport chisel3.util._
5c7658a75SYinan Xuimport utils._
6c7658a75SYinan Xuimport xiangshan._
7c7658a75SYinan Xuimport xiangshan.cache._
8c7658a75SYinan Xuimport xiangshan.cache.{DCacheWordIO, DCacheLineIO, TlbRequestIO, MemoryOpConstants}
9c7658a75SYinan Xuimport xiangshan.backend.LSUOpType
10c7658a75SYinan Xuimport xiangshan.mem._
11c7658a75SYinan Xuimport xiangshan.backend.roq.RoqPtr
12c7658a75SYinan Xu
13c7658a75SYinan Xuclass ExceptionAddrIO extends XSBundle {
14c7658a75SYinan Xu  val lsIdx = Input(new LSIdx)
15c7658a75SYinan Xu  val isStore = Input(Bool())
16c7658a75SYinan Xu  val vaddr = Output(UInt(VAddrBits.W))
17c7658a75SYinan Xu}
18c7658a75SYinan Xu
19c7658a75SYinan Xu
200bd67ba5SYinan Xuclass LsqEntry extends XSBundle {
21c7658a75SYinan Xu  val vaddr = UInt(VAddrBits.W) // TODO: need opt
22c7658a75SYinan Xu  val paddr = UInt(PAddrBits.W)
23c7658a75SYinan Xu  val op = UInt(6.W)
24c7658a75SYinan Xu  val mask = UInt(8.W)
25c7658a75SYinan Xu  val data = UInt(XLEN.W)
26c7658a75SYinan Xu  val exception = UInt(16.W) // TODO: opt size
27c7658a75SYinan Xu  val mmio = Bool()
28c7658a75SYinan Xu  val fwdMask = Vec(8, Bool())
29c7658a75SYinan Xu  val fwdData = Vec(8, UInt(8.W))
30c7658a75SYinan Xu}
31c7658a75SYinan Xu
32*eb8f00f4SWilliam Wang
33*eb8f00f4SWilliam Wangclass LSQueueData(size: Int, nchannel: Int) extends XSModule with HasDCacheParameters with HasCircularQueuePtrHelper {
34*eb8f00f4SWilliam Wang  val io = IO(new Bundle() {
35*eb8f00f4SWilliam Wang    val wb = Vec(nchannel, new Bundle() {
36*eb8f00f4SWilliam Wang      val wen = Input(Bool())
37*eb8f00f4SWilliam Wang      val index = Input(UInt(log2Up(size).W))
38*eb8f00f4SWilliam Wang      val wdata = Input(new LsRoqEntry)
39*eb8f00f4SWilliam Wang    })
40*eb8f00f4SWilliam Wang    val uncache = new Bundle() {
41*eb8f00f4SWilliam Wang      val wen = Input(Bool())
42*eb8f00f4SWilliam Wang      val index = Input(UInt(log2Up(size).W))
43*eb8f00f4SWilliam Wang      val wdata = Input(UInt(XLEN.W))
44*eb8f00f4SWilliam Wang    }
45*eb8f00f4SWilliam Wang    val refill = new Bundle() {
46*eb8f00f4SWilliam Wang      val wen = Input(Vec(size, Bool()))
47*eb8f00f4SWilliam Wang      val dcache = Input(new DCacheLineResp)
48*eb8f00f4SWilliam Wang    }
49*eb8f00f4SWilliam Wang    val needForward = Input(Vec(nchannel, Vec(2, UInt(size.W))))
50*eb8f00f4SWilliam Wang    val forward = Vec(nchannel, Flipped(new LoadForwardQueryIO))
51*eb8f00f4SWilliam Wang    val rdata = Output(Vec(size, new LsRoqEntry))
52*eb8f00f4SWilliam Wang
53*eb8f00f4SWilliam Wang    // val debug = new Bundle() {
54*eb8f00f4SWilliam Wang    //   val debug_data = Vec(LoadQueueSize, new LsRoqEntry)
55*eb8f00f4SWilliam Wang    // }
56*eb8f00f4SWilliam Wang
57*eb8f00f4SWilliam Wang    def wbWrite(channel: Int, index: UInt, wdata: LsRoqEntry): Unit = {
58*eb8f00f4SWilliam Wang      require(channel < nchannel && channel >= 0)
59*eb8f00f4SWilliam Wang      // need extra "this.wb(channel).wen := true.B"
60*eb8f00f4SWilliam Wang      this.wb(channel).index := index
61*eb8f00f4SWilliam Wang      this.wb(channel).wdata := wdata
62*eb8f00f4SWilliam Wang    }
63*eb8f00f4SWilliam Wang
64*eb8f00f4SWilliam Wang    def uncacheWrite(index: UInt, wdata: UInt): Unit = {
65*eb8f00f4SWilliam Wang      // need extra "this.uncache.wen := true.B"
66*eb8f00f4SWilliam Wang      this.uncache.index := index
67*eb8f00f4SWilliam Wang      this.uncache.wdata := wdata
68*eb8f00f4SWilliam Wang    }
69*eb8f00f4SWilliam Wang
70*eb8f00f4SWilliam Wang    def forwardQuery(channel: Int, paddr: UInt, needForward1: Data, needForward2: Data): Unit = {
71*eb8f00f4SWilliam Wang      this.needForward(channel)(0) := needForward1
72*eb8f00f4SWilliam Wang      this.needForward(channel)(1) := needForward2
73*eb8f00f4SWilliam Wang      this.forward(channel).paddr := paddr
74*eb8f00f4SWilliam Wang    }
75*eb8f00f4SWilliam Wang
76*eb8f00f4SWilliam Wang    // def refillWrite(ldIdx: Int): Unit = {
77*eb8f00f4SWilliam Wang    // }
78*eb8f00f4SWilliam Wang    // use "this.refill.wen(ldIdx) := true.B" instead
79*eb8f00f4SWilliam Wang  })
80*eb8f00f4SWilliam Wang
81*eb8f00f4SWilliam Wang  io := DontCare
82*eb8f00f4SWilliam Wang
83*eb8f00f4SWilliam Wang  val data = Reg(Vec(size, new LsRoqEntry))
84*eb8f00f4SWilliam Wang
85*eb8f00f4SWilliam Wang  // writeback to lq/sq
86*eb8f00f4SWilliam Wang  (0 until 2).map(i => {
87*eb8f00f4SWilliam Wang    when(io.wb(i).wen){
88*eb8f00f4SWilliam Wang      data(io.wb(i).index) := io.wb(i).wdata
89*eb8f00f4SWilliam Wang    }
90*eb8f00f4SWilliam Wang  })
91*eb8f00f4SWilliam Wang
92*eb8f00f4SWilliam Wang  when(io.uncache.wen){
93*eb8f00f4SWilliam Wang    data(io.uncache.index).data := io.uncache.wdata
94*eb8f00f4SWilliam Wang  }
95*eb8f00f4SWilliam Wang
96*eb8f00f4SWilliam Wang  // refill missed load
97*eb8f00f4SWilliam Wang  def mergeRefillData(refill: UInt, fwd: UInt, fwdMask: UInt): UInt = {
98*eb8f00f4SWilliam Wang    val res = Wire(Vec(8, UInt(8.W)))
99*eb8f00f4SWilliam Wang    (0 until 8).foreach(i => {
100*eb8f00f4SWilliam Wang      res(i) := Mux(fwdMask(i), fwd(8 * (i + 1) - 1, 8 * i), refill(8 * (i + 1) - 1, 8 * i))
101*eb8f00f4SWilliam Wang    })
102*eb8f00f4SWilliam Wang    res.asUInt
103*eb8f00f4SWilliam Wang  }
104*eb8f00f4SWilliam Wang
105*eb8f00f4SWilliam Wang  // split dcache result into words
106*eb8f00f4SWilliam Wang  val words = VecInit((0 until blockWords) map { i =>
107*eb8f00f4SWilliam Wang    io.refill.dcache.data(DataBits * (i + 1) - 1, DataBits * i)
108*eb8f00f4SWilliam Wang  })
109*eb8f00f4SWilliam Wang
110*eb8f00f4SWilliam Wang
111*eb8f00f4SWilliam Wang  (0 until size).map(i => {
112*eb8f00f4SWilliam Wang    when(io.refill.wen(i) ){
113*eb8f00f4SWilliam Wang      val refillData = words(get_word(data(i).paddr))
114*eb8f00f4SWilliam Wang      data(i).data := mergeRefillData(refillData, data(i).fwdData.asUInt, data(i).fwdMask.asUInt)
115*eb8f00f4SWilliam Wang      XSDebug("miss resp: pos %d addr %x data %x + %x(%b)\n", i.U, data(i).paddr, refillData, data(i).fwdData.asUInt, data(i).fwdMask.asUInt)
116*eb8f00f4SWilliam Wang    }
117*eb8f00f4SWilliam Wang  })
118*eb8f00f4SWilliam Wang
119*eb8f00f4SWilliam Wang  // forwarding
120*eb8f00f4SWilliam Wang  // Compare ringBufferTail (deqPtr) and forward.sqIdx, we have two cases:
121*eb8f00f4SWilliam Wang  // (1) if they have the same flag, we need to check range(tail, sqIdx)
122*eb8f00f4SWilliam Wang  // (2) if they have different flags, we need to check range(tail, LoadQueueSize) and range(0, sqIdx)
123*eb8f00f4SWilliam Wang  // Forward1: Mux(same_flag, range(tail, sqIdx), range(tail, LoadQueueSize))
124*eb8f00f4SWilliam Wang  // Forward2: Mux(same_flag, 0.U,                   range(0, sqIdx)    )
125*eb8f00f4SWilliam Wang  // i.e. forward1 is the target entries with the same flag bits and forward2 otherwise
126*eb8f00f4SWilliam Wang
127*eb8f00f4SWilliam Wang  // entry with larger index should have higher priority since it's data is younger
128*eb8f00f4SWilliam Wang  (0 until nchannel).map(i => {
129*eb8f00f4SWilliam Wang
130*eb8f00f4SWilliam Wang    val forwardMask1 = WireInit(VecInit(Seq.fill(8)(false.B)))
131*eb8f00f4SWilliam Wang    val forwardData1 = WireInit(VecInit(Seq.fill(8)(0.U(8.W))))
132*eb8f00f4SWilliam Wang    val forwardMask2 = WireInit(VecInit(Seq.fill(8)(false.B)))
133*eb8f00f4SWilliam Wang    val forwardData2 = WireInit(VecInit(Seq.fill(8)(0.U(8.W))))
134*eb8f00f4SWilliam Wang
135*eb8f00f4SWilliam Wang    for (j <- 0 until size) {
136*eb8f00f4SWilliam Wang      val needCheck = io.forward(i).paddr(PAddrBits - 1, 3) === data(j).paddr(PAddrBits - 1, 3)
137*eb8f00f4SWilliam Wang      (0 until XLEN / 8).foreach(k => {
138*eb8f00f4SWilliam Wang        when (needCheck && data(j).mask(k)) {
139*eb8f00f4SWilliam Wang          when (io.needForward(i)(0)(j)) {
140*eb8f00f4SWilliam Wang            forwardMask1(k) := true.B
141*eb8f00f4SWilliam Wang            forwardData1(k) := data(j).data(8 * (k + 1) - 1, 8 * k)
142*eb8f00f4SWilliam Wang          }
143*eb8f00f4SWilliam Wang          when (io.needForward(i)(1)(j)) {
144*eb8f00f4SWilliam Wang            forwardMask2(k) := true.B
145*eb8f00f4SWilliam Wang            forwardData2(k) := data(j).data(8 * (k + 1) - 1, 8 * k)
146*eb8f00f4SWilliam Wang          }
147*eb8f00f4SWilliam Wang          XSDebug(io.needForward(i)(0)(j) || io.needForward(i)(1)(j),
148*eb8f00f4SWilliam Wang            p"forwarding $k-th byte ${Hexadecimal(data(j).data(8 * (k + 1) - 1, 8 * k))} " +
149*eb8f00f4SWilliam Wang            p"from ptr $j\n")
150*eb8f00f4SWilliam Wang        }
151*eb8f00f4SWilliam Wang      })
152*eb8f00f4SWilliam Wang    }
153*eb8f00f4SWilliam Wang
154*eb8f00f4SWilliam Wang    // merge forward lookup results
155*eb8f00f4SWilliam Wang    // forward2 is younger than forward1 and should have higher priority
156*eb8f00f4SWilliam Wang    (0 until XLEN / 8).map(k => {
157*eb8f00f4SWilliam Wang      io.forward(i).forwardMask(k) := forwardMask1(k) || forwardMask2(k)
158*eb8f00f4SWilliam Wang      io.forward(i).forwardData(k) := Mux(forwardMask2(k), forwardData2(k), forwardData1(k))
159*eb8f00f4SWilliam Wang    })
160*eb8f00f4SWilliam Wang  })
161*eb8f00f4SWilliam Wang
162*eb8f00f4SWilliam Wang  // data read
163*eb8f00f4SWilliam Wang  io.rdata := data
164*eb8f00f4SWilliam Wang  // io.debug.debug_data := data
165*eb8f00f4SWilliam Wang}
166*eb8f00f4SWilliam Wang
167c7658a75SYinan Xu// inflight miss block reqs
168c7658a75SYinan Xuclass InflightBlockInfo extends XSBundle {
169c7658a75SYinan Xu  val block_addr = UInt(PAddrBits.W)
170c7658a75SYinan Xu  val valid = Bool()
171c7658a75SYinan Xu}
172c7658a75SYinan Xu
173c7658a75SYinan Xu// Load / Store Queue Wrapper for XiangShan Out of Order LSU
174c7658a75SYinan Xuclass LsqWrappper extends XSModule with HasDCacheParameters {
175c7658a75SYinan Xu  val io = IO(new Bundle() {
176c7658a75SYinan Xu    val dp1Req = Vec(RenameWidth, Flipped(DecoupledIO(new MicroOp)))
177c7658a75SYinan Xu    val lsIdxs = Output(Vec(RenameWidth, new LSIdx))
178c7658a75SYinan Xu    val brqRedirect = Input(Valid(new Redirect))
179c7658a75SYinan Xu    val loadIn = Vec(LoadPipelineWidth, Flipped(Valid(new LsPipelineBundle)))
180c7658a75SYinan Xu    val storeIn = Vec(StorePipelineWidth, Flipped(Valid(new LsPipelineBundle)))
181c7658a75SYinan Xu    val sbuffer = Vec(StorePipelineWidth, Decoupled(new DCacheWordReq))
182c7658a75SYinan Xu    val ldout = Vec(2, DecoupledIO(new ExuOutput)) // writeback store
183c7658a75SYinan Xu    val stout = Vec(2, DecoupledIO(new ExuOutput)) // writeback store
184c7658a75SYinan Xu    val forward = Vec(LoadPipelineWidth, Flipped(new LoadForwardQueryIO))
185c7658a75SYinan Xu    val commits = Flipped(Vec(CommitWidth, Valid(new RoqCommit)))
186c7658a75SYinan Xu    val rollback = Output(Valid(new Redirect))
187c7658a75SYinan Xu    val dcache = new DCacheLineIO
188c7658a75SYinan Xu    val uncache = new DCacheWordIO
189c7658a75SYinan Xu    val roqDeqPtr = Input(new RoqPtr)
190c7658a75SYinan Xu    val oldestStore = Output(Valid(new RoqPtr))
191c7658a75SYinan Xu    val exceptionAddr = new ExceptionAddrIO
192c7658a75SYinan Xu  })
193c7658a75SYinan Xu
194c7658a75SYinan Xu  val loadQueue = Module(new LoadQueue)
195c7658a75SYinan Xu  val storeQueue = Module(new StoreQueue)
196c7658a75SYinan Xu
197c7658a75SYinan Xu  // load queue wiring
198c7658a75SYinan Xu  loadQueue.io.dp1Req <> io.dp1Req
199c7658a75SYinan Xu  loadQueue.io.brqRedirect <> io.brqRedirect
200c7658a75SYinan Xu  loadQueue.io.loadIn <> io.loadIn
201c7658a75SYinan Xu  loadQueue.io.storeIn <> io.storeIn
202c7658a75SYinan Xu  loadQueue.io.ldout <> io.ldout
203c7658a75SYinan Xu  loadQueue.io.commits <> io.commits
204c7658a75SYinan Xu  loadQueue.io.rollback <> io.rollback
205c7658a75SYinan Xu  loadQueue.io.dcache <> io.dcache
206c7658a75SYinan Xu  loadQueue.io.roqDeqPtr <> io.roqDeqPtr
207c7658a75SYinan Xu  loadQueue.io.exceptionAddr.lsIdx := io.exceptionAddr.lsIdx
208c7658a75SYinan Xu  loadQueue.io.exceptionAddr.isStore := DontCare
209c7658a75SYinan Xu
210c7658a75SYinan Xu  // store queue wiring
211c7658a75SYinan Xu  // storeQueue.io <> DontCare
212c7658a75SYinan Xu  storeQueue.io.dp1Req <> io.dp1Req
213c7658a75SYinan Xu  storeQueue.io.brqRedirect <> io.brqRedirect
214c7658a75SYinan Xu  storeQueue.io.storeIn <> io.storeIn
215c7658a75SYinan Xu  storeQueue.io.sbuffer <> io.sbuffer
216c7658a75SYinan Xu  storeQueue.io.stout <> io.stout
217c7658a75SYinan Xu  storeQueue.io.commits <> io.commits
218c7658a75SYinan Xu  storeQueue.io.roqDeqPtr <> io.roqDeqPtr
219c7658a75SYinan Xu  storeQueue.io.oldestStore <> io.oldestStore
220c7658a75SYinan Xu  storeQueue.io.exceptionAddr.lsIdx := io.exceptionAddr.lsIdx
221c7658a75SYinan Xu  storeQueue.io.exceptionAddr.isStore := DontCare
222c7658a75SYinan Xu
223c7658a75SYinan Xu  loadQueue.io.forward <> io.forward
224c7658a75SYinan Xu  storeQueue.io.forward <> io.forward // overlap forwardMask & forwardData, DO NOT CHANGE SEQUENCE
225c7658a75SYinan Xu
226c7658a75SYinan Xu  io.exceptionAddr.vaddr := Mux(io.exceptionAddr.isStore, storeQueue.io.exceptionAddr.vaddr, loadQueue.io.exceptionAddr.vaddr)
227c7658a75SYinan Xu
228c7658a75SYinan Xu  // naive uncache arbiter
229c7658a75SYinan Xu  val s_idle :: s_load :: s_store :: Nil = Enum(3)
230c7658a75SYinan Xu  val uncacheState = RegInit(s_idle)
231c7658a75SYinan Xu
232c7658a75SYinan Xu  switch(uncacheState){
233c7658a75SYinan Xu    is(s_idle){
234c7658a75SYinan Xu      when(io.uncache.req.fire()){
235c7658a75SYinan Xu        uncacheState := Mux(loadQueue.io.uncache.req.valid, s_load, s_store)
236c7658a75SYinan Xu      }
237c7658a75SYinan Xu    }
238c7658a75SYinan Xu    is(s_load){
239c7658a75SYinan Xu      when(io.uncache.resp.fire()){
240c7658a75SYinan Xu        uncacheState := s_idle
241c7658a75SYinan Xu      }
242c7658a75SYinan Xu    }
243c7658a75SYinan Xu    is(s_store){
244c7658a75SYinan Xu      when(io.uncache.resp.fire()){
245c7658a75SYinan Xu        uncacheState := s_idle
246c7658a75SYinan Xu      }
247c7658a75SYinan Xu    }
248c7658a75SYinan Xu  }
249c7658a75SYinan Xu
250c7658a75SYinan Xu  loadQueue.io.uncache := DontCare
251c7658a75SYinan Xu  storeQueue.io.uncache := DontCare
252c7658a75SYinan Xu  loadQueue.io.uncache.resp.valid := false.B
253c7658a75SYinan Xu  storeQueue.io.uncache.resp.valid := false.B
254c7658a75SYinan Xu  when(loadQueue.io.uncache.req.valid){
255c7658a75SYinan Xu    io.uncache.req <> loadQueue.io.uncache.req
256c7658a75SYinan Xu  }.otherwise{
257c7658a75SYinan Xu    io.uncache.req <> storeQueue.io.uncache.req
258c7658a75SYinan Xu  }
259c7658a75SYinan Xu  when(uncacheState === s_load){
260c7658a75SYinan Xu    io.uncache.resp <> loadQueue.io.uncache.resp
261c7658a75SYinan Xu  }.otherwise{
262c7658a75SYinan Xu    io.uncache.resp <> storeQueue.io.uncache.resp
263c7658a75SYinan Xu  }
264c7658a75SYinan Xu
265c7658a75SYinan Xu  assert(!(loadQueue.io.uncache.req.valid && storeQueue.io.uncache.req.valid))
266c7658a75SYinan Xu  assert(!(loadQueue.io.uncache.resp.valid && storeQueue.io.uncache.resp.valid))
267c7658a75SYinan Xu  assert(!((loadQueue.io.uncache.resp.valid || storeQueue.io.uncache.resp.valid) && uncacheState === s_idle))
268c7658a75SYinan Xu
269c7658a75SYinan Xu  // fix valid, allocate lq / sq index
270c7658a75SYinan Xu    (0 until RenameWidth).map(i => {
271c7658a75SYinan Xu      val isStore = CommitType.lsInstIsStore(io.dp1Req(i).bits.ctrl.commitType)
272*eb8f00f4SWilliam Wang      loadQueue.io.dp1Req(i).valid := !isStore && io.dp1Req(i).valid
273*eb8f00f4SWilliam Wang      storeQueue.io.dp1Req(i).valid := isStore && io.dp1Req(i).valid
274c7658a75SYinan Xu      loadQueue.io.lqIdxs(i) <> io.lsIdxs(i).lqIdx
275c7658a75SYinan Xu      storeQueue.io.sqIdxs(i) <> io.lsIdxs(i).sqIdx
276*eb8f00f4SWilliam Wang      loadQueue.io.lqReady <> storeQueue.io.lqReady
277*eb8f00f4SWilliam Wang      loadQueue.io.sqReady <> storeQueue.io.sqReady
278*eb8f00f4SWilliam Wang      io.lsIdxs(i).lsroqIdx := DontCare
279c7658a75SYinan Xu      io.dp1Req(i).ready := storeQueue.io.dp1Req(i).ready && loadQueue.io.dp1Req(i).ready
280c7658a75SYinan Xu    })
281c7658a75SYinan Xu  }
282*eb8f00f4SWilliam Wang}
283