xref: /XiangShan/src/main/scala/xiangshan/backend/issue/IssueQueue.scala (revision 8db72c71b2456cd46d489843914ffad7c41c08c8)
1package xiangshan.backend.issue
2
3import chipsalliance.rocketchip.config.Parameters
4import chisel3._
5import chisel3.util._
6import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
7import utility.HasCircularQueuePtrHelper
8import xiangshan._
9import xiangshan.backend.fu.{FuConfig, FuType}
10import xiangshan.mem.{MemWaitUpdateReq, SqPtr}
11import xiangshan.backend.Bundles.{DynInst, IssueQueueIssueBundle, IssueQueueWakeUpBundle}
12import xiangshan.backend.datapath.DataConfig._
13import xiangshan.backend.exu.ExeUnitParams
14
/**
  * Diplomatic wrapper of an issue queue.
  *
  * The concrete module implementation is chosen from `params.schdType`:
  *  - `IntScheduler` -> [[IssueQueueIntImp]]
  *  - `VfScheduler`  -> [[IssueQueueVfImp]]
  *  - `MemScheduler` -> [[IssueQueueMemAddrImp]] when the block has no std units
  *                      (`StdCnt == 0`), otherwise [[IssueQueueIntImp]]
  *
  * @param params parameters of the issue block this queue belongs to; also exposed
  *               implicitly (as `iqParams`) to the implementation classes
  */
class IssueQueue(params: IssueBlockParams)(implicit p: Parameters) extends LazyModule with HasXSParameter {
  implicit val iqParams: IssueBlockParams = params
  lazy val module = iqParams.schdType match {
    case IntScheduler() => new IssueQueueIntImp(this)
    case VfScheduler() => new IssueQueueVfImp(this)
    case MemScheduler() =>
      if (iqParams.StdCnt == 0) new IssueQueueMemAddrImp(this)
      else new IssueQueueIntImp(this)
    case other =>
      // A null module can never be instantiated; fail here with a readable message
      // instead of letting a NullPointerException surface later during elaboration.
      throw new IllegalArgumentException(s"IssueQueue does not support scheduler type $other")
  }
}
25
/**
  * Occupancy summary exported by an issue queue.
  *
  * @param numEnq number of enqueue ports; `leftVec` has `numEnq + 1` elements
  */
class IssueQueueStatusBundle(numEnq: Int) extends Bundle {
  /** High when the queue holds no valid entry. */
  val empty: Bool = Output(Bool())
  /** High when every entry is valid. */
  val full: Bool = Output(Bool())
  /** As driven by `IssueQueueImp`: element `k` is high when exactly `k` entries are free. */
  val leftVec: Vec[Bool] = Output(Vec(numEnq + 1, Bool()))
}
31
/** Response sent back to the issue queue for an issued uop; adds nothing to [[StatusArrayDeqRespBundle]]. */
class IssueQueueDeqRespBundle(implicit p: Parameters, params: IssueBlockParams)
  extends StatusArrayDeqRespBundle
33
/**
  * Port list shared by every issue queue flavour.
  *
  * Sizes are taken from the implicit [[IssueBlockParams]]: `numEnq` enqueue ports,
  * `numDeq` response ports per response stage and `numWakeupFromWB` wakeup ports.
  */
class IssueQueueIO()(implicit p: Parameters, params: IssueBlockParams) extends XSBundle {
  /** Redirect; while valid, no enqueue is performed in that cycle. */
  val flush: ValidIO[Redirect] = Flipped(ValidIO(new Redirect))

  /** Uops entering the queue. */
  val enq: Vec[DecoupledIO[DynInst]] = Vec(params.numEnq, Flipped(DecoupledIO(new DynInst)))

  /** Uops selected for issue, one port per execution unit. */
  val deq: MixedVec[DecoupledIO[IssueQueueIssueBundle]] = params.genIssueDecoupledBundle
  /** Responses for issued uops; `IssueQueueImp` looks for `issueSuccess` on this port. */
  val deqResp: Vec[ValidIO[IssueQueueDeqRespBundle]] =
    Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  /** Responses for which `IssueQueueImp` checks `rfArbitFail`. */
  val og0Resp: Vec[ValidIO[IssueQueueDeqRespBundle]] =
    Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  /** Responses for which `IssueQueueImp` checks `fuBusy`. */
  val og1Resp: Vec[ValidIO[IssueQueueDeqRespBundle]] =
    Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  /** Write-back busy tables read by the queue to mask entries that must not issue. */
  val wbBusyTableRead = Input(params.genWbFuBusyTableReadBundle())
  /** Wakeup broadcasts used to mark source operands ready. */
  val wakeup: Vec[ValidIO[IssueQueueWakeUpBundle]] =
    Vec(params.numWakeupFromWB, Flipped(ValidIO(new IssueQueueWakeUpBundle(params.pregBits))))
  /** Occupancy computed from the currently valid entries. */
  val status: IssueQueueStatusBundle = Output(new IssueQueueStatusBundle(params.numEnq))
  /** Occupancy computed from the valid entries plus this cycle's accepted enqueues. */
  val statusNext: IssueQueueStatusBundle = Output(new IssueQueueStatusBundle(params.numEnq))
  // Todo: wake up bundle
}
49
/**
  * Implementation shared by all issue queue flavours.
  *
  * Every queue entry is addressed by a one-hot index that is common to all storage
  * structures instantiated here:
  *  - `statusArray` holds the scheduling state; its `valid`, `canIssue` and `clear`
  *    vectors are read back below,
  *  - `immArray` and `payloadArray` hold the immediate and the whole [[DynInst]],
  *  - `fuTypeRegVec` keeps a register copy of each entry's fuType, used to decide
  *    which deq port may take the entry and which latency it has.
  *
  * Enqueue slots come from `enqPolicy`. For dequeue, each port combines the result of
  * an `AgeDetector` with the result of its own `DeqPolicy`. Subclasses replace `io`
  * with an extended bundle and add flavour-specific wiring on top.
  */
class IssueQueueImp(override val wrapper: IssueQueue)(implicit p: Parameters, val params: IssueBlockParams)
  extends LazyModuleImp(wrapper)
  with HasXSParameter {

  println(s"[IssueQueueImp] ${params.getIQName} wakeupFromWB: ${params.numWakeupFromWB}, " +
    s"numEntries: ${params.numEntries}, numRegSrc: ${params.numRegSrc}")

  require(params.numExu <= 2, "IssueQueue has not supported more than 2 deq ports")
  // Elaboration-time views of the execution units behind each deq port.
  val deqFuCfgs     : Seq[Seq[FuConfig]] = params.exuBlockParams.map(_.fuConfigs)
  // Per deq port: optional list of (fuType, latency) pairs.
  val fuLatencyMaps :  Seq[Option[Seq[(Int, Int)]]]  = params.exuBlockParams.map(x => x.fuLatencyMap)
  val intFuLatencyMaps: Seq[Option[Seq[(Int, Int)]]]  = params.exuBlockParams.map(x => x.intFuLatencyMap)
  val vfFuLatencyMaps : Seq[Option[Seq[(Int, Int)]]]  = params.exuBlockParams.map(x => x.vfFuLatencyMap)
  val latencyValMaxs: Seq[Option[Int]] = params.exuBlockParams.map(x => x.latencyValMax)
  val allDeqFuCfgs: Seq[FuConfig] = params.exuBlockParams.flatMap(_.fuConfigs)
  // How many deq ports offer each fu config; configs offered by more than one port are "common".
  val fuCfgsCnt     : Map[FuConfig, Int] = allDeqFuCfgs.groupBy(x => x).map { case (cfg, cfgSeq) => (cfg, cfgSeq.length) }
  val commonFuCfgs  : Seq[FuConfig] = fuCfgsCnt.filter(_._2 > 1).keys.toSeq
  println(s"[IssueQueueImp] ${params.getIQName} commonFuCfgs: ${commonFuCfgs.map(_.name)}")
  lazy val io = IO(new IssueQueueIO())
  dontTouch(io.deq)
  dontTouch(io.deqResp)
  // Modules
  val statusArray   = Module(StatusArray(p, params))
  val immArray      = Module(new DataArray(UInt(XLEN.W), params.numDeq, params.numEnq, params.numEntries))
  val payloadArray  = Module(new DataArray(Output(new DynInst), params.numDeq, params.numEnq, params.numEntries))
  val enqPolicy     = Module(new EnqPolicy)
  // A deq policy exists only for ports that have at least one fu config.
  val subDeqPolicies  = deqFuCfgs.map(x => if (x.nonEmpty) Some(Module(new DeqPolicy())) else None)
  // One register per deq port whose maximum latency is positive, `latencyValMax` bits wide.
  val fuBusyTable = latencyValMaxs.map { case y => if (y.getOrElse(0)>0) Some(Reg(UInt(y.getOrElse(1).W))) else None }

  // Wires
  // Response ports in the order: deqResp, og0Resp, og1Resp.
  val resps = Seq(io.deqResp, io.og0Resp, io.og1Resp)

  val intWbBusyTableRead = io.wbBusyTableRead.map(_.intWbBusyTable)
  val vfWbBusyTableRead = io.wbBusyTableRead.map(_.vfWbBusyTable)
  // Per deq port: entries (one bit each) that are excluded from selection.
  val fuBusyTableMask = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  val wbBusyTableMask = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  val s0_enqValidVec = io.enq.map(_.valid)
  val s0_enqSelValidVec = Wire(Vec(params.numEnq, Bool()))
  val s0_enqSelOHVec = Wire(Vec(params.numEnq, UInt(params.numEntries.W)))
  val s0_enqNotFlush = !io.flush.valid
  // Copy of the enqueued uops; subclasses may override individual fields of this wire.
  val s0_enqBits = WireInit(VecInit(io.enq.map(_.bits)))
  val s0_doEnqSelValidVec = s0_enqSelValidVec.map(_ && s0_enqNotFlush)
  // One-hot entry written by each enq port, or zero when that port does not enqueue.
  val s0_doEnqOH: Vec[UInt] = VecInit((s0_doEnqSelValidVec zip s0_enqSelOHVec).map { case (valid, oh) =>
    Mux(valid, oh, 0.U)
  })

  val s0_enqImmValidVec = io.enq.map(enq => enq.valid)
  val s0_enqImmVec = VecInit(io.enq.map(_.bits.imm))

  // One deq port only need one special deq policy
  val subDeqSelValidVec: Seq[Option[Vec[Bool]]] = subDeqPolicies.map(_.map(_ => Wire(Vec(params.numDeq, Bool()))))
  val subDeqSelOHVec: Seq[Option[Vec[UInt]]] = subDeqPolicies.map(_.map(_ => Wire(Vec(params.numDeq, UInt(params.numEntries.W)))))

  val finalDeqSelValidVec = Wire(Vec(params.numDeq, Bool()))
  val finalDeqSelOHVec    = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  // Selected entry per deq port, forced to zero when the selection is not valid.
  val finalDeqOH: IndexedSeq[UInt] = (finalDeqSelValidVec zip finalDeqSelOHVec).map { case (valid, oh) =>
    Mux(valid, oh, 0.U)
  }
  val finalDeqMask: UInt = finalDeqOH.reduce(_ | _)

  val deqRespVec = io.deqResp

  val validVec = VecInit(statusArray.io.valid.asBools)
  val canIssueVec = VecInit(statusArray.io.canIssue.asBools)
  val clearVec = VecInit(statusArray.io.clear.asBools)
  val deqFirstIssueVec = VecInit(statusArray.io.deq.map(_.isFirstIssue))

  // Source-ready bypass: a source of an enqueuing uop is treated as ready when any
  // wakeup port reports a hit on its (psrc, srcType) in the same cycle.
  val wakeupEnqSrcStateBypass = Wire(Vec(io.enq.size, Vec(io.enq.head.bits.srcType.size, SrcState())))
  for (i <- io.enq.indices) {
    for (j <- s0_enqBits(i).srcType.indices) {
      wakeupEnqSrcStateBypass(i)(j) := Cat(
        io.wakeup.map(x => x.bits.wakeUp(Seq((s0_enqBits(i).psrc(j), s0_enqBits(i).srcType(j))), x.valid).head)
      ).orR
    }
  }

  statusArray.io match { case statusArrayIO: StatusArrayIO =>
    statusArrayIO.flush  <> io.flush
    statusArrayIO.wakeup <> io.wakeup
    statusArrayIO.enq.zipWithIndex.foreach { case (enq: ValidIO[StatusArrayEnqBundle], i) =>
      enq.valid                 := s0_doEnqSelValidVec(i)
      enq.bits.addrOH           := s0_enqSelOHVec(i)
      // Only the sources present on both sides are connected.
      val numLSrc = s0_enqBits(i).srcType.size.min(enq.bits.data.srcType.size)
      for (j <- 0 until numLSrc) {
        enq.bits.data.srcState(j) := s0_enqBits(i).srcState(j) | wakeupEnqSrcStateBypass(i)(j)
        enq.bits.data.psrc(j)     := s0_enqBits(i).psrc(j)
        enq.bits.data.srcType(j)  := s0_enqBits(i).srcType(j)
      }
      enq.bits.data.robIdx      := s0_enqBits(i).robIdx
      enq.bits.data.ready       := false.B
      enq.bits.data.issued      := false.B
      enq.bits.data.firstIssue  := false.B
      enq.bits.data.blocked     := false.B
    }
    statusArrayIO.deq.zipWithIndex.foreach { case (deq, i) =>
      deq.deqSelOH.valid  := finalDeqSelValidVec(i)
      deq.deqSelOH.bits   := finalDeqSelOHVec(i)
    }
    // The three response stages are forwarded to the status array field by field.
    statusArrayIO.deqResp.zipWithIndex.foreach { case (deqResp, i) =>
      deqResp.valid      := io.deqResp(i).valid
      deqResp.bits.addrOH := io.deqResp(i).bits.addrOH
      deqResp.bits.success := io.deqResp(i).bits.success
      deqResp.bits.dataInvalidSqIdx := io.deqResp(i).bits.dataInvalidSqIdx
      deqResp.bits.respType := io.deqResp(i).bits.respType
      deqResp.bits.rfWen := io.deqResp(i).bits.rfWen
      deqResp.bits.fuType := io.deqResp(i).bits.fuType
    }
    statusArrayIO.og0Resp.zipWithIndex.foreach { case (og0Resp, i) =>
      og0Resp.valid := io.og0Resp(i).valid
      og0Resp.bits.addrOH := io.og0Resp(i).bits.addrOH
      og0Resp.bits.success := io.og0Resp(i).bits.success
      og0Resp.bits.dataInvalidSqIdx := io.og0Resp(i).bits.dataInvalidSqIdx
      og0Resp.bits.respType := io.og0Resp(i).bits.respType
      og0Resp.bits.rfWen := io.og0Resp(i).bits.rfWen
      og0Resp.bits.fuType := io.og0Resp(i).bits.fuType
    }
    statusArrayIO.og1Resp.zipWithIndex.foreach { case (og1Resp, i) =>
      og1Resp.valid := io.og1Resp(i).valid
      og1Resp.bits.addrOH := io.og1Resp(i).bits.addrOH
      og1Resp.bits.success := io.og1Resp(i).bits.success
      og1Resp.bits.dataInvalidSqIdx := io.og1Resp(i).bits.dataInvalidSqIdx
      og1Resp.bits.respType := io.og1Resp(i).bits.respType
      og1Resp.bits.rfWen := io.og1Resp(i).bits.rfWen
      og1Resp.bits.fuType := io.og1Resp(i).bits.fuType
    }
  }

  // Immediate storage: written on enqueue, read with the (valid-gated) deq selection.
  val immArrayRdataVec = immArray.io.read.map(_.data)
  immArray.io match { case immArrayIO: DataArrayIO[UInt] =>
    immArrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i) && s0_enqImmValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      w.data := s0_enqImmVec(i)
    }
    immArrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqOH(i)
    }
  }

  // Payload storage: same addressing as the immediate array.
  val payloadArrayRdata = Wire(Vec(params.numDeq, Output(new DynInst)))
  payloadArray.io match { case payloadArrayIO: DataArrayIO[DynInst] =>
    payloadArrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      w.data := s0_enqBits(i)
    }
    payloadArrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqOH(i)
      payloadArrayRdata(i) := r.data
    }
  }

  // fuType of every entry; holds its value unless the entry is written by an enqueue.
  val fuTypeRegVec = Reg(Vec(params.numEntries, FuType()))
  val fuTypeNextVec = WireInit(fuTypeRegVec)
  fuTypeRegVec := fuTypeNextVec

  s0_doEnqSelValidVec.zip(s0_enqSelOHVec).zipWithIndex.foreach { case ((valid, oh), i) =>
    when (valid) {
      fuTypeNextVec(OHToUInt(oh)) := s0_enqBits(i).fuType
    }
  }

  enqPolicy match { case ep =>
    ep.io.valid     := validVec.asUInt
    // An enq port really enqueues when it is valid, the policy found a slot and the port is ready.
    s0_enqSelValidVec  := ep.io.enqSelOHVec.map(oh => oh.valid).zip(s0_enqValidVec).zip(io.enq).map { case((sel, enqValid), enq) => enqValid && sel && enq.ready}
    s0_enqSelOHVec     := ep.io.enqSelOHVec.map(oh => oh.bits)
  }

  // Per entry: its fuType belongs to a config offered by more than one deq port.
  protected val commonAccept: UInt = Cat(fuTypeRegVec.map(fuType =>
    Cat(commonFuCfgs.map(_.fuType.U === fuType)).orR
  ).reverse)

  // if deq port can accept the uop
  protected val canAcceptVec: Seq[UInt] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    Cat(fuTypeRegVec.map(fuType => Cat(fuCfgs.map(_.fuType.U === fuType)).orR).reverse).asUInt
  }

  protected val deqCanAcceptVec: Seq[IndexedSeq[Bool]] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    fuTypeRegVec.map(fuType =>
      Cat(fuCfgs.map(_.fuType.U === fuType)).asUInt.orR) // C+E0    C+E1
  }

  // Each deq policy only sees entries that can issue, match the port's fu configs
  // and are not masked by either busy table.
  subDeqPolicies.zipWithIndex.foreach { case (dpOption: Option[DeqPolicy], i) =>
    if (dpOption.nonEmpty) {
      val dp = dpOption.get
      dp.io.request             := canIssueVec.asUInt & VecInit(deqCanAcceptVec(i)).asUInt & (~fuBusyTableMask(i)).asUInt & (~wbBusyTableMask(i)).asUInt
      subDeqSelValidVec(i).get  := dp.io.deqSelOHVec.map(oh => oh.valid)
      subDeqSelOHVec(i).get     := dp.io.deqSelOHVec.map(oh => oh.bits)
    }
  }

  protected val enqCanAcceptVec: Seq[IndexedSeq[Bool]] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    io.enq.map(_.bits.fuType).map(fuType =>
      Cat(fuCfgs.map(_.fuType.U === fuType)).asUInt.orR) // C+E0    C+E1
  }

  // Per deq port, the enqueue one-hots restricted to uops that port can execute.
  val ageDetectorEnqVec: Vec[Vec[UInt]] = WireInit(VecInit(Seq.fill(params.numDeq)(VecInit(Seq.fill(params.numEnq)(0.U(params.numEntries.W))))))

  ageDetectorEnqVec.zip(enqCanAcceptVec) foreach {
    case (ageDetectorEnq, enqCanAccept) =>
      ageDetectorEnq := enqCanAccept.zip(s0_doEnqOH).map {
        case (enqCanAccept, s0_doEnqOH) => Mux(enqCanAccept, s0_doEnqOH, 0.U)
      }
  }

  val oldestSelVec = (0 until params.numDeq).map {
    case deqIdx =>
      AgeDetector(numEntries = params.numEntries,
        enq = ageDetectorEnqVec(deqIdx),
        deq = clearVec.asUInt,
        canIssue = canIssueVec.asUInt & (~fuBusyTableMask(deqIdx)).asUInt)
  }

  // Port 0: take the AgeDetector's pick when it is valid, otherwise the first pick of the deq policy.
  finalDeqSelValidVec.head := oldestSelVec.head.valid || subDeqSelValidVec.head.getOrElse(Seq(false.B)).head
  finalDeqSelOHVec.head := Mux(oldestSelVec.head.valid, oldestSelVec.head.bits, subDeqSelOHVec.head.getOrElse(Seq(0.U)).head)

  // Port 1 must not pick the entry already taken by port 0. Priority:
  //   1. the AgeDetector's pick, if valid and different from port 0's entry,
  //   2. the policy's first pick, if different from port 0's entry,
  //   3. the policy's last pick.
  if (params.numDeq == 2) {
    val chooseOldest = oldestSelVec(1).valid && oldestSelVec(1).bits =/= finalDeqSelOHVec.head
    val choose1stSub = subDeqSelOHVec(1).getOrElse(Seq(0.U)).head =/= finalDeqSelOHVec.head

    finalDeqSelValidVec(1) := MuxCase(subDeqSelValidVec(1).getOrElse(Seq(false.B)).last, Seq(
      (chooseOldest) -> oldestSelVec(1).valid,
      (choose1stSub) -> subDeqSelValidVec(1).getOrElse(Seq(false.B)).head)
    )
    finalDeqSelOHVec(1) := MuxCase(subDeqSelOHVec(1).getOrElse(Seq(0.U)).last, Seq(
      (chooseOldest) -> oldestSelVec(1).bits,
      (choose1stSub) -> subDeqSelOHVec(1).getOrElse(Seq(0.U)).head)
    )
  }

  /**
    * Latency vector of the uop stored at `addrOH`, as seen by deq port `deqIdx`.
    *
    * One bit is produced per latency value `1 .. latencyValMax`; the bit for a latency
    * is set when the entry's fuType is listed with that latency in `fuLatencyMaps(deqIdx)`.
    * Because the bits are concatenated with `Cat`, latency 1 ends up in the most
    * significant bit.
    */
  private def deqLatencyVec(deqIdx: Int, addrOH: UInt): UInt = {
    val deqFuType = fuTypeRegVec(OHToUInt(addrOH))
    Cat((0 until latencyValMaxs(deqIdx).get).map { case num =>
      val latencyNumFuType = fuLatencyMaps(deqIdx).get.filter(_._2 == num+1).map(_._1) // futype with latency equal to num+1
      val isLatencyNum = Cat(latencyNumFuType.map(futype => deqFuType === futype.U)).asUInt.orR // The latency of the deq inst is Num
      isLatencyNum
    })
  }

  /**
    * For every busy bit, the set of entries (one bit per entry) that it blocks.
    *
    * Bit `idx` of `busyBits`, when set, blocks all entries whose fuType is listed in
    * `latencyMap` with latency `idx`; when clear it blocks nothing.
    */
  private def latencyBlockedEntries(busyBits: Seq[Bool], latencyMap: Seq[(Int, Int)]): Seq[UInt] =
    busyBits.zipWithIndex.map { case (en, idx) =>
      val isLatencyNumVec = WireInit(0.U(params.numEntries.W))
      when(en) {
        val latencyNumFuType = latencyMap.filter(_._2 == idx).map(_._1)
        isLatencyNumVec := VecInit(fuTypeRegVec.map { case futype =>
          val isLatencyNum = Cat(latencyNumFuType.map(_.U === futype)).asUInt.orR
          isLatencyNum
        }).asUInt
      }
      isLatencyNumVec
    }

  // fuBusyTable write
  // Every cycle the table shifts left by one. A successful issue ORs in the latency
  // vector of the issued uop; an rfArbitFail (og0) or fuBusy (og1) response ANDs in
  // an inverted, left-shifted latency vector of the responding uop.
  for (i <- 0 until params.numDeq){
    if (fuBusyTable(i).nonEmpty) {
      val isLatencyNumVec = Mux(resps(0)(i).valid && resps(0)(i).bits.respType === RSFeedbackType.issueSuccess,
        deqLatencyVec(i, io.deqResp(i).bits.addrOH),
        0.U
      ) // |  when N cycle is 2 latency, N+1 cycle could not 1 latency
      val isLNumVecOg0 = WireInit(~(0.U.asTypeOf(isLatencyNumVec)))
      isLNumVecOg0 := Mux(resps(1)(i).valid && resps(1)(i).bits.respType === RSFeedbackType.rfArbitFail,
        ~(Cat(deqLatencyVec(i, io.og0Resp(i).bits.addrOH), 0.U(1.W))),
        ~(0.U.asTypeOf(isLatencyNumVec))
        // & ~
      )
      val isLNumVecOg1 = WireInit(~(0.U.asTypeOf(isLatencyNumVec)))
      isLNumVecOg1 := Mux(resps(2)(i).valid && resps(2)(i).bits.respType === RSFeedbackType.fuBusy,
        ~(Cat(deqLatencyVec(i, io.og1Resp(i).bits.addrOH), 0.U(2.W))),
        ~(0.U.asTypeOf(isLatencyNumVec))
      )
      // & ~


      fuBusyTable(i).get := ((fuBusyTable(i).get << 1.U).asUInt | isLatencyNumVec) & isLNumVecOg0.asUInt & isLNumVecOg1.asUInt
    }
  }

  for (i <- 0 until params.numDeq){
    // fuBusyTable read
    if(fuBusyTable(i).nonEmpty){
      // The table is read most-significant bit first.
      val isReadLatencyNumVec2 = latencyBlockedEntries(fuBusyTable(i).get.asBools.reverse, fuLatencyMaps(i).get)
      if ( latencyValMaxs(i).get > 1 ){
        fuBusyTableMask(i) := isReadLatencyNumVec2.reduce(_ | _)
      }else{
        fuBusyTableMask(i) := isReadLatencyNumVec2.head
      }
    } else {
      fuBusyTableMask(i) := 0.U(params.numEntries.W)
    }

    // intWbFuBusyTable read
    val intWbBusyTableMask = if (intWbBusyTableRead(i).isDefined) {
      latencyBlockedEntries(intWbBusyTableRead(i).get.asBools, intFuLatencyMaps(i).get).fold(0.U)(_ | _)
    } else {
      0.U(params.numEntries.W)
    }
    // vfWbFuBusyTable read
    val vfWbBusyTableMask = if (vfWbBusyTableRead(i).isDefined) {
      latencyBlockedEntries(vfWbBusyTableRead(i).get.asBools, vfFuLatencyMaps(i).get).fold(0.U)(_ | _)
    } else {
      0.U(params.numEntries.W)
    }

    wbBusyTableMask(i) := intWbBusyTableMask | vfWbBusyTableMask
  }

  // Issue ports: selection result plus the fields read back from the payload / imm arrays.
  io.deq.zipWithIndex.foreach { case (deq, i) =>
    deq.valid                := finalDeqSelValidVec(i)
    deq.bits.addrOH          := finalDeqSelOHVec(i)
    deq.bits.common.isFirstIssue := deqFirstIssueVec(i)
    deq.bits.common.iqIdx    := OHToUInt(finalDeqSelOHVec(i))
    deq.bits.common.fuType   := payloadArrayRdata(i).fuType
    deq.bits.common.fuOpType := payloadArrayRdata(i).fuOpType
    deq.bits.common.rfWen.foreach(_ := payloadArrayRdata(i).rfWen)
    deq.bits.common.fpWen.foreach(_ := payloadArrayRdata(i).fpWen)
    deq.bits.common.vecWen.foreach(_ := payloadArrayRdata(i).vecWen)
    deq.bits.common.flushPipe.foreach(_ := payloadArrayRdata(i).flushPipe)
    deq.bits.common.pdest := payloadArrayRdata(i).pdest
    deq.bits.common.robIdx := payloadArrayRdata(i).robIdx
    deq.bits.common.imm := immArrayRdataVec(i)
    deq.bits.rf.zip(payloadArrayRdata(i).psrc).foreach { case (rf, psrc) =>
      rf.foreach(_.addr := psrc) // psrc in payload array can be pregIdx of IntRegFile or VfRegFile
    }
    deq.bits.rf.zip(payloadArrayRdata(i).srcType).foreach { case (rf, srcType) =>
      rf.foreach(_.srcType := srcType) // srcType tells which register file the psrc refers to
    }
    deq.bits.srcType.zip(payloadArrayRdata(i).srcType).foreach { case (sink, source) =>
      sink := source
    }
    deq.bits.immType := payloadArrayRdata(i).selImm
  }

  // Todo: better counter implementation
  private val validCnt = PopCount(validVec)
  private val enqSelCnt = PopCount(s0_doEnqSelValidVec)
  private val validCntNext = validCnt + enqSelCnt
  io.status.full := validVec.asUInt.andR
  io.status.empty := !validVec.asUInt.orR
  // leftVec(k) is high when exactly k entries are free (k = 0 means full).
  io.status.leftVec(0) := io.status.full
  for (i <- 0 until params.numEnq) {
    io.status.leftVec(i + 1) := validCnt === (params.numEntries - (i + 1)).U
  }
  io.statusNext.full := validCntNext === params.numEntries.U
  io.statusNext.empty := validCntNext === 0.U // always false now
  io.statusNext.leftVec(0) := io.statusNext.full
  for (i <- 0 until params.numEnq) {
    io.statusNext.leftVec(i + 1) := validCntNext === (params.numEntries - (i + 1)).U
  }
  // All enq ports share one ready: it is high only while more than numEnq entries are free.
  io.enq.foreach(_.ready := !Cat(io.status.leftVec).orR) // Todo: more efficient implementation
}
421
/** Program counter and target address attached to a uop; both fields are `VAddrData` wide. */
class IssueQueueJumpBundle extends Bundle {
  val pc: UInt = UInt(VAddrData().dataWidth.W)
  val target: UInt = UInt(VAddrData().dataWidth.W)
}
426
/** Fast-match information for loads: one match bit per load unit plus a 12-bit immediate. */
class IssueQueueLoadBundle(implicit p: Parameters) extends XSBundle {
  val fastMatch: UInt = UInt(backendParams.LduCnt.W)
  val fastImm: UInt = UInt(12.W)
}
431
/** [[IssueQueueIO]] extended with the jump information port, present only when PC read ports exist. */
class IssueQueueIntIO()(implicit p: Parameters, params: IssueBlockParams) extends IssueQueueIO {
  val enqJmp: Option[Vec[IssueQueueJumpBundle]] =
    if (params.numPcReadPort > 0) {
      Some(Input(Vec(params.numPcReadPort, new IssueQueueJumpBundle)))
    } else {
      None
    }
}
435
/**
  * Issue queue implementation used for the integer scheduler (and, per [[IssueQueue]],
  * for memory issue blocks that contain std units).
  *
  * On top of [[IssueQueueImp]] it optionally stores a PC and a target address per entry
  * (when `params.needPc` holds) and forwards the branch / store / fpu related payload
  * fields to the issue ports that carry them.
  */
class IssueQueueIntImp(override val wrapper: IssueQueue)(implicit p: Parameters, iqParams: IssueBlockParams)
  extends IssueQueueImp(wrapper)
{
  // `io` is replaced by the extended bundle below; the surrounding suggestName calls
  // are kept exactly as in the other implementations that override `io`.
  io.suggestName("none")
  override lazy val io = IO(new IssueQueueIntIO).suggestName("io")

  // Per-entry PC and target storage, only instantiated when the block needs a PC.
  val pcArray: Option[DataArray[UInt]] =
    if (params.needPc) {
      Some(Module(new DataArray(UInt(VAddrData().dataWidth.W), params.numDeq, params.numEnq, params.numEntries)))
    } else {
      None
    }
  val targetArray: Option[DataArray[UInt]] =
    if (params.needPc) {
      Some(Module(new DataArray(UInt(VAddrData().dataWidth.W), params.numDeq, params.numEnq, params.numEntries)))
    } else {
      None
    }

  // PC array: read with the deq selection, written on enqueue.
  pcArray.foreach { array =>
    for ((rd, deqIdx) <- array.io.read.zipWithIndex) {
      rd.addr := finalDeqSelOHVec(deqIdx)
    }
    for ((wr, enqIdx) <- array.io.write.zipWithIndex) {
      wr.en := s0_doEnqSelValidVec(enqIdx)
      wr.addr := s0_enqSelOHVec(enqIdx)
      // The PC is taken from the enqueued uop itself, not from io.enqJmp.
      wr.data := io.enq(enqIdx).bits.pc
    }
  }

  // Target array: same addressing, data comes from io.enqJmp.
  targetArray.foreach { array =>
    for ((rd, deqIdx) <- array.io.read.zipWithIndex) {
      rd.addr := finalDeqSelOHVec(deqIdx)
    }
    for ((wr, enqIdx) <- array.io.write.zipWithIndex) {
      wr.en := s0_doEnqSelValidVec(enqIdx)
      wr.addr := s0_enqSelOHVec(enqIdx)
      wr.data := io.enqJmp.get(enqIdx).target
    }
  }

  for ((deq, i) <- io.deq.zipWithIndex) {
    val common = deq.bits.common
    deq.bits.jmp.foreach { jmp =>
      jmp.pc := pcArray.get.io.read(i).data
      jmp.target := targetArray.get.io.read(i).data
    }
    common.preDecode.foreach(_ := payloadArrayRdata(i).preDecodeInfo)
    common.ftqIdx.foreach(_ := payloadArrayRdata(i).ftqPtr)
    common.ftqOffset.foreach(_ := payloadArrayRdata(i).ftqOffset)
    common.predictInfo.foreach { info =>
      info.target := targetArray.get.io.read(i).data
      info.taken := payloadArrayRdata(i).pred_taken
    }
    // for std
    common.sqIdx.foreach(_ := payloadArrayRdata(i).sqIdx)
    // for i2f
    common.fpu.foreach(_ := payloadArrayRdata(i).fpu)
  }
}
491
/**
  * Issue queue implementation used for the vector / floating-point scheduler.
  *
  * It re-drives the source fields of the status array enqueue ports (these connections
  * come after, and therefore take precedence over, the ones made in [[IssueQueueImp]])
  * and forwards the fpu / vpu payload fields to the issue ports.
  */
class IssueQueueVfImp(override val wrapper: IssueQueue)(implicit p: Parameters, iqParams: IssueBlockParams)
  extends IssueQueueImp(wrapper)
{
  for ((enq, i) <- statusArray.io.enq.zipWithIndex) {
    val enqData = enq.bits.data
    val uop = s0_enqBits(i)
    // Connect only as many sources as exist on both sides.
    val numLSrc = uop.srcType.size min enqData.srcType.size
    val numPSrc = uop.srcState.size min enqData.srcState.size

    (0 until numPSrc).foreach { j =>
      enqData.srcState(j) := uop.srcState(j) | wakeupEnqSrcStateBypass(i)(j)
      enqData.psrc(j)     := uop.psrc(j)
    }

    (0 until numLSrc).foreach { j =>
      enqData.srcType(j) := uop.srcType(j)
    }
    // Sources 3 and 4, when present, are always vector registers.
    if (enqData.srcType.isDefinedAt(3)) enqData.srcType(3) := SrcType.vp // v0: mask src
    if (enqData.srcType.isDefinedAt(4)) enqData.srcType(4) := SrcType.vp // vl&vtype
  }

  for ((deq, i) <- io.deq.zipWithIndex) {
    val common = deq.bits.common
    common.fpu.foreach(_ := payloadArrayRdata(i).fpu)
    common.vpu.foreach(_ := payloadArrayRdata(i).vpu)
    // The uop index overrides the corresponding field of the vpu bundle assigned just above.
    common.vpu.foreach(_.vuopIdx := payloadArrayRdata(i).uopIdx)
  }
}
518
/** Memory-specific ports of an issue queue. */
class IssueQueueMemBundle(implicit p: Parameters, params: IssueBlockParams) extends Bundle {
  /** Fast / slow feedback, one channel per deq port. */
  val feedbackIO: Vec[MemRSFeedbackIO] = Flipped(Vec(params.numDeq, new MemRSFeedbackIO))
  /** Inputs used to decide whether an entry still has to wait for a store. */
  val checkWait = new Bundle {
    val stIssuePtr: SqPtr = Input(new SqPtr)
    val memWaitUpdateReq: MemWaitUpdateReq = Flipped(new MemWaitUpdateReq)
  }
  /** Load fast-match outputs, one per load unit. */
  val loadFastMatch: Vec[IssueQueueLoadBundle] = Output(Vec(params.LduCnt, new IssueQueueLoadBundle))
}
527
/** [[IssueQueueIO]] extended with the memory-specific ports, which are always present here. */
class IssueQueueMemIO(implicit p: Parameters, params: IssueBlockParams) extends IssueQueueIO {
  val memIO: Some[IssueQueueMemBundle] = Some(new IssueQueueMemBundle)
}
531
/**
  * Issue queue implementation for memory address issue blocks (no std units).
  *
  * On top of [[IssueQueueImp]] it
  *  - recomputes `loadWaitBit` of every enqueuing uop from the store issue state,
  *  - fills the memory-specific fields of the status array enqueue ports,
  *  - forwards the fast / slow memory feedback and the store wait information
  *    to the status array,
  *  - drives the sqIdx / lqIdx (and, for load address queues, ftq) fields of the issue ports.
  *
  * The deqResp / og0Resp / og1Resp ports of the status array are already wired by
  * [[IssueQueueImp]] and are not touched here.
  */
class IssueQueueMemAddrImp(override val wrapper: IssueQueue)(implicit p: Parameters, params: IssueBlockParams)
  extends IssueQueueImp(wrapper) with HasCircularQueuePtrHelper {

  require(params.StdCnt == 0 && (params.LduCnt + params.StaCnt + params.VlduCnt) > 0, "IssueQueueMemAddrImp can only be instance of MemAddr IQ")

  io.suggestName("none")
  override lazy val io = IO(new IssueQueueMemIO).suggestName("io")
  private val memIO = io.memIO.get

  for (i <- io.enq.indices) {
    val blockNotReleased = isAfter(io.enq(i).bits.sqIdx, memIO.checkWait.stIssuePtr)
    // The store this uop waits for is being issued on one of the sta issue ports.
    // The port index gets its own name so that it cannot shadow the enqueue index `i`:
    // every sta port has to be compared against the uop on enq port `i`.
    val storeAddrWaitForIsIssuing = VecInit((0 until StorePipelineWidth).map { staIdx =>
      val staIssue = memIO.checkWait.memWaitUpdateReq.staIssue(staIdx)
      staIssue.valid && staIssue.bits.uop.robIdx.value === io.enq(i).bits.waitForRobIdx.value
    }).asUInt.orR && !io.enq(i).bits.loadWaitStrict // is waiting for store addr ready
    s0_enqBits(i).loadWaitBit := io.enq(i).bits.loadWaitBit && !storeAddrWaitForIsIssuing && blockNotReleased
  }

  // Memory-specific enqueue fields of the status array.
  for (i <- statusArray.io.enq.indices) {
    val enqData = statusArray.io.enq(i).bits.data
    enqData.blocked := s0_enqBits(i).loadWaitBit
    enqData.mem.get.strictWait := s0_enqBits(i).loadWaitStrict
    enqData.mem.get.waitForStd := false.B
    enqData.mem.get.waitForRobIdx := s0_enqBits(i).waitForRobIdx
    enqData.mem.get.waitForSqIdx := 0.U.asTypeOf(enqData.mem.get.waitForSqIdx) // generated by sq, will be updated later
    enqData.mem.get.sqIdx := s0_enqBits(i).sqIdx
  }

  // The wiring below does not depend on the enqueue port, so it is made once,
  // outside of the per-enq loop.
  statusArray.io.fromMem.get.slowResp.zipWithIndex.foreach { case (slowResp, deqIdx) =>
    val feedbackSlow = memIO.feedbackIO(deqIdx).feedbackSlow
    slowResp.valid                 := feedbackSlow.valid
    slowResp.bits.addrOH           := UIntToOH(feedbackSlow.bits.rsIdx)
    slowResp.bits.success          := feedbackSlow.bits.hit
    slowResp.bits.respType         := Mux(feedbackSlow.bits.hit, 0.U, RSFeedbackType.feedbackInvalid)
    slowResp.bits.dataInvalidSqIdx := feedbackSlow.bits.dataInvalidSqIdx
    slowResp.bits.rfWen := DontCare
    slowResp.bits.fuType := DontCare
  }

  statusArray.io.fromMem.get.fastResp.zipWithIndex.foreach { case (fastResp, deqIdx) =>
    val feedbackFast = memIO.feedbackIO(deqIdx).feedbackFast
    fastResp.valid                 := feedbackFast.valid
    fastResp.bits.addrOH           := UIntToOH(feedbackFast.bits.rsIdx)
    fastResp.bits.success          := feedbackFast.bits.hit
    fastResp.bits.respType         := feedbackFast.bits.sourceType
    fastResp.bits.dataInvalidSqIdx := 0.U.asTypeOf(fastResp.bits.dataInvalidSqIdx)
    fastResp.bits.rfWen := DontCare
    fastResp.bits.fuType := DontCare
  }

  statusArray.io.fromMem.get.memWaitUpdateReq := memIO.checkWait.memWaitUpdateReq
  statusArray.io.fromMem.get.stIssuePtr := memIO.checkWait.stIssuePtr

  io.deq.zipWithIndex.foreach { case (deq, i) =>
    deq.bits.common.sqIdx.get := payloadArrayRdata(i).sqIdx
    deq.bits.common.lqIdx.get := payloadArrayRdata(i).lqIdx
    if (params.isLdAddrIQ) {
      deq.bits.common.ftqIdx.get := payloadArrayRdata(i).ftqPtr
      deq.bits.common.ftqOffset.get := payloadArrayRdata(i).ftqOffset
    }
  }
}
621}