package xiangshan.backend.issue

import chipsalliance.rocketchip.config.Parameters
import chisel3._
import chisel3.util._
import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
import utility.HasCircularQueuePtrHelper
import xiangshan._
import xiangshan.backend.fu.{FuConfig, FuType}
import xiangshan.mem.{MemWaitUpdateReq, SqPtr}
import xiangshan.backend.Bundles.{DynInst, IssueQueueIssueBundle, IssueQueueWakeUpBundle}
import xiangshan.backend.datapath.DataConfig._
import xiangshan.backend.exu.ExeUnitParams

/**
  * Diplomatic wrapper of an issue queue.
  *
  * The concrete implementation is chosen from the scheduler type of `params`:
  * integer and vector/float schedulers get their dedicated implementation, a
  * memory scheduler gets [[IssueQueueMemAddrImp]] when it has no store-data
  * units (`StdCnt == 0`) and [[IssueQueueIntImp]] otherwise.
  *
  * @param params static description of this issue block
  */
class IssueQueue(params: IssueBlockParams)(implicit p: Parameters) extends LazyModule with HasXSParameter {
  implicit val iqParams = params
  lazy val module = iqParams.schdType match {
    case IntScheduler() => new IssueQueueIntImp(this)
    case VfScheduler() => new IssueQueueVfImp(this)
    case MemScheduler() => if (iqParams.StdCnt == 0) new IssueQueueMemAddrImp(this)
                           else new IssueQueueIntImp(this)
    // Fail at elaboration with a clear message instead of handing back a null module.
    case other => throw new IllegalArgumentException(s"IssueQueue: unsupported scheduler type $other")
  }
}

/**
  * Occupancy report of an issue queue.
  *
  * @param numEnq number of enqueue ports; `leftVec` has `numEnq + 1` bits
  */
class IssueQueueStatusBundle(numEnq: Int) extends Bundle {
  val empty = Output(Bool())
  val full = Output(Bool())
  val leftVec = Output(Vec(numEnq + 1, Bool()))
}

/** Response sent back to the issue queue for an issued uop; same fields as [[StatusArrayDeqRespBundle]]. */
class IssueQueueDeqRespBundle(implicit p:Parameters, params: IssueBlockParams) extends StatusArrayDeqRespBundle

/** Common IO of every issue queue implementation. */
class IssueQueueIO()(implicit p: Parameters, params: IssueBlockParams) extends XSBundle {
  val flush = Flipped(ValidIO(new Redirect))

  val enq = Vec(params.numEnq, Flipped(DecoupledIO(new DynInst)))

  val deq: MixedVec[DecoupledIO[IssueQueueIssueBundle]] = params.genIssueDecoupledBundle
  // Three response channels per deq port; all are forwarded to the status array.
  val deqResp = Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  val og0Resp = Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  val og1Resp = Vec(params.numDeq, Flipped(ValidIO(new IssueQueueDeqRespBundle)))
  val wbBusyTableRead = Input(params.genWbFuBusyTableReadBundle())
  val wakeup = Vec(params.numWakeupFromWB, Flipped(ValidIO(new IssueQueueWakeUpBundle(params.pregBits))))
  val status = Output(new IssueQueueStatusBundle(params.numEnq))
  val statusNext = Output(new IssueQueueStatusBundle(params.numEnq))
  // Todo: wake up bundle
}

/**
  * Base implementation shared by all issue queues.
  *
  * It instantiates the status array, the immediate/payload data arrays, the
  * enqueue policy and one dequeue policy per deq port, keeps a per-entry copy
  * of the fuType, maintains a per-port function-unit busy table and drives
  * `io.deq`, `io.status` and `io.statusNext`. Subclasses override `io` and add
  * their own connections.
  */
class IssueQueueImp(override val wrapper: IssueQueue)(implicit p: Parameters, val params: IssueBlockParams)
  extends LazyModuleImp(wrapper)
  with HasXSParameter {

  println(s"[IssueQueueImp] ${params.getIQName} wakeupFromWB: ${params.numWakeupFromWB}, " +
    s"numEntries: ${params.numEntries}, numRegSrc: ${params.numRegSrc}")

  require(params.numExu <= 2, "IssueQueue has not supported more than 2 deq ports")
  val deqFuCfgs     : Seq[Seq[FuConfig]] = params.exuBlockParams.map(_.fuConfigs)
  val fuLatencyMaps : Seq[Option[Seq[(Int, Int)]]] = params.exuBlockParams.map(x => x.fuLatencyMap)
  val intFuLatencyMaps: Seq[Option[Seq[(Int, Int)]]] = params.exuBlockParams.map(x => x.intFuLatencyMap)
  val vfFuLatencyMaps : Seq[Option[Seq[(Int, Int)]]] = params.exuBlockParams.map(x => x.vfFuLatencyMap)
  val latencyValMaxs: Seq[Option[Int]] = params.exuBlockParams.map(x => x.latencyValMax)
  val allDeqFuCfgs: Seq[FuConfig] = params.exuBlockParams.flatMap(_.fuConfigs)
  val fuCfgsCnt   : Map[FuConfig, Int] = allDeqFuCfgs.groupBy(x => x).map { case (cfg, cfgSeq) => (cfg, cfgSeq.length) }
  // Function-unit configs that appear on more than one deq port.
  val commonFuCfgs : Seq[FuConfig] = fuCfgsCnt.filter(_._2 > 1).keys.toSeq
  println(s"[IssueQueueImp] ${params.getIQName} commonFuCfgs: ${commonFuCfgs.map(_.name)}")
  lazy val io = IO(new IssueQueueIO())
  dontTouch(io.deq)
  dontTouch(io.deqResp)
  // Modules
  val statusArray   = Module(StatusArray(p, params))
  val immArray      = Module(new DataArray(UInt(XLEN.W), params.numDeq, params.numEnq, params.numEntries))
  val payloadArray  = Module(new DataArray(Output(new DynInst), params.numDeq, params.numEnq, params.numEntries))
  val enqPolicy     = Module(new EnqPolicy)
  val subDeqPolicies  = deqFuCfgs.map(x => if (x.nonEmpty) Some(Module(new DeqPolicy())) else None)
  // One busy-table register per deq port, only when the port has a positive maximum latency.
  val fuBusyTable = latencyValMaxs.map(_.filter(_ > 0).map(width => Reg(UInt(width.W))))

  // Wires
  val resps = Seq(io.deqResp, io.og0Resp, io.og1Resp)

  val intWbBusyTableRead = io.wbBusyTableRead.map(_.intWbBusyTable)
  val vfWbBusyTableRead = io.wbBusyTableRead.map(_.vfWbBusyTable)
  val fuBusyTableMask = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  val wbBusyTableMask = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  val s0_enqValidVec = io.enq.map(_.valid)
  val s0_enqSelValidVec = Wire(Vec(params.numEnq, Bool()))
  val s0_enqSelOHVec = Wire(Vec(params.numEnq, UInt(params.numEntries.W)))
  val s0_enqNotFlush = !io.flush.valid
  val s0_enqBits = WireInit(VecInit(io.enq.map(_.bits)))
  val s0_doEnqSelValidVec = s0_enqSelValidVec.map(_ && s0_enqNotFlush)
  // Entry one-hot actually written by each enq port this cycle (zero when the port does not enqueue).
  val s0_doEnqOH: Vec[UInt] = VecInit((s0_doEnqSelValidVec zip s0_enqSelOHVec).map { case (valid, oh) =>
    Mux(valid, oh, 0.U)
  })

  val s0_enqImmValidVec = io.enq.map(enq => enq.valid)
  val s0_enqImmVec = VecInit(io.enq.map(_.bits.imm))

  // One deq port only need one special deq policy
  val subDeqSelValidVec: Seq[Option[Vec[Bool]]] = subDeqPolicies.map(_.map(_ => Wire(Vec(params.numDeq, Bool()))))
  val subDeqSelOHVec: Seq[Option[Vec[UInt]]] = subDeqPolicies.map(_.map(_ => Wire(Vec(params.numDeq, UInt(params.numEntries.W)))))

  val finalDeqSelValidVec = Wire(Vec(params.numDeq, Bool()))
  val finalDeqSelOHVec    = Wire(Vec(params.numDeq, UInt(params.numEntries.W)))
  // Selected entry per deq port, gated by the select-valid bit.
  val finalDeqOH: IndexedSeq[UInt] = (finalDeqSelValidVec zip finalDeqSelOHVec).map { case (valid, oh) =>
    Mux(valid, oh, 0.U)
  }
  val finalDeqMask: UInt = finalDeqOH.reduce(_ | _)

  val deqRespVec = io.deqResp

  val validVec = VecInit(statusArray.io.valid.asBools)
  val canIssueVec = VecInit(statusArray.io.canIssue.asBools)
  val clearVec = VecInit(statusArray.io.clear.asBools)
  val deqFirstIssueVec = VecInit(statusArray.io.deq.map(_.isFirstIssue))

  // Per enq port and source: OR of the wakeup results of all wakeup ports for that source this cycle.
  val wakeupEnqSrcStateBypass = Wire(Vec(io.enq.size, Vec(io.enq.head.bits.srcType.size, SrcState())))
  for (i <- io.enq.indices) {
    for (j <- s0_enqBits(i).srcType.indices) {
      wakeupEnqSrcStateBypass(i)(j) := Cat(
        io.wakeup.map(x => x.bits.wakeUp(Seq((s0_enqBits(i).psrc(j), s0_enqBits(i).srcType(j))), x.valid).head)
      ).orR
    }
  }

  statusArray.io match { case statusArrayIO: StatusArrayIO =>
    statusArrayIO.flush  <> io.flush
    statusArrayIO.wakeup <> io.wakeup
    statusArrayIO.enq.zipWithIndex.foreach { case (enq: ValidIO[StatusArrayEnqBundle], i) =>
      enq.valid                 := s0_doEnqSelValidVec(i)
      enq.bits.addrOH           := s0_enqSelOHVec(i)
      val numLSrc = s0_enqBits(i).srcType.size.min(enq.bits.data.srcType.size)
      for (j <- 0 until numLSrc) {
        // A source is ready if it already was, or if it is being woken up this very cycle.
        enq.bits.data.srcState(j) := s0_enqBits(i).srcState(j) | wakeupEnqSrcStateBypass(i)(j)
        enq.bits.data.psrc(j)     := s0_enqBits(i).psrc(j)
        enq.bits.data.srcType(j)  := s0_enqBits(i).srcType(j)
      }
      enq.bits.data.robIdx      := s0_enqBits(i).robIdx
      enq.bits.data.ready       := false.B
      enq.bits.data.issued      := false.B
      enq.bits.data.firstIssue  := false.B
      enq.bits.data.blocked     := false.B
    }
    statusArrayIO.deq.zipWithIndex.foreach { case (deq, i) =>
      deq.deqSelOH.valid  := finalDeqSelValidVec(i)
      deq.deqSelOH.bits   := finalDeqSelOHVec(i)
    }
    // Forward the three response channels field by field to the status array.
    Seq(
      (statusArrayIO.deqResp, io.deqResp),
      (statusArrayIO.og0Resp, io.og0Resp),
      (statusArrayIO.og1Resp, io.og1Resp)
    ).foreach { case (sinkVec, sourceVec) =>
      sinkVec.zipWithIndex.foreach { case (sink, i) =>
        sink.valid                 := sourceVec(i).valid
        sink.bits.addrOH           := sourceVec(i).bits.addrOH
        sink.bits.success          := sourceVec(i).bits.success
        sink.bits.dataInvalidSqIdx := sourceVec(i).bits.dataInvalidSqIdx
        sink.bits.respType         := sourceVec(i).bits.respType
        sink.bits.rfWen            := sourceVec(i).bits.rfWen
        sink.bits.fuType           := sourceVec(i).bits.fuType
      }
    }
  }

  val immArrayRdataVec = immArray.io.read.map(_.data)
  immArray.io match { case immArrayIO: DataArrayIO[UInt] =>
    immArrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i) && s0_enqImmValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      w.data := s0_enqImmVec(i)
    }
    immArrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqOH(i)
    }
  }

  val payloadArrayRdata = Wire(Vec(params.numDeq, Output(new DynInst)))
  payloadArray.io match { case payloadArrayIO: DataArrayIO[DynInst] =>
    payloadArrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      w.data := s0_enqBits(i)
    }
    payloadArrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqOH(i)
      payloadArrayRdata(i) := r.data
    }
  }

  // Per-entry copy of the fuType, written at enqueue; read by the accept and busy-table logic below.
  val fuTypeRegVec = Reg(Vec(params.numEntries, FuType()))
  val fuTypeNextVec = WireInit(fuTypeRegVec)
  fuTypeRegVec := fuTypeNextVec

  s0_doEnqSelValidVec.zip(s0_enqSelOHVec).zipWithIndex.foreach { case ((valid, oh), i) =>
    when (valid) {
      fuTypeNextVec(OHToUInt(oh)) := s0_enqBits(i).fuType
    }
  }

  enqPolicy.io.valid := validVec.asUInt
  // An enq port enqueues when it is valid, the policy found it an entry and the queue is ready.
  s0_enqSelValidVec := enqPolicy.io.enqSelOHVec.map(oh => oh.valid).zip(s0_enqValidVec).zip(io.enq).map {
    case ((sel, enqValid), enq) => enqValid && sel && enq.ready
  }
  s0_enqSelOHVec := enqPolicy.io.enqSelOHVec.map(oh => oh.bits)

  // Bit per entry: the entry's fuType belongs to a config shared by several deq ports.
  protected val commonAccept: UInt = Cat(fuTypeRegVec.map(fuType =>
    Cat(commonFuCfgs.map(_.fuType.U === fuType)).orR
  ).reverse)

  // if deq port can accept the uop
  protected val canAcceptVec: Seq[UInt] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    Cat(fuTypeRegVec.map(fuType => Cat(fuCfgs.map(_.fuType.U === fuType)).orR).reverse).asUInt
  }

  protected val deqCanAcceptVec: Seq[IndexedSeq[Bool]] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    fuTypeRegVec.map(fuType =>
      Cat(fuCfgs.map(_.fuType.U === fuType)).asUInt.orR) // C+E0    C+E1
  }

  // Each port's sub policy only sees entries that can issue, that the port accepts,
  // and that neither busy table currently masks out.
  subDeqPolicies.zipWithIndex.foreach { case (dpOption, i) =>
    dpOption.foreach { dp =>
      dp.io.request := canIssueVec.asUInt & VecInit(deqCanAcceptVec(i)).asUInt & (~fuBusyTableMask(i)).asUInt & (~wbBusyTableMask(i)).asUInt
      subDeqSelValidVec(i).get := dp.io.deqSelOHVec.map(oh => oh.valid)
      subDeqSelOHVec(i).get := dp.io.deqSelOHVec.map(oh => oh.bits)
    }
  }

  protected val enqCanAcceptVec: Seq[IndexedSeq[Bool]] = deqFuCfgs.map { fuCfgs: Seq[FuConfig] =>
    io.enq.map(_.bits.fuType).map(fuType =>
      Cat(fuCfgs.map(_.fuType.U === fuType)).asUInt.orR) // C+E0    C+E1
  }

  // Per deq port: the enqueued entry one-hots, kept only for uops that port accepts.
  val ageDetectorEnqVec: Vec[Vec[UInt]] = WireInit(VecInit(Seq.fill(params.numDeq)(VecInit(Seq.fill(params.numEnq)(0.U(params.numEntries.W))))))

  ageDetectorEnqVec.zip(enqCanAcceptVec) foreach {
    case (ageDetectorEnq, enqCanAccept) =>
      ageDetectorEnq := enqCanAccept.zip(s0_doEnqOH).map {
        case (canAccept, doEnqOH) => Mux(canAccept, doEnqOH, 0.U)
      }
  }

  // NOTE(review): unlike the sub deq policy request above, canIssue here is not masked with
  // wbBusyTableMask - confirm whether the oldest-first path is meant to ignore it.
  val oldestSelVec = (0 until params.numDeq).map { deqIdx =>
    AgeDetector(numEntries = params.numEntries,
      enq = ageDetectorEnqVec(deqIdx),
      deq = clearVec.asUInt,
      canIssue = canIssueVec.asUInt & (~fuBusyTableMask(deqIdx)).asUInt)
  }

  // Port 0: the oldest entry when there is one, otherwise the sub policy's first choice.
  finalDeqSelValidVec.head := oldestSelVec.head.valid || subDeqSelValidVec.head.getOrElse(Seq(false.B)).head
  finalDeqSelOHVec.head := Mux(oldestSelVec.head.valid, oldestSelVec.head.bits, subDeqSelOHVec.head.getOrElse(Seq(0.U)).head)

  if (params.numDeq == 2) {
    // Port 1 must not pick the entry port 0 picked: try its oldest entry, then the sub policy's
    // first choice, and fall back to the sub policy's last choice.
    val chooseOldest = oldestSelVec(1).valid && oldestSelVec(1).bits =/= finalDeqSelOHVec.head
    val choose1stSub = subDeqSelOHVec(1).getOrElse(Seq(0.U)).head =/= finalDeqSelOHVec.head

    finalDeqSelValidVec(1) := MuxCase(subDeqSelValidVec(1).getOrElse(Seq(false.B)).last, Seq(
      (chooseOldest) -> oldestSelVec(1).valid,
      (choose1stSub) -> subDeqSelValidVec(1).getOrElse(Seq(false.B)).head)
    )
    finalDeqSelOHVec(1) := MuxCase(subDeqSelOHVec(1).getOrElse(Seq(0.U)).last, Seq(
      (chooseOldest) -> oldestSelVec(1).bits,
      (choose1stSub) -> subDeqSelOHVec(1).getOrElse(Seq(0.U)).head)
    )
  }

  // fuBusyTable write
  for (i <- 0 until params.numDeq) {
    fuBusyTable(i).foreach { busyTable =>
      val latencyValMax = latencyValMaxs(i).get
      val fuLatencyMap = fuLatencyMaps(i).get

      // One bit per latency 1..latencyValMax (latency 1 is the MSB, because Cat puts its first
      // element on top): set when the fuType of the entry at `addrOH` has that latency.
      def latencyHitVec(addrOH: UInt): UInt = {
        val entryFuType = fuTypeRegVec(OHToUInt(addrOH))
        Cat((0 until latencyValMax).map { num =>
          val latencyNumFuType = fuLatencyMap.filter(_._2 == num + 1).map(_._1) // futype with latency equal to num+1
          Cat(latencyNumFuType.map(futype => entryFuType === futype.U)).asUInt.orR // The latency of the deq inst is Num
        })
      }

      // Bits to set: the latency of the uop whose issue succeeded this cycle.
      // | when N cycle is 2 latency, N+1 cycle could not 1 latency
      val isLatencyNumVec = Mux(resps(0)(i).valid && resps(0)(i).bits.respType === RSFeedbackType.issueSuccess,
        latencyHitVec(io.deqResp(i).bits.addrOH),
        0.U
      )
      // Bits to keep (active low clear) when an og0 response reports rfArbitFail;
      // the hit vector is padded with one low bit.
      val isLNumVecOg0 = WireInit(~(0.U.asTypeOf(isLatencyNumVec)))
      isLNumVecOg0 := Mux(resps(1)(i).valid && resps(1)(i).bits.respType === RSFeedbackType.rfArbitFail,
        ~(Cat(latencyHitVec(io.og0Resp(i).bits.addrOH), 0.U(1.W))),
        ~(0.U.asTypeOf(isLatencyNumVec))
      )
      // Same for an og1 response reporting fuBusy; the hit vector is padded with two low bits.
      val isLNumVecOg1 = WireInit(~(0.U.asTypeOf(isLatencyNumVec)))
      isLNumVecOg1 := Mux(resps(2)(i).valid && resps(2)(i).bits.respType === RSFeedbackType.fuBusy,
        ~(Cat(latencyHitVec(io.og1Resp(i).bits.addrOH), 0.U(2.W))),
        ~(0.U.asTypeOf(isLatencyNumVec))
      )

      // Shift every cycle, add the newly issued uop, drop the bits of cancelled uops.
      busyTable := ((busyTable << 1.U).asUInt | isLatencyNumVec) & isLNumVecOg0.asUInt & isLNumVecOg1.asUInt
    }
  }

  /**
    * Expands busy-table bits into per-entry masks.
    *
    * @param busyBits   busy bits; the position of a bit in the sequence is matched against the latency
    * @param latencyMap (fuType, latency) pairs; evaluated only while elaborating a mask
    * @return for each busy bit, a mask that is zero while the bit is clear and otherwise marks the
    *         entries whose stored fuType is mapped to a latency equal to the bit's position
    */
  private def busyEntryMasks(busyBits: Seq[Bool], latencyMap: => Seq[(Int, Int)]): Seq[UInt] =
    busyBits.zipWithIndex.map { case (en, idx) =>
      val isLatencyNumVec = WireInit(0.U(params.numEntries.W))
      when(en) {
        isLatencyNumVec := VecInit(fuTypeRegVec.map { futype =>
          val latencyNumFuType = latencyMap.filter(_._2 == idx).map(_._1)
          Cat(latencyNumFuType.map(_.U === futype)).asUInt.orR
        }).asUInt
      }
      isLatencyNumVec
    }

  for (i <- 0 until params.numDeq) {
    // fuBusyTable read (bits are visited MSB first)
    fuBusyTableMask(i) := (fuBusyTable(i) match {
      case Some(busyTable) => busyEntryMasks(busyTable.asBools.reverse, fuLatencyMaps(i).get).reduce(_ | _)
      case None            => 0.U(params.numEntries.W)
    })

    // intWbFuBusyTable read
    val intWbBusyTableMask = intWbBusyTableRead(i) match {
      case Some(busyTable) => busyEntryMasks(busyTable.asBools, intFuLatencyMaps(i).get).fold(0.U)(_ | _)
      case None            => 0.U(params.numEntries.W)
    }
    // vfWbFuBusyTable read
    val vfWbBusyTableMask = vfWbBusyTableRead(i) match {
      case Some(busyTable) => busyEntryMasks(busyTable.asBools, vfFuLatencyMaps(i).get).fold(0.U)(_ | _)
      case None            => 0.U(params.numEntries.W)
    }

    wbBusyTableMask(i) := intWbBusyTableMask | vfWbBusyTableMask
  }

  io.deq.zipWithIndex.foreach { case (deq, i) =>
    deq.valid                := finalDeqSelValidVec(i)
    deq.bits.addrOH          := finalDeqSelOHVec(i)
    deq.bits.common.isFirstIssue := deqFirstIssueVec(i)
    deq.bits.common.iqIdx    := OHToUInt(finalDeqSelOHVec(i))
    deq.bits.common.fuType   := payloadArrayRdata(i).fuType
    deq.bits.common.fuOpType := payloadArrayRdata(i).fuOpType
    deq.bits.common.rfWen.foreach(_ := payloadArrayRdata(i).rfWen)
    deq.bits.common.fpWen.foreach(_ := payloadArrayRdata(i).fpWen)
    deq.bits.common.vecWen.foreach(_ := payloadArrayRdata(i).vecWen)
    deq.bits.common.flushPipe.foreach(_ := payloadArrayRdata(i).flushPipe)
    deq.bits.common.pdest := payloadArrayRdata(i).pdest
    deq.bits.common.robIdx := payloadArrayRdata(i).robIdx
    deq.bits.common.imm := immArrayRdataVec(i)
    deq.bits.rf.zip(payloadArrayRdata(i).psrc).foreach { case (rf, psrc) =>
      rf.foreach(_.addr := psrc) // psrc in payload array can be pregIdx of IntRegFile or VfRegFile
    }
    deq.bits.rf.zip(payloadArrayRdata(i).srcType).foreach { case (rf, srcType) =>
      rf.foreach(_.srcType := srcType) // every read port of a source carries that source's srcType
    }
    deq.bits.srcType.zip(payloadArrayRdata(i).srcType).foreach { case (sink, source) =>
      sink := source
    }
    deq.bits.immType := payloadArrayRdata(i).selImm
  }

  // Todo: better counter implementation
  private val validCnt = PopCount(validVec)
  private val enqSelCnt = PopCount(s0_doEnqSelValidVec)
  private val validCntNext = validCnt + enqSelCnt
  io.status.full := validVec.asUInt.andR
  io.status.empty := !validVec.asUInt.orR
  // leftVec(0) mirrors full; leftVec(k) is set when validCnt equals numEntries - k, for k = 1..numEnq.
  io.status.leftVec(0) := io.status.full
  for (i <- 0 until params.numEnq) {
    io.status.leftVec(i + 1) := validCnt === (params.numEntries - (i + 1)).U
  }
  io.statusNext.full := validCntNext === params.numEntries.U
  io.statusNext.empty := validCntNext === 0.U // always false now
  io.statusNext.leftVec(0) := io.statusNext.full
  for (i <- 0 until params.numEnq) {
    io.statusNext.leftVec(i + 1) := validCntNext === (params.numEntries - (i + 1)).U
  }
  // All enq ports share one ready: deasserted as soon as any leftVec bit is set.
  io.enq.foreach(_.ready := !Cat(io.status.leftVec).orR) // Todo: more efficient implementation
}

/** PC and target address carried with a uop; both are `VAddrData().dataWidth` bits wide. */
class IssueQueueJumpBundle extends Bundle {
  val pc = UInt(VAddrData().dataWidth.W)
  val target = UInt(VAddrData().dataWidth.W)
}

/** Load fast-path information: one `fastMatch` bit per load unit and a 12-bit `fastImm`. */
class IssueQueueLoadBundle(implicit p: Parameters) extends XSBundle {
  val fastMatch = UInt(backendParams.LduCnt.W)
  val fastImm = UInt(12.W)
}

/** IO of the integer issue queue: the common IO plus `enqJmp`, present only when the block has PC read ports. */
class IssueQueueIntIO()(implicit p: Parameters, params: IssueBlockParams) extends IssueQueueIO {
  val enqJmp = if(params.numPcReadPort > 0) Some(Input(Vec(params.numPcReadPort, new IssueQueueJumpBundle))) else None
}

/**
  * Integer issue queue.
  *
  * On top of the base implementation it stores a PC and a target per entry
  * (only when `params.needPc`) and forwards branch-prediction, store-queue
  * and fpu fields of the payload to the deq ports that have them.
  */
class IssueQueueIntImp(override val wrapper: IssueQueue)(implicit p: Parameters, iqParams: IssueBlockParams)
  extends IssueQueueImp(wrapper)
{
  // NOTE(review): `io` is re-declared below with a wider bundle and an explicit "io" name;
  // this extra suggestName looks like a naming workaround - confirm before touching it.
  io.suggestName("none")
  override lazy val io = IO(new IssueQueueIntIO).suggestName("io")
  val pcArray: Option[DataArray[UInt]] = if(params.needPc) Some(Module(
    new DataArray(UInt(VAddrData().dataWidth.W), params.numDeq, params.numEnq, params.numEntries)
  )) else None
  val targetArray: Option[DataArray[UInt]] = if(params.needPc) Some(Module(
    new DataArray(UInt(VAddrData().dataWidth.W), params.numDeq, params.numEnq, params.numEntries)
  )) else None

  pcArray.foreach { array =>
    val pcArrayIO = array.io
    pcArrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqSelOHVec(i)
    }
    pcArrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      // The PC is taken from the enqueued uop itself, not from io.enqJmp.
      w.data := io.enq(i).bits.pc
    }
  }

  targetArray.foreach { array =>
    val arrayIO = array.io
    arrayIO.read.zipWithIndex.foreach { case (r, i) =>
      r.addr := finalDeqSelOHVec(i)
    }
    arrayIO.write.zipWithIndex.foreach { case (w, i) =>
      w.en := s0_doEnqSelValidVec(i)
      w.addr := s0_enqSelOHVec(i)
      // NOTE(review): assumes io.enqJmp exists and has an element per enq port whenever
      // params.needPc holds - confirm against IssueBlockParams.
      w.data := io.enqJmp.get(i).target
    }
  }

  io.deq.zipWithIndex.foreach{ case (deq, i) => {
    deq.bits.jmp.foreach((deqJmp: IssueQueueJumpBundle) => {
      deqJmp.pc := pcArray.get.io.read(i).data
      deqJmp.target := targetArray.get.io.read(i).data
    })
    deq.bits.common.preDecode.foreach(_ := payloadArrayRdata(i).preDecodeInfo)
    deq.bits.common.ftqIdx.foreach(_ := payloadArrayRdata(i).ftqPtr)
    deq.bits.common.ftqOffset.foreach(_ := payloadArrayRdata(i).ftqOffset)
    deq.bits.common.predictInfo.foreach(x => {
      x.target := targetArray.get.io.read(i).data
      x.taken := payloadArrayRdata(i).pred_taken
    })
    // for std
    deq.bits.common.sqIdx.foreach(_ := payloadArrayRdata(i).sqIdx)
    // for i2f
    deq.bits.common.fpu.foreach(_ := payloadArrayRdata(i).fpu)
  }}
}

/**
  * Vector/float issue queue.
  *
  * Re-drives the status array enqueue data so that srcState/psrc cover every
  * source the two sides have in common, forces the types of sources 3 and 4
  * (when present) to `SrcType.vp`, and forwards fpu/vpu payload fields to deq.
  */
class IssueQueueVfImp(override val wrapper: IssueQueue)(implicit p: Parameters, iqParams: IssueBlockParams)
  extends IssueQueueImp(wrapper)
{
  statusArray.io match { case statusArrayIO: StatusArrayIO =>
    statusArrayIO.enq.zipWithIndex.foreach { case (enq: ValidIO[StatusArrayEnqBundle], i) =>
      val numLSrc = s0_enqBits(i).srcType.size min enq.bits.data.srcType.size
      val numPSrc = s0_enqBits(i).srcState.size min enq.bits.data.srcState.size

      for (j <- 0 until numPSrc) {
        enq.bits.data.srcState(j) := s0_enqBits(i).srcState(j) | wakeupEnqSrcStateBypass(i)(j)
        enq.bits.data.psrc(j)     := s0_enqBits(i).psrc(j)
      }

      for (j <- 0 until numLSrc) {
        enq.bits.data.srcType(j) := s0_enqBits(i).srcType(j)
      }
      if (enq.bits.data.srcType.isDefinedAt(3)) enq.bits.data.srcType(3) := SrcType.vp // v0: mask src
      if (enq.bits.data.srcType.isDefinedAt(4)) enq.bits.data.srcType(4) := SrcType.vp // vl&vtype
    }
  }
  io.deq.zipWithIndex.foreach{ case (deq, i) => {
    deq.bits.common.fpu.foreach(_ := payloadArrayRdata(i).fpu)
    deq.bits.common.vpu.foreach(_ := payloadArrayRdata(i).vpu)
    deq.bits.common.vpu.foreach(_.vuopIdx := payloadArrayRdata(i).uopIdx)
  }}
}

/** Memory-side ports of a memory issue queue: per-deq feedback, store-wait checking inputs and load fast-match outputs. */
class IssueQueueMemBundle(implicit p: Parameters, params: IssueBlockParams) extends Bundle {
  val feedbackIO = Flipped(Vec(params.numDeq, new MemRSFeedbackIO))
  val checkWait = new Bundle {
    val stIssuePtr = Input(new SqPtr)
    val memWaitUpdateReq = Flipped(new MemWaitUpdateReq)
  }
  val loadFastMatch = Output(Vec(params.LduCnt, new IssueQueueLoadBundle))
}

/** IO of the memory-address issue queue: the common IO plus the memory bundle. */
class IssueQueueMemIO(implicit p: Parameters, params: IssueBlockParams) extends IssueQueueIO {
  val memIO = Some(new IssueQueueMemBundle)
}

/**
  * Memory-address issue queue (load / store-address / vector-load units, no store-data unit).
  *
  * Adds the load-wait handling at enqueue, fills the memory fields of the
  * status array entries, feeds the slow/fast memory feedback and the
  * store-issue information into the status array, and forwards sqIdx/lqIdx
  * (and ftq fields for a load-address queue) to the deq ports.
  */
class IssueQueueMemAddrImp(override val wrapper: IssueQueue)(implicit p: Parameters, params: IssueBlockParams)
  extends IssueQueueImp(wrapper) with HasCircularQueuePtrHelper {

  require(params.StdCnt == 0 && (params.LduCnt + params.StaCnt + params.VlduCnt) > 0, "IssueQueueMemAddrImp can only be instance of MemAddr IQ")

  // NOTE(review): same `io` re-declaration pattern as the integer queue - confirm before touching it.
  io.suggestName("none")
  override lazy val io = IO(new IssueQueueMemIO).suggestName("io")
  private val memIO = io.memIO.get

  for (i <- io.enq.indices) {
    val blockNotReleased = isAfter(io.enq(i).bits.sqIdx, memIO.checkWait.stIssuePtr)
    // Some store pipeline is issuing the store this enq uop waits for. The pipeline index has its
    // own name so that io.enq(i) below refers to the current enq port; it was previously shadowed
    // by the pipeline index, which compared against the wrong enq port.
    val storeAddrWaitForIsIssuing = VecInit((0 until StorePipelineWidth).map(staIdx => {
      val staIssue = memIO.checkWait.memWaitUpdateReq.staIssue(staIdx)
      staIssue.valid &&
        staIssue.bits.uop.robIdx.value === io.enq(i).bits.waitForRobIdx.value
    })).asUInt.orR && !io.enq(i).bits.loadWaitStrict // is waiting for store addr ready
    s0_enqBits(i).loadWaitBit := io.enq(i).bits.loadWaitBit && !storeAddrWaitForIsIssuing && blockNotReleased
  }

  for (i <- statusArray.io.enq.indices) {
    val enqData = statusArray.io.enq(i).bits.data
    enqData.blocked := s0_enqBits(i).loadWaitBit
    enqData.mem.get.strictWait := s0_enqBits(i).loadWaitStrict
    enqData.mem.get.waitForStd := false.B
    enqData.mem.get.waitForRobIdx := s0_enqBits(i).waitForRobIdx
    enqData.mem.get.waitForSqIdx := 0.U.asTypeOf(enqData.mem.get.waitForSqIdx) // generated by sq, will be updated later
    enqData.mem.get.sqIdx := s0_enqBits(i).sqIdx
  }

  // The connections below do not depend on the enq port, so they are made once here rather than
  // inside the loop above. deqResp/og0Resp/og1Resp are already forwarded to the status array by
  // IssueQueueImp with exactly the same fields and are not repeated.
  statusArray.io.fromMem.get.slowResp.zipWithIndex.foreach { case (slowResp, i) =>
    slowResp.valid                 := memIO.feedbackIO(i).feedbackSlow.valid
    slowResp.bits.addrOH           := UIntToOH(memIO.feedbackIO(i).feedbackSlow.bits.rsIdx)
    slowResp.bits.success          := memIO.feedbackIO(i).feedbackSlow.bits.hit
    slowResp.bits.respType         := Mux(memIO.feedbackIO(i).feedbackSlow.bits.hit, 0.U, RSFeedbackType.feedbackInvalid)
    slowResp.bits.dataInvalidSqIdx := memIO.feedbackIO(i).feedbackSlow.bits.dataInvalidSqIdx
    slowResp.bits.rfWen := DontCare
    slowResp.bits.fuType := DontCare
  }

  statusArray.io.fromMem.get.fastResp.zipWithIndex.foreach { case (fastResp, i) =>
    fastResp.valid                 := memIO.feedbackIO(i).feedbackFast.valid
    fastResp.bits.addrOH           := UIntToOH(memIO.feedbackIO(i).feedbackFast.bits.rsIdx)
    fastResp.bits.success          := memIO.feedbackIO(i).feedbackFast.bits.hit
    fastResp.bits.respType         := memIO.feedbackIO(i).feedbackFast.bits.sourceType
    fastResp.bits.dataInvalidSqIdx := 0.U.asTypeOf(fastResp.bits.dataInvalidSqIdx)
    fastResp.bits.rfWen := DontCare
    fastResp.bits.fuType := DontCare
  }

  statusArray.io.fromMem.get.memWaitUpdateReq := memIO.checkWait.memWaitUpdateReq
  statusArray.io.fromMem.get.stIssuePtr := memIO.checkWait.stIssuePtr

  io.deq.zipWithIndex.foreach { case (deq, i) =>
    deq.bits.common.sqIdx.get := payloadArrayRdata(i).sqIdx
    deq.bits.common.lqIdx.get := payloadArrayRdata(i).lqIdx
    if (params.isLdAddrIQ) {
      deq.bits.common.ftqIdx.get := payloadArrayRdata(i).ftqPtr
      deq.bits.common.ftqOffset.get := payloadArrayRdata(i).ftqOffset
    }
  }
}