xref: /XiangShan/src/main/scala/xiangshan/backend/datapath/DataPath.scala (revision c4fc226ad7a2197009ce1afff94b3636f87bb475)
1package xiangshan.backend.datapath
2
3import org.chipsalliance.cde.config.Parameters
4import chisel3._
5import chisel3.util._
6import difftest.{DiffArchFpRegState, DiffArchIntRegState, DiffArchVecRegState, DifftestModule}
7import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
8import utility._
9import utils.SeqUtils._
10import utils.{XSPerfAccumulate, XSPerfHistogram}
11import xiangshan._
12import xiangshan.backend.BackendParams
13import xiangshan.backend.Bundles._
14import xiangshan.backend.decode.ImmUnion
15import xiangshan.backend.datapath.DataConfig._
16import xiangshan.backend.datapath.RdConfig._
17import xiangshan.backend.issue.{ImmExtractor, IntScheduler, MemScheduler, VfScheduler}
18import xiangshan.backend.issue.EntryBundles._
19import xiangshan.backend.regfile._
20import xiangshan.backend.PcToDataPathIO
21
22class DataPath(params: BackendParams)(implicit p: Parameters) extends LazyModule {
23  override def shouldBeInlined: Boolean = false
24
25  private implicit val dpParams: BackendParams = params
26  lazy val module = new DataPathImp(this)
27
28  println(s"[DataPath] Preg Params: ")
29  println(s"[DataPath]   Int R(${params.getRfReadSize(IntData())}), W(${params.getRfWriteSize(IntData())}) ")
30  println(s"[DataPath]   Vf R(${params.getRfReadSize(VecData())}), W(${params.getRfWriteSize(VecData())}) ")
31}
32
33class DataPathImp(override val wrapper: DataPath)(implicit p: Parameters, params: BackendParams)
34  extends LazyModuleImp(wrapper) with HasXSParameter {
35
36  private val VCONFIG_PORT = params.vconfigPort
37  private val VLD_PORT = params.vldPort
38
39  val io = IO(new DataPathIO())
40
41  private val (fromIntIQ, toIntIQ, toIntExu) = (io.fromIntIQ, io.toIntIQ, io.toIntExu)
42  private val (fromMemIQ, toMemIQ, toMemExu) = (io.fromMemIQ, io.toMemIQ, io.toMemExu)
43  private val (fromVfIQ , toVfIQ , toVfExu ) = (io.fromVfIQ , io.toVfIQ , io.toFpExu)
44
45  println(s"[DataPath] IntIQ(${fromIntIQ.size}), MemIQ(${fromMemIQ.size})")
46  println(s"[DataPath] IntExu(${fromIntIQ.map(_.size).sum}), MemExu(${fromMemIQ.map(_.size).sum})")
47
48  // just refences for convience
49  private val fromIQ: Seq[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] = (fromIntIQ ++ fromVfIQ ++ fromMemIQ).toSeq
50
51  private val toIQs = toIntIQ ++ toVfIQ ++ toMemIQ
52
53  private val toExu: Seq[MixedVec[DecoupledIO[ExuInput]]] = (toIntExu ++ toVfExu ++ toMemExu).toSeq
54
55  private val fromFlattenIQ: Seq[DecoupledIO[IssueQueueIssueBundle]] = fromIQ.flatten
56
57  private val toFlattenExu: Seq[DecoupledIO[ExuInput]] = toExu.flatten
58
59  private val intWbBusyArbiter = Module(new IntRFWBCollideChecker(backendParams))
60  private val vfWbBusyArbiter = Module(new VfRFWBCollideChecker(backendParams))
61  private val intRFReadArbiter = Module(new IntRFReadArbiter(backendParams))
62  private val vfRFReadArbiter = Module(new VfRFReadArbiter(backendParams))
63
64  private val og0FailedVec2: MixedVec[Vec[Bool]] = Wire(MixedVec(fromIQ.map(x => Vec(x.size, Bool())).toSeq))
65  private val og1FailedVec2: MixedVec[Vec[Bool]] = Wire(MixedVec(fromIQ.map(x => Vec(x.size, Bool())).toSeq))
66
67  // port -> win
68  private val intRdArbWinner: Seq2[MixedVec[Bool]] = intRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq
69  private val vfRdArbWinner: Seq2[MixedVec[Bool]] = vfRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq
70  private val intWbNotBlock: Seq[MixedVec[Bool]] = intWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq
71  private val vfWbNotBlock: Seq[MixedVec[Bool]] = vfWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq
72
73  private val intRdNotBlock: Seq2[Bool] = intRdArbWinner.map(_.map(_.asUInt.andR))
74  private val vfRdNotBlock: Seq2[Bool] = vfRdArbWinner.map(_.map(_.asUInt.andR))
75
76  private val intRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getIntRfReadValidBundle(xx.valid)).toSeq).toSeq
77  private val intDataSources: Seq[Seq[Vec[DataSource]]] = fromIQ.map(x => x.map(xx => xx.bits.common.dataSources).toSeq)
78  private val intNumRegSrcs: Seq[Seq[Int]] = fromIQ.map(x => x.map(xx => xx.bits.exuParams.numRegSrc).toSeq)
79
80  intRFReadArbiter.io.in.zip(intRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) =>
81    arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) =>
82      val srcIndices: Seq[Int] = fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(IntData())
83      for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) {
84        if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) {
85          if (intNumRegSrcs(iqIdx)(exuIdx) == 2) {
86            val src0Req = inRFReadReqSeq(0).valid && intDataSources(iqIdx)(exuIdx)(0).readReg
87            val src1Req = inRFReadReqSeq(1).valid && intDataSources(iqIdx)(exuIdx)(1).readReg
88            if (srcIdx == 0) {
89              arbInSeq(srcIdx).valid := src0Req || src1Req
90              arbInSeq(srcIdx).bits.addr := Mux(src1Req && !src0Req, inRFReadReqSeq(1).bits.addr,inRFReadReqSeq(0).bits.addr)
91            } else {
92              arbInSeq(srcIdx).valid := src0Req && src1Req
93              arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr
94            }
95          } else {
96            arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && intDataSources(iqIdx)(exuIdx)(srcIdx).readReg
97            arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr
98          }
99        } else {
100          arbInSeq(srcIdx).valid := false.B
101          arbInSeq(srcIdx).bits.addr := 0.U
102        }
103      }
104    }
105  }
106
107  private val vfRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getVfRfReadValidBundle(xx.valid)).toSeq).toSeq
108
109  vfRFReadArbiter.io.in.zip(vfRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) =>
110    arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) =>
111      val srcIndices: Seq[Int] = VfRegSrcDataSet.flatMap(data => fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(data)).toSeq.sorted
112      for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) {
113        if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) {
114          arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid
115          arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr
116        } else {
117          arbInSeq(srcIdx).valid := false.B
118          arbInSeq(srcIdx).bits.addr := 0.U
119        }
120      }
121    }
122  }
123
124  private val intRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.rfWen.getOrElse(false.B)).toSeq).toSeq
125  private val vfRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.getVfWen.getOrElse(false.B)).toSeq).toSeq
126
127  intWbBusyArbiter.io.in.zip(intRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) =>
128    arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) =>
129      arbIn.valid := inRFWriteReq
130    }
131  }
132
133  vfWbBusyArbiter.io.in.zip(vfRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) =>
134    arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) =>
135      arbIn.valid := inRFWriteReq
136    }
137  }
138
139  private val intSchdParams = params.schdParams(IntScheduler())
140  private val vfSchdParams = params.schdParams(VfScheduler())
141  private val memSchdParams = params.schdParams(MemScheduler())
142
143  private val numIntRfReadByExu = intSchdParams.numIntRfReadByExu + memSchdParams.numIntRfReadByExu
144  private val numVfRfReadByExu = vfSchdParams.numVfRfReadByExu + memSchdParams.numVfRfReadByExu
145  // Todo: limit read port
146  private val numIntR = numIntRfReadByExu
147  private val numVfR = numVfRfReadByExu
148  println(s"[DataPath] RegFile read req needed by Exu: Int(${numIntRfReadByExu}), Vf(${numVfRfReadByExu})")
149  println(s"[DataPath] RegFile read port: Int(${numIntR}), Vf(${numVfR})")
150
151  private val schdParams = params.allSchdParams
152
153  private val pcReadFtqPtr = Wire(chiselTypeOf(io.pcFromPcTargetMem.fromDataPathFtqPtr))
154  private val pcReadFtqOffset = Wire(chiselTypeOf(io.pcFromPcTargetMem.fromDataPathFtqOffset))
155  private val pcRdata = io.pcFromPcTargetMem.toDataPathPC
156  private val intRfRaddr = Wire(Vec(params.numPregRd(IntData()), UInt(intSchdParams.pregIdxWidth.W)))
157  private val intRfRdata = Wire(Vec(params.numPregRd(IntData()), UInt(intSchdParams.rfDataWidth.W)))
158  private val intRfWen = Wire(Vec(io.fromIntWb.length, Bool()))
159  private val intRfWaddr = Wire(Vec(io.fromIntWb.length, UInt(intSchdParams.pregIdxWidth.W)))
160  private val intRfWdata = Wire(Vec(io.fromIntWb.length, UInt(intSchdParams.rfDataWidth.W)))
161
162  private val vfRfSplitNum = VLEN / XLEN
163  private val vfRfRaddr = Wire(Vec(params.numPregRd(VecData()), UInt(vfSchdParams.pregIdxWidth.W)))
164  private val vfRfRdata = Wire(Vec(params.numPregRd(VecData()), UInt(vfSchdParams.rfDataWidth.W)))
165  private val vfRfWen = Wire(Vec(vfRfSplitNum, Vec(io.fromVfWb.length, Bool())))
166  private val vfRfWaddr = Wire(Vec(io.fromVfWb.length, UInt(vfSchdParams.pregIdxWidth.W)))
167  private val vfRfWdata = Wire(Vec(io.fromVfWb.length, UInt(vfSchdParams.rfDataWidth.W)))
168
169  val pcReadFtqPtrFormIQ = fromIntIQ.flatten.filter(x => x.bits.exuParams.needPc)
170  assert(pcReadFtqPtrFormIQ.size == pcReadFtqPtr.size, s"pcReadFtqPtrFormIQ.size ${pcReadFtqPtrFormIQ.size} not equal pcReadFtqPtr.size ${pcReadFtqPtr.size}")
171  pcReadFtqPtr.zip(pcReadFtqPtrFormIQ.map(_.bits.common.ftqIdx.get)).map(x => x._1 := x._2)
172  pcReadFtqOffset.zip(pcReadFtqPtrFormIQ.map(_.bits.common.ftqOffset.get)).map(x => x._1 := x._2)
173  io.pcFromPcTargetMem.fromDataPathFtqPtr := pcReadFtqPtr
174  io.pcFromPcTargetMem.fromDataPathFtqOffset := pcReadFtqOffset
175  private val intDebugRead: Option[(Vec[UInt], Vec[UInt])] =
176    if (env.AlwaysBasicDiff || env.EnableDifftest) {
177      Some(Wire(Vec(32, UInt(intSchdParams.pregIdxWidth.W))), Wire(Vec(32, UInt(XLEN.W))))
178    } else { None }
179  private val vfDebugRead: Option[(Vec[UInt], Vec[UInt])] =
180    if (env.AlwaysBasicDiff || env.EnableDifftest) {
181      Some(Wire(Vec(32 + 32 + 1, UInt(vfSchdParams.pregIdxWidth.W))), Wire(Vec(32 + 32 + 1, UInt(VLEN.W))))
182    } else { None }
183
184  private val fpDebugReadData: Option[Vec[UInt]] =
185    if (env.AlwaysBasicDiff || env.EnableDifftest) {
186      Some(Wire(Vec(32, UInt(XLEN.W))))
187    } else { None }
188  private val vecDebugReadData: Option[Vec[UInt]] =
189    if (env.AlwaysBasicDiff || env.EnableDifftest) {
190      Some(Wire(Vec(64, UInt(64.W)))) // v0 = Cat(Vec(1), Vec(0))
191    } else { None }
192  private val vconfigDebugReadData: Option[UInt] =
193    if (env.AlwaysBasicDiff || env.EnableDifftest) {
194      Some(Wire(UInt(64.W)))
195    } else { None }
196
197
198  fpDebugReadData.foreach(_ := vfDebugRead
199    .get._2
200    .slice(0, 32)
201    .map(_(63, 0))
202  ) // fp only used [63, 0]
203  vecDebugReadData.foreach(_ := vfDebugRead
204    .get._2
205    .slice(32, 64)
206    .map(x => Seq(x(63, 0), x(127, 64))).flatten
207  )
208  vconfigDebugReadData.foreach(_ := vfDebugRead
209    .get._2(64)(63, 0)
210  )
211
212  io.debugVconfig.foreach(_ := vconfigDebugReadData.get)
213
214  IntRegFile("IntRegFile", intSchdParams.numPregs, intRfRaddr, intRfRdata, intRfWen, intRfWaddr, intRfWdata,
215    debugReadAddr = intDebugRead.map(_._1),
216    debugReadData = intDebugRead.map(_._2))
217  VfRegFile("VfRegFile", vfSchdParams.numPregs, vfRfSplitNum, vfRfRaddr, vfRfRdata, vfRfWen, vfRfWaddr, vfRfWdata,
218    debugReadAddr = vfDebugRead.map(_._1),
219    debugReadData = vfDebugRead.map(_._2))
220
221  intRfWaddr := io.fromIntWb.map(_.addr).toSeq
222  intRfWdata := io.fromIntWb.map(_.data).toSeq
223  intRfWen := io.fromIntWb.map(_.wen).toSeq
224
225  for (portIdx <- intRfRaddr.indices) {
226    if (intRFReadArbiter.io.out.isDefinedAt(portIdx))
227      intRfRaddr(portIdx) := intRFReadArbiter.io.out(portIdx).bits.addr
228    else
229      intRfRaddr(portIdx) := 0.U
230  }
231
232  vfRfWaddr := io.fromVfWb.map(_.addr).toSeq
233  vfRfWdata := io.fromVfWb.map(_.data).toSeq
234  vfRfWen.foreach(_.zip(io.fromVfWb.map(_.wen)).foreach { case (wenSink, wenSource) => wenSink := wenSource } )// Todo: support fp multi-write
235
236  for (portIdx <- vfRfRaddr.indices) {
237    if (vfRFReadArbiter.io.out.isDefinedAt(portIdx))
238      vfRfRaddr(portIdx) := vfRFReadArbiter.io.out(portIdx).bits.addr
239    else
240      vfRfRaddr(portIdx) := 0.U
241  }
242
243  vfRfRaddr(VCONFIG_PORT) := io.vconfigReadPort.addr
244  io.vconfigReadPort.data := vfRfRdata(VCONFIG_PORT)
245  // vfRfRaddr(VLD_PORT) := io.vldReadPort.addr
246  io.vldReadPort.data := DontCare
247
248  intDebugRead.foreach { case (addr, _) =>
249    addr := io.debugIntRat.get
250  }
251
252  vfDebugRead.foreach { case (addr, _) =>
253    addr := io.debugFpRat.get ++ io.debugVecRat.get :+ io.debugVconfigRat.get
254  }
255  println(s"[DataPath] " +
256    s"has intDebugRead: ${intDebugRead.nonEmpty}, " +
257    s"has vfDebugRead: ${vfDebugRead.nonEmpty}")
258
259  val s1_addrOHs = Reg(MixedVec(
260    fromIQ.map(x => MixedVec(x.map(_.bits.addrOH.cloneType).toSeq)).toSeq
261  ))
262  val s1_toExuValid: MixedVec[MixedVec[Bool]] = Reg(MixedVec(
263    toExu.map(x => MixedVec(x.map(_.valid.cloneType).toSeq)).toSeq
264  ))
265  val s1_toExuData: MixedVec[MixedVec[ExuInput]] = Reg(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.cloneType).toSeq)).toSeq))
266  val s1_toExuReady = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.ready.cloneType).toSeq))))
267  val s1_srcType: MixedVec[MixedVec[Vec[UInt]]] = MixedVecInit(fromIQ.map(x => MixedVecInit(x.map(xx => RegEnable(xx.bits.srcType, xx.fire)).toSeq)))
268
269  val s1_intPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq))))
270  val s1_vfPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq))))
271
272  val rfrPortConfigs = schdParams.map(_.issueBlockParams).flatten.map(_.exuBlockParams.map(_.rfrPortConfigs))
273
274  println(s"[DataPath] s1_intPregRData.flatten.flatten.size: ${s1_intPregRData.flatten.flatten.size}, intRfRdata.size: ${intRfRdata.size}")
275  s1_intPregRData.foreach(_.foreach(_.foreach(_ := 0.U)))
276  s1_intPregRData.zip(rfrPortConfigs).foreach { case (iqRdata, iqCfg) =>
277      iqRdata.zip(iqCfg).foreach { case (iuRdata, iuCfg) =>
278        val realIuCfg = iuCfg.map(x => if(x.size > 1) x.filter(_.isInstanceOf[IntRD]) else x).flatten
279        assert(iuRdata.size == realIuCfg.size, "iuRdata.size != realIuCfg.size")
280        iuRdata.zip(realIuCfg)
281          .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[IntRD] }
282          .foreach { case (sink, cfg) => sink := intRfRdata(cfg.port) }
283      }
284  }
285
286  println(s"[DataPath] s1_vfPregRData.flatten.flatten.size: ${s1_vfPregRData.flatten.flatten.size}, vfRfRdata.size: ${vfRfRdata.size}")
287  s1_vfPregRData.foreach(_.foreach(_.foreach(_ := 0.U)))
288  s1_vfPregRData.zip(rfrPortConfigs).foreach{ case(iqRdata, iqCfg) =>
289      iqRdata.zip(iqCfg).foreach{ case(iuRdata, iuCfg) =>
290        val realIuCfg = iuCfg.map(x => if(x.size > 1) x.filter(_.isInstanceOf[VfRD]) else x).flatten
291        assert(iuRdata.size == realIuCfg.size, "iuRdata.size != realIuCfg.size")
292        iuRdata.zip(realIuCfg)
293          .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[VfRD] }
294          .foreach { case (sink, cfg) => sink := vfRfRdata(cfg.port) }
295      }
296  }
297
298  for (i <- fromIQ.indices) {
299    for (j <- fromIQ(i).indices) {
300      // IQ(s0) --[Ctrl]--> s1Reg ---------- begin
301      // refs
302      val s1_valid = s1_toExuValid(i)(j)
303      val s1_ready = s1_toExuReady(i)(j)
304      val s1_data = s1_toExuData(i)(j)
305      val s1_addrOH = s1_addrOHs(i)(j)
306      val s0 = fromIQ(i)(j) // s0
307
308      val srcNotBlock = Wire(Bool())
309      srcNotBlock := s0.bits.common.dataSources.zip(intRdArbWinner(i)(j) zip vfRdArbWinner(i)(j)).map { case (source, win) =>
310        !source.readReg || win._1 && win._2
311      }.fold(true.B)(_ && _)
312      if (fromIQ(i)(j).bits.exuParams.schdType.isInstanceOf[IntScheduler] && (fromIQ(i)(j).bits.exuParams.numRegSrc == 2)) {
313        val src0VfBlock = s0.bits.common.dataSources(0).readReg && !vfRdArbWinner(i)(j)(0)
314        val src1VfBlock = s0.bits.common.dataSources(1).readReg && !vfRdArbWinner(i)(j)(1)
315        val src1IntBlock = s0.bits.common.dataSources(0).readReg && s0.bits.common.dataSources(1).readReg && !intRdArbWinner(i)(j)(1)
316        srcNotBlock := !src0VfBlock && !src1VfBlock && !src1IntBlock
317      }
318      val notBlock = srcNotBlock && intWbNotBlock(i)(j) && vfWbNotBlock(i)(j)
319      val s1_flush = s0.bits.common.robIdx.needFlush(Seq(io.flush, RegNextWithEnable(io.flush)))
320      val s1_cancel = og1FailedVec2(i)(j)
321      val s1_ldCancel = LoadShouldCancel(s0.bits.common.loadDependency, io.ldCancel)
322      when (s0.fire && !s1_flush && notBlock && !s1_cancel && !s1_ldCancel) {
323        s1_valid := s0.valid
324        s1_data.fromIssueBundle(s0.bits) // no src data here
325        if (fromIQ(i)(j).bits.exuParams.schdType.isInstanceOf[IntScheduler] && (fromIQ(i)(j).bits.exuParams.numRegSrc == 2)) {
326          s1_data.dataSources(1).value := Mux(!s0.bits.common.dataSources(0).readReg && s0.bits.common.dataSources(1).readReg, DataSource.anotherReg, s0.bits.common.dataSources(1).value)
327        }
328        s1_addrOH := s0.bits.addrOH
329      }.otherwise {
330        s1_valid := false.B
331      }
332      s0.ready := (s1_ready || !s1_valid) && notBlock
333      // IQ(s0) --[Ctrl]--> s1Reg ---------- end
334
335      // IQ(s0) --[Data]--> s1Reg ---------- begin
336      // imm extract
337      when (s0.fire && !s1_flush && notBlock) {
338        if (s1_data.params.immType.nonEmpty && s1_data.src.size > 1) {
339          // rs1 is always int reg, rs2 may be imm
340          when(SrcType.isImm(s0.bits.srcType(1))) {
341            s1_data.src(1) := ImmExtractor(
342              s0.bits.common.imm,
343              s0.bits.immType,
344              s1_data.params.dataBitsMax,
345              s1_data.params.immType.map(_.litValue)
346            )
347          }
348        }
349        if (s1_data.params.hasVecFu) {
350          // Fuck off riscv vector imm!!! Why not src1???
351          when(SrcType.isImm(s0.bits.srcType(0))) {
352            s1_data.src(0) := ImmExtractor(
353              s0.bits.common.imm,
354              s0.bits.immType,
355              s1_data.params.dataBitsMax,
356              s1_data.params.immType.map(_.litValue)
357            )
358          }
359        } else if (s1_data.params.hasLoadFu || s1_data.params.hasHyldaFu) {
360          // dirty code for fused_lui_load
361          when(SrcType.isImm(s0.bits.srcType(0))) {
362            s1_data.src(0) := SignExt(ImmUnion.U.toImm32(s0.bits.common.imm(s0.bits.common.imm.getWidth - 1, ImmUnion.I.len)), XLEN)
363          }
364        }
365      }
366      // IQ(s0) --[Data]--> s1Reg ---------- end
367    }
368  }
369
370  private val fromIQFire = fromIQ.map(_.map(_.fire))
371  private val toExuFire = toExu.map(_.map(_.fire))
372  toIQs.zipWithIndex.foreach {
373    case(toIQ, iqIdx) =>
374      toIQ.zipWithIndex.foreach {
375        case (toIU, iuIdx) =>
376          // IU: issue unit
377          val og0resp = toIU.og0resp
378          og0FailedVec2(iqIdx)(iuIdx) := fromIQ(iqIdx)(iuIdx).valid && (!fromIQFire(iqIdx)(iuIdx))
379          og0resp.valid                 := og0FailedVec2(iqIdx)(iuIdx)
380          og0resp.bits.robIdx           := fromIQ(iqIdx)(iuIdx).bits.common.robIdx
381          og0resp.bits.uopIdx.foreach(_ := fromIQ(iqIdx)(iuIdx).bits.common.vpu.get.vuopIdx)
382          og0resp.bits.resp             := RespType.block
383          og0resp.bits.fuType           := fromIQ(iqIdx)(iuIdx).bits.common.fuType
384
385          val og1resp = toIU.og1resp
386          og1FailedVec2(iqIdx)(iuIdx)   := s1_toExuValid(iqIdx)(iuIdx) && !toExuFire(iqIdx)(iuIdx)
387          og1resp.valid                 := s1_toExuValid(iqIdx)(iuIdx)
388          og1resp.bits.robIdx           := s1_toExuData(iqIdx)(iuIdx).robIdx
389          og1resp.bits.uopIdx.foreach(_ := s1_toExuData(iqIdx)(iuIdx).vpu.get.vuopIdx)
390          // respType:  fuIdle      ->IQ entry clear
391          //            fuUncertain ->IQ entry no action
392          //            fuBusy      ->IQ entry issued set false, then re-issue
393          // Only hyu, lda and sta are fuUncertain at OG1 stage
394          og1resp.bits.resp             := Mux(!og1FailedVec2(iqIdx)(iuIdx),
395            if (toIU.issueQueueParams.isMemAddrIQ) RespType.uncertain else RespType.success,
396            RespType.block
397          )
398          og1resp.bits.fuType           := s1_toExuData(iqIdx)(iuIdx).fuType
399      }
400  }
401
402  io.og0CancelOH := VecInit(fromFlattenIQ.map(x => x.valid && !x.fire)).asUInt
403  io.og1CancelOH := VecInit(toFlattenExu.map(x => x.valid && !x.fire)).asUInt
404
405  io.cancelToBusyTable.zipWithIndex.foreach { case (cancel, i) =>
406    cancel.valid := fromFlattenIQ(i).valid && !fromFlattenIQ(i).fire && {
407      if (fromFlattenIQ(i).bits.common.rfWen.isDefined)
408        fromFlattenIQ(i).bits.common.rfWen.get && fromFlattenIQ(i).bits.common.pdest =/= 0.U
409      else
410        true.B
411    }
412    cancel.bits.rfWen := fromFlattenIQ(i).bits.common.rfWen.getOrElse(false.B)
413    cancel.bits.fpWen := fromFlattenIQ(i).bits.common.fpWen.getOrElse(false.B)
414    cancel.bits.vecWen := fromFlattenIQ(i).bits.common.vecWen.getOrElse(false.B)
415    cancel.bits.pdest := fromFlattenIQ(i).bits.common.pdest
416  }
417
418  for (i <- toExu.indices) {
419    for (j <- toExu(i).indices) {
420      // s1Reg --[Ctrl]--> exu(s1) ---------- begin
421      // refs
422      val sinkData = toExu(i)(j).bits
423      // assign
424      toExu(i)(j).valid := s1_toExuValid(i)(j)
425      s1_toExuReady(i)(j) := toExu(i)(j).ready
426      sinkData := s1_toExuData(i)(j)
427      // s1Reg --[Ctrl]--> exu(s1) ---------- end
428
429      // s1Reg --[Data]--> exu(s1) ---------- begin
430      // data source1: preg read data
431      for (k <- sinkData.src.indices) {
432        val srcDataTypeSet: Set[DataConfig] = sinkData.params.getSrcDataType(k)
433
434        val readRfMap: Seq[(Bool, UInt)] = (Seq(None) :+
435          (if (s1_intPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(IntRegSrcDataSet).nonEmpty)
436            Some(SrcType.isXp(s1_srcType(i)(j)(k)) -> s1_intPregRData(i)(j)(k))
437          else None) :+
438          (if (s1_vfPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(VfRegSrcDataSet).nonEmpty)
439            Some(SrcType.isVfp(s1_srcType(i)(j)(k))-> s1_vfPregRData(i)(j)(k))
440          else None)
441        ).filter(_.nonEmpty).map(_.get)
442        if (readRfMap.nonEmpty)
443          sinkData.src(k) := Mux1H(readRfMap)
444      }
445
446      // data source2: extracted imm and pc saved in s1Reg
447      if (sinkData.params.immType.nonEmpty && sinkData.src.size > 1) {
448        when(SrcType.isImm(s1_srcType(i)(j)(1))) {
449          sinkData.src(1) := s1_toExuData(i)(j).src(1)
450        }
451      }
452      if (sinkData.params.hasJmpFu) {
453        val index = pcReadFtqPtrFormIQ.map(_.bits.exuParams).indexOf(sinkData.params)
454        sinkData.pc.get := pcRdata(index)
455      } else if (sinkData.params.hasVecFu) {
456        when(SrcType.isImm(s1_srcType(i)(j)(0))) {
457          sinkData.src(0) := s1_toExuData(i)(j).src(0)
458        }
459      } else if (sinkData.params.hasLoadFu || sinkData.params.hasHyldaFu) {
460        when(SrcType.isImm(s1_srcType(i)(j)(0))) {
461          sinkData.src(0) := s1_toExuData(i)(j).src(0)
462        }
463      }
464      // s1Reg --[Data]--> exu(s1) ---------- end
465    }
466  }
467
468  if (env.AlwaysBasicDiff || env.EnableDifftest) {
469    val delayedCnt = 2
470    val difftestArchIntRegState = DifftestModule(new DiffArchIntRegState, delay = delayedCnt)
471    difftestArchIntRegState.coreid := io.hartId
472    difftestArchIntRegState.value := intDebugRead.get._2
473
474    val difftestArchFpRegState = DifftestModule(new DiffArchFpRegState, delay = delayedCnt)
475    difftestArchFpRegState.coreid := io.hartId
476    difftestArchFpRegState.value := fpDebugReadData.get
477
478    val difftestArchVecRegState = DifftestModule(new DiffArchVecRegState, delay = delayedCnt)
479    difftestArchVecRegState.coreid := io.hartId
480    difftestArchVecRegState.value := vecDebugReadData.get
481  }
482
483  val int_regcache_size = 48
484  val int_regcache_tag = RegInit(VecInit(Seq.fill(int_regcache_size)(0.U(intSchdParams.pregIdxWidth.W))))
485  val int_regcache_enqPtr = RegInit(0.U(log2Up(int_regcache_size).W))
486  int_regcache_enqPtr := int_regcache_enqPtr + PopCount(intRfWen)
487  for (i <- intRfWen.indices) {
488    when (intRfWen(i)) {
489      int_regcache_tag(int_regcache_enqPtr + PopCount(intRfWen.take(i))) := intRfWaddr(i)
490    }
491  }
492
493  val vf_regcache_size = 48
494  val vf_regcache_tag = RegInit(VecInit(Seq.fill(vf_regcache_size)(0.U(vfSchdParams.pregIdxWidth.W))))
495  val vf_regcache_enqPtr = RegInit(0.U(log2Up(vf_regcache_size).W))
496  vf_regcache_enqPtr := vf_regcache_enqPtr + PopCount(vfRfWen.head)
497  for (i <- vfRfWen.indices) {
498    when (vfRfWen.head(i)) {
499      vf_regcache_tag(vf_regcache_enqPtr + PopCount(vfRfWen.head.take(i))) := vfRfWaddr(i)
500    }
501  }
502
503  XSPerfHistogram(s"IntRegFileRead_hist", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 20, 1)
504  XSPerfHistogram(s"VfRegFileRead_hist", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 20, 1)
505  XSPerfHistogram(s"IntRegFileWrite_hist", PopCount(intRFWriteReq.flatten), true.B, 0, 20, 1)
506  XSPerfHistogram(s"VfRegFileWrite_hist", PopCount(vfRFWriteReq.flatten), true.B, 0, 20, 1)
507
508  val int_regcache_part32 = (1 until 33).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
509  val int_regcache_part24 = (1 until 24).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
510  val int_regcache_part16 = (1 until 17).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
511  val int_regcache_part8 = (1 until 9).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
512
513  val int_regcache_48_hit_vec = intRFReadArbiter.io.in.flatten.flatten.map(x => x.valid && int_regcache_tag.map(_ === x.bits.addr).reduce(_ || _))
514  val int_regcache_8_hit_vec = intRFReadArbiter.io.in.flatten.flatten.map(x => x.valid && int_regcache_part8.map(_ === x.bits.addr).reduce(_ || _))
515  val int_regcache_16_hit_vec = intRFReadArbiter.io.in.flatten.flatten.map(x => x.valid && int_regcache_part16.map(_ === x.bits.addr).reduce(_ || _))
516  val int_regcache_24_hit_vec = intRFReadArbiter.io.in.flatten.flatten.map(x => x.valid && int_regcache_part24.map(_ === x.bits.addr).reduce(_ || _))
517  val int_regcache_32_hit_vec = intRFReadArbiter.io.in.flatten.flatten.map(x => x.valid && int_regcache_part32.map(_ === x.bits.addr).reduce(_ || _))
518  XSPerfAccumulate("IntRegCache48Hit", PopCount(int_regcache_48_hit_vec))
519  XSPerfAccumulate("IntRegCache8Hit", PopCount(int_regcache_8_hit_vec))
520  XSPerfAccumulate("IntRegCache16Hit", PopCount(int_regcache_16_hit_vec))
521  XSPerfAccumulate("IntRegCache24Hit", PopCount(int_regcache_24_hit_vec))
522  XSPerfAccumulate("IntRegCache32Hit", PopCount(int_regcache_32_hit_vec))
523  XSPerfHistogram("IntRegCache48Hit_hist", PopCount(int_regcache_48_hit_vec), true.B, 0, 16, 2)
524
525  XSPerfAccumulate(s"IntRFReadBeforeArb", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)))
526  XSPerfAccumulate(s"IntRFReadAfterArb", PopCount(intRFReadArbiter.io.out.map(_.valid)))
527  XSPerfAccumulate(s"VfRFReadBeforeArb", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)))
528  XSPerfAccumulate(s"VfRFReadAfterArb", PopCount(vfRFReadArbiter.io.out.map(_.valid)))
529  XSPerfAccumulate(s"IntUopBeforeArb", PopCount(fromIntIQ.flatten.map(_.valid)))
530  XSPerfAccumulate(s"IntUopAfterArb", PopCount(fromIntIQ.flatten.map(_.fire)))
531  XSPerfAccumulate(s"MemUopBeforeArb", PopCount(fromMemIQ.flatten.map(_.valid)))
532  XSPerfAccumulate(s"MemUopAfterArb", PopCount(fromMemIQ.flatten.map(_.fire)))
533  XSPerfAccumulate(s"VfUopBeforeArb", PopCount(fromVfIQ.flatten.map(_.valid)))
534  XSPerfAccumulate(s"VfUopAfterArb", PopCount(fromVfIQ.flatten.map(_.fire)))
535
536  XSPerfHistogram(s"IntRFReadBeforeArb_hist", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 16, 2)
537  XSPerfHistogram(s"IntRFReadAfterArb_hist", PopCount(intRFReadArbiter.io.out.map(_.valid)), true.B, 0, 16, 2)
538  XSPerfHistogram(s"VfRFReadBeforeArb_hist", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 16, 2)
539  XSPerfHistogram(s"VfRFReadAfterArb_hist", PopCount(vfRFReadArbiter.io.out.map(_.valid)), true.B, 0, 16, 2)
540  XSPerfHistogram(s"IntUopBeforeArb_hist", PopCount(fromIntIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
541  XSPerfHistogram(s"IntUopAfterArb_hist", PopCount(fromIntIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
542  XSPerfHistogram(s"MemUopBeforeArb_hist", PopCount(fromMemIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
543  XSPerfHistogram(s"MemUopAfterArb_hist", PopCount(fromMemIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
544  XSPerfHistogram(s"VfUopBeforeArb_hist", PopCount(fromVfIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
545  XSPerfHistogram(s"VfUopAfterArb_hist", PopCount(fromVfIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
546}
547
548class DataPathIO()(implicit p: Parameters, params: BackendParams) extends XSBundle {
549  // params
550  private val intSchdParams = params.schdParams(IntScheduler())
551  private val vfSchdParams = params.schdParams(VfScheduler())
552  private val memSchdParams = params.schdParams(MemScheduler())
553  // bundles
554  val hartId = Input(UInt(8.W))
555
556  val flush: ValidIO[Redirect] = Flipped(ValidIO(new Redirect))
557
558  // Todo: check if this can be removed
559  val vconfigReadPort = new RfReadPort(XLEN, PhyRegIdxWidth)
560
561  val vldReadPort = new RfReadPort(VLEN, PhyRegIdxWidth)
562
563  val wbConfictRead = Input(MixedVec(params.allSchdParams.map(x => MixedVec(x.issueBlockParams.map(x => x.genWbConflictBundle())))))
564
565  val fromIntIQ: MixedVec[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] =
566    Flipped(MixedVec(intSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))
567
568  val fromMemIQ: MixedVec[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] =
569    Flipped(MixedVec(memSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))
570
571  val fromVfIQ = Flipped(MixedVec(vfSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))
572
573  val toIntIQ = MixedVec(intSchdParams.issueBlockParams.map(_.genOGRespBundle))
574
575  val toMemIQ = MixedVec(memSchdParams.issueBlockParams.map(_.genOGRespBundle))
576
577  val toVfIQ = MixedVec(vfSchdParams.issueBlockParams.map(_.genOGRespBundle))
578
579  val og0CancelOH = Output(ExuOH(backendParams.numExu))
580
581  val og1CancelOH = Output(ExuOH(backendParams.numExu))
582
583  val ldCancel = Vec(backendParams.LduCnt + backendParams.HyuCnt, Flipped(new LoadCancelIO))
584
585  val cancelToBusyTable = Vec(backendParams.numExu, ValidIO(new CancelSignal))
586
587  val toIntExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = intSchdParams.genExuInputBundle
588
589  val toFpExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = MixedVec(vfSchdParams.genExuInputBundle)
590
591  val toMemExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = memSchdParams.genExuInputBundle
592
593  val fromIntWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genIntWriteBackBundle)
594
595  val fromVfWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genVfWriteBackBundle)
596
597  val pcFromPcTargetMem = Flipped(new PcToDataPathIO(params))
598
599  val debugIntRat     = if (params.debugEn) Some(Input(Vec(32, UInt(intSchdParams.pregIdxWidth.W)))) else None
600  val debugFpRat      = if (params.debugEn) Some(Input(Vec(32, UInt(vfSchdParams.pregIdxWidth.W)))) else None
601  val debugVecRat     = if (params.debugEn) Some(Input(Vec(32, UInt(vfSchdParams.pregIdxWidth.W)))) else None
602  val debugVconfigRat = if (params.debugEn) Some(Input(UInt(vfSchdParams.pregIdxWidth.W))) else None
603  val debugVconfig    = if (params.debugEn) Some(Output(UInt(XLEN.W))) else None
604}
605