package xiangshan.backend.datapath

import org.chipsalliance.cde.config.Parameters
import chisel3._
import chisel3.util._
import difftest.{DiffArchFpRegState, DiffArchIntRegState, DiffArchVecRegState, DifftestModule}
import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
import utility._
import utils.SeqUtils._
import utils._
import xiangshan._
import xiangshan.backend.BackendParams
import xiangshan.backend.Bundles._
import xiangshan.backend.decode.ImmUnion
import xiangshan.backend.datapath.DataConfig._
import xiangshan.backend.datapath.RdConfig._
import xiangshan.backend.issue.{ImmExtractor, IntScheduler, MemScheduler, VfScheduler, FpScheduler}
import xiangshan.backend.issue.EntryBundles._
import xiangshan.backend.regfile._
import xiangshan.backend.PcToDataPathIO
import xiangshan.backend.fu.FuType.is0latency

/**
 * `LazyModule` wrapper of the datapath.
 *
 * It exposes `params` as an implicit [[BackendParams]] for the lazily built
 * [[DataPathImp]] and, while being constructed, prints the register-file
 * read/write sizes reported by `params` for each register data kind.
 *
 * @param params backend configuration queried for the register-file sizes
 * @param p      implicit configuration passed on to the implementation
 */
class DataPath(params: BackendParams)(implicit p: Parameters) extends LazyModule {
  override def shouldBeInlined: Boolean = false

  // Picked up implicitly by the DataPathImp constructor below.
  private implicit val dpParams: BackendParams = params
  lazy val module = new DataPathImp(this)

  // Construction-time report: one line per register data kind, in a fixed order.
  println("[DataPath] Preg Params: ")
  Seq[(String, DataConfig)](
    "Int" -> IntData(),
    "Fp"  -> FpData(),
    "Vf"  -> VecData(),
    "V0"  -> V0Data(),
    "Vl"  -> VlData()
  ).foreach { case (rfName, dataCfg) =>
    println(s"[DataPath] $rfName R(${params.getRfReadSize(dataCfg)}), W(${params.getRfWriteSize(dataCfg)}) ")
  }
}

// Implementation of DataPath; the class body continues past this block.
class DataPathImp(override val wrapper: DataPath)(implicit p: Parameters, params: BackendParams)
  extends LazyModuleImp(wrapper) with HasXSParameter {

  val io = IO(new DataPathIO())

  // Local aliases for the per-scheduler fields of `io`.
  private val (fromIntIQ, toIntIQ, toIntExu) = (io.fromIntIQ, io.toIntIQ, io.toIntExu)
  private val (fromFpIQ,
toFpIQ, toFpExu) = (io.fromFpIQ, io.toFpIQ, io.toFpExu) 44 private val (fromMemIQ, toMemIQ, toMemExu) = (io.fromMemIQ, io.toMemIQ, io.toMemExu) 45 private val (fromVfIQ, toVfIQ, toVfExu ) = (io.fromVfIQ, io.toVfIQ, io.toVecExu) 46 47 println(s"[DataPath] IntIQ(${fromIntIQ.size}), FpIQ(${fromFpIQ.size}), VecIQ(${fromVfIQ.size}), MemIQ(${fromMemIQ.size})") 48 println(s"[DataPath] IntExu(${fromIntIQ.map(_.size).sum}), FpExu(${fromFpIQ.map(_.size).sum}), VecExu(${fromVfIQ.map(_.size).sum}), MemExu(${fromMemIQ.map(_.size).sum})") 49 50 // just refences for convience 51 private val fromIQ: Seq[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] = (fromIntIQ ++ fromFpIQ ++ fromVfIQ ++ fromMemIQ).toSeq 52 53 private val toIQs = toIntIQ ++ toFpIQ ++ toVfIQ ++ toMemIQ 54 55 private val toExu: Seq[MixedVec[DecoupledIO[ExuInput]]] = (toIntExu ++ toFpExu ++ toVfExu ++ toMemExu).toSeq 56 57 private val fromFlattenIQ: Seq[DecoupledIO[IssueQueueIssueBundle]] = fromIQ.flatten 58 59 private val toFlattenExu: Seq[DecoupledIO[ExuInput]] = toExu.flatten 60 61 private val intWbBusyArbiter = Module(new IntRFWBCollideChecker(backendParams)) 62 private val fpWbBusyArbiter = Module(new FpRFWBCollideChecker(backendParams)) 63 private val vfWbBusyArbiter = Module(new VfRFWBCollideChecker(backendParams)) 64 private val v0WbBusyArbiter = Module(new V0RFWBCollideChecker(backendParams)) 65 private val vlWbBusyArbiter = Module(new VlRFWBCollideChecker(backendParams)) 66 67 private val intRFReadArbiter = Module(new IntRFReadArbiter(backendParams)) 68 private val fpRFReadArbiter = Module(new FpRFReadArbiter(backendParams)) 69 private val vfRFReadArbiter = Module(new VfRFReadArbiter(backendParams)) 70 private val v0RFReadArbiter = Module(new V0RFReadArbiter(backendParams)) 71 private val vlRFReadArbiter = Module(new VlRFReadArbiter(backendParams)) 72 73 private val og0FailedVec2: MixedVec[Vec[Bool]] = Wire(MixedVec(fromIQ.map(x => Vec(x.size, Bool())).toSeq)) 74 private val og1FailedVec2: 
MixedVec[Vec[Bool]] = Wire(MixedVec(fromIQ.map(x => Vec(x.size, Bool())).toSeq)) 75 76 // port -> win 77 private val intRdArbWinner: Seq2[MixedVec[Bool]] = intRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq 78 private val fpRdArbWinner: Seq2[MixedVec[Bool]] = fpRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq 79 private val vfRdArbWinner: Seq2[MixedVec[Bool]] = vfRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq 80 private val v0RdArbWinner: Seq2[MixedVec[Bool]] = v0RFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq 81 private val vlRdArbWinner: Seq2[MixedVec[Bool]] = vlRFReadArbiter.io.in.map(_.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq).toSeq 82 83 private val intWbNotBlock: Seq[MixedVec[Bool]] = intWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq 84 private val fpWbNotBlock: Seq[MixedVec[Bool]] = fpWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq 85 private val vfWbNotBlock: Seq[MixedVec[Bool]] = vfWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq 86 private val v0WbNotBlock: Seq[MixedVec[Bool]] = v0WbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq 87 private val vlWbNotBlock: Seq[MixedVec[Bool]] = vlWbBusyArbiter.io.in.map(x => MixedVecInit(x.map(_.ready).toSeq)).toSeq 88 89 private val intRdNotBlock: Seq2[Bool] = intRdArbWinner.map(_.map(_.asUInt.andR)) 90 private val fpRdNotBlock: Seq2[Bool] = fpRdArbWinner.map(_.map(_.asUInt.andR)) 91 private val vfRdNotBlock: Seq2[Bool] = vfRdArbWinner.map(_.map(_.asUInt.andR)) 92 private val v0RdNotBlock: Seq2[Bool] = v0RdArbWinner.map(_.map(_.asUInt.andR)) 93 private val vlRdNotBlock: Seq2[Bool] = vlRdArbWinner.map(_.map(_.asUInt.andR)) 94 95 private val intRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getRfReadValidBundle(xx.valid)).toSeq).toSeq 96 
private val fpRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getRfReadValidBundle(xx.valid)).toSeq).toSeq 97 private val vfRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getRfReadValidBundle(xx.valid)).toSeq).toSeq 98 private val v0RFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getRfReadValidBundle(xx.valid)).toSeq).toSeq 99 private val vlRFReadReq: Seq3[ValidIO[RfReadPortWithConfig]] = fromIQ.map(x => x.map(xx => xx.bits.getRfReadValidBundle(xx.valid)).toSeq).toSeq 100 101 private val allDataSources: Seq[Seq[Vec[DataSource]]] = fromIQ.map(x => x.map(xx => xx.bits.common.dataSources).toSeq) 102 private val allNumRegSrcs: Seq[Seq[Int]] = fromIQ.map(x => x.map(xx => xx.bits.exuParams.numRegSrc).toSeq) 103 104 intRFReadArbiter.io.in.zip(intRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) => 105 arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) => 106 val srcIndices: Seq[Int] = fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(IntData()) 107 for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) { 108 if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) { 109 arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 110 arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 111// if (allNumRegSrcs(iqIdx)(exuIdx) == 2) { 112// val src0Req = inRFReadReqSeq(0).valid && allDataSources(iqIdx)(exuIdx)(0).readReg 113// val src1Req = inRFReadReqSeq(1).valid && allDataSources(iqIdx)(exuIdx)(1).readReg 114// if (srcIdx == 0) { 115// arbInSeq(srcIdx).valid := src0Req || src1Req 116// arbInSeq(srcIdx).bits.addr := Mux(src1Req && !src0Req, inRFReadReqSeq(1).bits.addr,inRFReadReqSeq(0).bits.addr) 117// } else { 118// arbInSeq(srcIdx).valid := src0Req && src1Req 119// arbInSeq(srcIdx).bits.addr := 
inRFReadReqSeq(srcIdx).bits.addr 120// } 121// } else { 122// arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 123// arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 124// } 125 } else { 126 arbInSeq(srcIdx).valid := false.B 127 arbInSeq(srcIdx).bits.addr := 0.U 128 } 129 } 130 } 131 } 132 fpRFReadArbiter.io.in.zip(fpRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) => 133 arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) => 134 val srcIndices: Seq[Int] = FpRegSrcDataSet.flatMap(data => fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(data)).toSeq.sorted 135 for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) { 136 if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) { 137 arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 138 arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 139 } else { 140 arbInSeq(srcIdx).valid := false.B 141 arbInSeq(srcIdx).bits.addr := 0.U 142 } 143 } 144 } 145 } 146 147 vfRFReadArbiter.io.in.zip(vfRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) => 148 arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) => 149 val srcIndices: Seq[Int] = VecRegSrcDataSet.flatMap(data => fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(data)).toSeq.sorted 150 for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) { 151 if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) { 152 arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 153 arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 154 } else { 155 arbInSeq(srcIdx).valid := false.B 156 arbInSeq(srcIdx).bits.addr := 0.U 157 } 158 } 159 } 160 } 161 162 
v0RFReadArbiter.io.in.zip(v0RFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) => 163 arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) => 164 val srcIndices: Seq[Int] = V0RegSrcDataSet.flatMap(data => fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(data)).toSeq.sorted 165 for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) { 166 if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) { 167 arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 168 arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 169 } else { 170 arbInSeq(srcIdx).valid := false.B 171 arbInSeq(srcIdx).bits.addr := 0.U 172 } 173 } 174 } 175 } 176 177 vlRFReadArbiter.io.in.zip(vlRFReadReq).zipWithIndex.foreach { case ((arbInSeq2, inRFReadReqSeq2), iqIdx) => 178 arbInSeq2.zip(inRFReadReqSeq2).zipWithIndex.foreach { case ((arbInSeq, inRFReadReqSeq), exuIdx) => 179 val srcIndices: Seq[Int] = VlRegSrcDataSet.flatMap(data => fromIQ(iqIdx)(exuIdx).bits.exuParams.getRfReadSrcIdx(data)).toSeq.sorted 180 for (srcIdx <- 0 until fromIQ(iqIdx)(exuIdx).bits.exuParams.numRegSrc) { 181 if (srcIndices.contains(srcIdx) && inRFReadReqSeq.isDefinedAt(srcIdx)) { 182 arbInSeq(srcIdx).valid := inRFReadReqSeq(srcIdx).valid && allDataSources(iqIdx)(exuIdx)(srcIdx).readReg 183 arbInSeq(srcIdx).bits.addr := inRFReadReqSeq(srcIdx).bits.addr 184 } else { 185 arbInSeq(srcIdx).valid := false.B 186 arbInSeq(srcIdx).bits.addr := 0.U 187 } 188 } 189 } 190 } 191 192 private val intRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.rfWen.getOrElse(false.B)).toSeq).toSeq 193 private val fpRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.fpWen.getOrElse(false.B)).toSeq).toSeq 194 private val vfRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && 
xx.bits.common.vecWen.getOrElse(false.B)).toSeq).toSeq 195 private val v0RFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.v0Wen.getOrElse(false.B)).toSeq).toSeq 196 private val vlRFWriteReq: Seq2[Bool] = fromIQ.map(x => x.map(xx => xx.valid && xx.bits.common.vlWen.getOrElse(false.B)).toSeq).toSeq 197 198 intWbBusyArbiter.io.in.zip(intRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) => 199 arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) => 200 arbIn.valid := inRFWriteReq 201 } 202 } 203 204 fpWbBusyArbiter.io.in.zip(fpRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) => 205 arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) => 206 arbIn.valid := inRFWriteReq 207 } 208 } 209 210 vfWbBusyArbiter.io.in.zip(vfRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) => 211 arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) => 212 arbIn.valid := inRFWriteReq 213 } 214 } 215 216 v0WbBusyArbiter.io.in.zip(v0RFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) => 217 arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) => 218 arbIn.valid := inRFWriteReq 219 } 220 } 221 222 vlWbBusyArbiter.io.in.zip(vlRFWriteReq).foreach { case (arbInSeq, inRFWriteReqSeq) => 223 arbInSeq.zip(inRFWriteReqSeq).foreach { case (arbIn, inRFWriteReq) => 224 arbIn.valid := inRFWriteReq 225 } 226 } 227 228 private val intSchdParams = params.schdParams(IntScheduler()) 229 private val fpSchdParams = params.schdParams(FpScheduler()) 230 private val vfSchdParams = params.schdParams(VfScheduler()) 231 private val memSchdParams = params.schdParams(MemScheduler()) 232 233 private val schdParams = params.allSchdParams 234 235 private val pcReadValid = Wire(chiselTypeOf(io.fromPcTargetMem.fromDataPathValid)) 236 private val pcReadFtqPtr = Wire(chiselTypeOf(io.fromPcTargetMem.fromDataPathFtqPtr)) 237 private val pcReadFtqOffset = Wire(chiselTypeOf(io.fromPcTargetMem.fromDataPathFtqOffset)) 238 private val 
targetPCRdata = io.fromPcTargetMem.toDataPathTargetPC 239 private val pcRdata = io.fromPcTargetMem.toDataPathPC 240 private val intRfRaddr = Wire(Vec(params.numPregRd(IntData()), UInt(intSchdParams.pregIdxWidth.W))) 241 private val intRfRdata = Wire(Vec(params.numPregRd(IntData()), UInt(intSchdParams.rfDataWidth.W))) 242 private val intRfWen = Wire(Vec(io.fromIntWb.length, Bool())) 243 private val intRfWaddr = Wire(Vec(io.fromIntWb.length, UInt(intSchdParams.pregIdxWidth.W))) 244 private val intRfWdata = Wire(Vec(io.fromIntWb.length, UInt(intSchdParams.rfDataWidth.W))) 245 246 private val fpRfRaddr = Wire(Vec(params.numPregRd(FpData()), UInt(fpSchdParams.pregIdxWidth.W))) 247 private val fpRfRdata = Wire(Vec(params.numPregRd(FpData()), UInt(fpSchdParams.rfDataWidth.W))) 248 private val fpRfWen = Wire(Vec(io.fromFpWb.length, Bool())) 249 private val fpRfWaddr = Wire(Vec(io.fromFpWb.length, UInt(fpSchdParams.pregIdxWidth.W))) 250 private val fpRfWdata = Wire(Vec(io.fromFpWb.length, UInt(fpSchdParams.rfDataWidth.W))) 251 252 private val vfRfSplitNum = VLEN / XLEN 253 private val vfRfRaddr = Wire(Vec(params.numPregRd(VecData()), UInt(vfSchdParams.pregIdxWidth.W))) 254 private val vfRfRdata = Wire(Vec(params.numPregRd(VecData()), UInt(vfSchdParams.rfDataWidth.W))) 255 private val vfRfWen = Wire(Vec(vfRfSplitNum, Vec(io.fromVfWb.length, Bool()))) 256 private val vfRfWaddr = Wire(Vec(io.fromVfWb.length, UInt(vfSchdParams.pregIdxWidth.W))) 257 private val vfRfWdata = Wire(Vec(io.fromVfWb.length, UInt(vfSchdParams.rfDataWidth.W))) 258 259 private val v0RfSplitNum = VLEN / XLEN 260 private val v0RfRaddr = Wire(Vec(params.numPregRd(V0Data()), UInt(log2Up(V0PhyRegs).W))) 261 private val v0RfRdata = Wire(Vec(params.numPregRd(V0Data()), UInt(V0Data().dataWidth.W))) 262 private val v0RfWen = Wire(Vec(v0RfSplitNum, Vec(io.fromV0Wb.length, Bool()))) 263 private val v0RfWaddr = Wire(Vec(io.fromV0Wb.length, UInt(log2Up(V0PhyRegs).W))) 264 private val v0RfWdata = 
Wire(Vec(io.fromV0Wb.length, UInt(V0Data().dataWidth.W))) 265 266 private val vlRfRaddr = Wire(Vec(params.numPregRd(VlData()), UInt(log2Up(VlPhyRegs).W))) 267 private val vlRfRdata = Wire(Vec(params.numPregRd(VlData()), UInt(VlData().dataWidth.W))) 268 private val vlRfWen = Wire(Vec(io.fromVlWb.length, Bool())) 269 private val vlRfWaddr = Wire(Vec(io.fromVlWb.length, UInt(log2Up(VlPhyRegs).W))) 270 private val vlRfWdata = Wire(Vec(io.fromVlWb.length, UInt(VlData().dataWidth.W))) 271 272 val pcReadFtqPtrFormIQ = fromIntIQ.flatten.filter(x => x.bits.exuParams.needPc) 273 assert(pcReadFtqPtrFormIQ.size == pcReadFtqPtr.size, s"pcReadFtqPtrFormIQ.size ${pcReadFtqPtrFormIQ.size} not equal pcReadFtqPtr.size ${pcReadFtqPtr.size}") 274 pcReadValid.zip(pcReadFtqPtrFormIQ.map(_.valid)).map(x => x._1 := x._2) 275 pcReadFtqPtr.zip(pcReadFtqPtrFormIQ.map(_.bits.common.ftqIdx.get)).map(x => x._1 := x._2) 276 pcReadFtqOffset.zip(pcReadFtqPtrFormIQ.map(_.bits.common.ftqOffset.get)).map(x => x._1 := x._2) 277 io.fromPcTargetMem.fromDataPathValid := pcReadValid 278 io.fromPcTargetMem.fromDataPathFtqPtr := pcReadFtqPtr 279 io.fromPcTargetMem.fromDataPathFtqOffset := pcReadFtqOffset 280 281 private val intDebugRead: Option[(Vec[UInt], Vec[UInt])] = 282 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, (Wire(Vec(32, UInt(intSchdParams.pregIdxWidth.W))), Wire(Vec(32, UInt(XLEN.W))))) 283 private val fpDebugRead: Option[(Vec[UInt], Vec[UInt])] = 284 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, (Wire(Vec(32, UInt(fpSchdParams.pregIdxWidth.W))), Wire(Vec(32, UInt(XLEN.W))))) 285 private val vfDebugRead: Option[(Vec[UInt], Vec[UInt])] = 286 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, (Wire(Vec(31, UInt(vfSchdParams.pregIdxWidth.W))), Wire(Vec(31, UInt(VLEN.W))))) 287 private val v0DebugRead: Option[(Vec[UInt], Vec[UInt])] = 288 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, (Wire(Vec(1, UInt(log2Up(V0PhyRegs).W))), Wire(Vec(1, 
UInt(V0Data().dataWidth.W))))) 289 private val vlDebugRead: Option[(Vec[UInt], Vec[UInt])] = 290 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, (Wire(Vec(1, UInt(log2Up(VlPhyRegs).W))), Wire(Vec(1, UInt(VlData().dataWidth.W))))) 291 292 private val fpDebugReadData: Option[Vec[UInt]] = 293 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, Wire(Vec(32, UInt(XLEN.W)))) 294 private val vecDebugReadData: Option[Vec[UInt]] = 295 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, Wire(Vec(64, UInt(64.W)))) // v0 = Cat(Vec(1), Vec(0)) 296 private val vlDebugReadData: Option[UInt] = 297 OptionWrapper(env.AlwaysBasicDiff || env.EnableDifftest, Wire(UInt(VlData().dataWidth.W))) 298 299 300 fpDebugReadData.foreach(_ := fpDebugRead 301 .get._2 302 .slice(0, 32) 303 .map(_(63, 0)) 304 ) // fp only used [63, 0] 305 vecDebugReadData.foreach(_ := 306 v0DebugRead 307 .get._2 308 .slice(0, 1) 309 .map(x => Seq(x(63, 0), x(127, 64))).flatten ++ 310 vfDebugRead 311 .get._2 312 .slice(0, 31) 313 .map(x => Seq(x(63, 0), x(127, 64))).flatten 314 ) 315 vlDebugReadData.foreach(_ := vlDebugRead 316 .get._2(0) 317 ) 318 319 io.debugVl.foreach(_ := vlDebugReadData.get) 320 321 IntRegFile("IntRegFile", intSchdParams.numPregs, intRfRaddr, intRfRdata, intRfWen, intRfWaddr, intRfWdata, 322 bankNum = 1, 323 debugReadAddr = intDebugRead.map(_._1), 324 debugReadData = intDebugRead.map(_._2) 325 ) 326 FpRegFile("FpRegFile", fpSchdParams.numPregs, fpRfRaddr, fpRfRdata, fpRfWen, fpRfWaddr, fpRfWdata, 327 bankNum = 1, 328 debugReadAddr = fpDebugRead.map(_._1), 329 debugReadData = fpDebugRead.map(_._2) 330 ) 331 VfRegFile("VfRegFile", vfSchdParams.numPregs, vfRfSplitNum, vfRfRaddr, vfRfRdata, vfRfWen, vfRfWaddr, vfRfWdata, 332 debugReadAddr = vfDebugRead.map(_._1), 333 debugReadData = vfDebugRead.map(_._2) 334 ) 335 VfRegFile("V0RegFile", V0PhyRegs, v0RfSplitNum, v0RfRaddr, v0RfRdata, v0RfWen, v0RfWaddr, v0RfWdata, 336 debugReadAddr = v0DebugRead.map(_._1), 337 debugReadData = 
v0DebugRead.map(_._2) 338 ) 339 FpRegFile("VlRegFile", VlPhyRegs, vlRfRaddr, vlRfRdata, vlRfWen, vlRfWaddr, vlRfWdata, 340 bankNum = 1, 341 debugReadAddr = vlDebugRead.map(_._1), 342 debugReadData = vlDebugRead.map(_._2) 343 ) 344 345 intRfWaddr := io.fromIntWb.map(x => RegEnable(x.addr, x.wen)).toSeq 346 intRfWdata := io.fromIntWb.map(x => RegEnable(x.data, x.wen)).toSeq 347 intRfWen := RegNext(VecInit(io.fromIntWb.map(_.wen).toSeq)) 348 349 for (portIdx <- intRfRaddr.indices) { 350 if (intRFReadArbiter.io.out.isDefinedAt(portIdx)) 351 intRfRaddr(portIdx) := intRFReadArbiter.io.out(portIdx).bits.addr 352 else 353 intRfRaddr(portIdx) := 0.U 354 } 355 356 fpRfWaddr := io.fromFpWb.map(x => RegEnable(x.addr, x.wen)).toSeq 357 fpRfWdata := io.fromFpWb.map(x => RegEnable(x.data, x.wen)).toSeq 358 fpRfWen := RegNext(VecInit(io.fromFpWb.map(_.wen).toSeq)) 359 360 for (portIdx <- fpRfRaddr.indices) { 361 if (fpRFReadArbiter.io.out.isDefinedAt(portIdx)) 362 fpRfRaddr(portIdx) := fpRFReadArbiter.io.out(portIdx).bits.addr 363 else 364 fpRfRaddr(portIdx) := 0.U 365 } 366 367 vfRfWaddr := io.fromVfWb.map(x => RegEnable(x.addr, x.wen)).toSeq 368 vfRfWdata := io.fromVfWb.map(x => RegEnable(x.data, x.wen)).toSeq 369 vfRfWen.foreach(_.zip(io.fromVfWb.map(x => RegNext(x.wen))).foreach { case (wenSink, wenSource) => wenSink := wenSource } ) 370 371 for (portIdx <- vfRfRaddr.indices) { 372 if (vfRFReadArbiter.io.out.isDefinedAt(portIdx)) 373 vfRfRaddr(portIdx) := vfRFReadArbiter.io.out(portIdx).bits.addr 374 else 375 vfRfRaddr(portIdx) := 0.U 376 } 377 378 v0RfWaddr := io.fromV0Wb.map(_.addr).toSeq 379 v0RfWdata := io.fromV0Wb.map(_.data).toSeq 380 v0RfWen.foreach(_.zip(io.fromV0Wb.map(_.wen)).foreach { case (wenSink, wenSource) => wenSink := wenSource } ) 381 382 for (portIdx <- v0RfRaddr.indices) { 383 if (v0RFReadArbiter.io.out.isDefinedAt(portIdx)) 384 v0RfRaddr(portIdx) := v0RFReadArbiter.io.out(portIdx).bits.addr 385 else 386 v0RfRaddr(portIdx) := 0.U 387 } 388 389 vlRfWaddr := 
io.fromVlWb.map(_.addr).toSeq 390 vlRfWdata := io.fromVlWb.map(_.data).toSeq 391 vlRfWen := io.fromVlWb.map(_.wen).toSeq 392 393 for (portIdx <- vlRfRaddr.indices) { 394 if (vlRFReadArbiter.io.out.isDefinedAt(portIdx)) 395 vlRfRaddr(portIdx) := vlRFReadArbiter.io.out(portIdx).bits.addr 396 else 397 vlRfRaddr(portIdx) := 0.U 398 } 399 400 401 intDebugRead.foreach { case (addr, _) => 402 addr := io.debugIntRat.get 403 } 404 405 fpDebugRead.foreach { case (addr, _) => 406 addr := io.debugFpRat.get 407 } 408 409 vfDebugRead.foreach { case (addr, _) => 410 addr := io.debugVecRat.get 411 } 412 v0DebugRead.foreach { case (addr, _) => 413 addr := VecInit(io.debugV0Rat.get) 414 } 415 vlDebugRead.foreach { case (addr, _) => 416 addr := VecInit(io.debugVlRat.get) 417 } 418 419 println(s"[DataPath] " + 420 s"has intDebugRead: ${intDebugRead.nonEmpty}, " + 421 s"has fpDebugRead: ${fpDebugRead.nonEmpty}, " + 422 s"has vecDebugRead: ${vfDebugRead.nonEmpty}, " + 423 s"has v0DebugRead: ${v0DebugRead.nonEmpty}, " + 424 s"has vlDebugRead: ${vlDebugRead.nonEmpty}") 425 426 val s1_addrOHs = Reg(MixedVec( 427 fromIQ.map(x => MixedVec(x.map(_.bits.addrOH.cloneType).toSeq)).toSeq 428 )) 429 val s1_toExuValid: MixedVec[MixedVec[Bool]] = Reg(MixedVec( 430 toExu.map(x => MixedVec(x.map(_.valid.cloneType).toSeq)).toSeq 431 )) 432 val s1_toExuData: MixedVec[MixedVec[ExuInput]] = Reg(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.cloneType).toSeq)).toSeq)) 433 val s1_immInfo = Reg(MixedVec(toExu.map(x => MixedVec(x.map(x => new ImmInfo).toSeq)).toSeq)) 434 s1_immInfo.zip(fromIQ).map { case (s1Vec, s0Vec) => 435 s1Vec.zip(s0Vec).map { case (s1, s0) => 436 s1.imm := Mux(s0.valid, s0.bits.common.imm, s1.imm) 437 s1.immType := Mux(s0.valid, s0.bits.immType, s1.immType) 438 } 439 } 440 io.og1ImmInfo.zip(s1_immInfo.flatten).map{ case(out, reg) => 441 out := reg 442 } 443 val s1_toExuReady = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.ready.cloneType).toSeq)))) 444 val s1_srcType: 
MixedVec[MixedVec[Vec[UInt]]] = MixedVecInit(fromIQ.map(x => MixedVecInit(x.map(xx => RegEnable(xx.bits.srcType, xx.fire)).toSeq))) 445 446 val s1_intPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq)))) 447 val s1_fpPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq)))) 448 val s1_vfPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq)))) 449 val s1_v0PregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq)))) 450 val s1_vlPregRData: MixedVec[MixedVec[Vec[UInt]]] = Wire(MixedVec(toExu.map(x => MixedVec(x.map(_.bits.src.cloneType).toSeq)))) 451 452 val rfrPortConfigs = schdParams.map(_.issueBlockParams).flatten.map(_.exuBlockParams.map(_.rfrPortConfigs)) 453 454 println(s"[DataPath] s1_intPregRData.flatten.flatten.size: ${s1_intPregRData.flatten.flatten.size}, intRfRdata.size: ${intRfRdata.size}") 455 s1_intPregRData.foreach(_.foreach(_.foreach(_ := 0.U))) 456 s1_intPregRData.zip(rfrPortConfigs).foreach { case (iqRdata, iqCfg) => 457 iqRdata.zip(iqCfg).foreach { case (iuRdata, iuCfg) => 458 val realIuCfg = iuCfg.map(x => x.filter(_.isInstanceOf[IntRD])).flatten 459 iuRdata.zip(realIuCfg) 460 .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[IntRD] } 461 .foreach { case (sink, cfg) => sink := intRfRdata(cfg.port) } 462 } 463 } 464 465 println(s"[DataPath] s1_fpPregRData.flatten.flatten.size: ${s1_fpPregRData.flatten.flatten.size}, fpRfRdata.size: ${fpRfRdata.size}") 466 s1_fpPregRData.foreach(_.foreach(_.foreach(_ := 0.U))) 467 s1_fpPregRData.zip(rfrPortConfigs).foreach { case (iqRdata, iqCfg) => 468 iqRdata.zip(iqCfg).foreach { case (iuRdata, iuCfg) => 469 val realIuCfg = iuCfg.map(x => x.filter(_.isInstanceOf[FpRD])).flatten 470 iuRdata.zip(realIuCfg) 471 .filter { case (_, rfrPortConfig) => 
rfrPortConfig.isInstanceOf[FpRD] } 472 .foreach { case (sink, cfg) => sink := fpRfRdata(cfg.port) } 473 } 474 } 475 476 println(s"[DataPath] s1_vfPregRData.flatten.flatten.size: ${s1_vfPregRData.flatten.flatten.size}, vfRfRdata.size: ${vfRfRdata.size}") 477 s1_vfPregRData.foreach(_.foreach(_.foreach(_ := 0.U))) 478 s1_vfPregRData.zip(rfrPortConfigs).foreach{ case(iqRdata, iqCfg) => 479 iqRdata.zip(iqCfg).foreach{ case(iuRdata, iuCfg) => 480 val realIuCfg = iuCfg.map(x => x.filter(_.isInstanceOf[VfRD])).flatten 481 iuRdata.zip(realIuCfg) 482 .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[VfRD] } 483 .foreach { case (sink, cfg) => sink := vfRfRdata(cfg.port) } 484 } 485 } 486 487 println(s"[DataPath] s1_v0PregRData.flatten.flatten.size: ${s1_v0PregRData.flatten.flatten.size}, v0RfRdata.size: ${v0RfRdata.size}") 488 s1_v0PregRData.foreach(_.foreach(_.foreach(_ := 0.U))) 489 s1_v0PregRData.zip(rfrPortConfigs).foreach{ case(iqRdata, iqCfg) => 490 iqRdata.zip(iqCfg).foreach{ case(iuRdata, iuCfg) => 491 val realIuCfg = iuCfg.map(x => x.filter(_.isInstanceOf[V0RD])).flatten 492 iuRdata.zip(realIuCfg) 493 .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[V0RD] } 494 .foreach { case (sink, cfg) => sink := v0RfRdata(cfg.port) } 495 } 496 } 497 498 println(s"[DataPath] s1_vlPregRData.flatten.flatten.size: ${s1_vlPregRData.flatten.flatten.size}, vlRfRdata.size: ${vlRfRdata.size}") 499 s1_vlPregRData.foreach(_.foreach(_.foreach(_ := 0.U))) 500 s1_vlPregRData.zip(rfrPortConfigs).foreach{ case(iqRdata, iqCfg) => 501 iqRdata.zip(iqCfg).foreach{ case(iuRdata, iuCfg) => 502 val realIuCfg = iuCfg.map(x => x.filter(_.isInstanceOf[VlRD])).flatten 503 iuRdata.zip(realIuCfg) 504 .filter { case (_, rfrPortConfig) => rfrPortConfig.isInstanceOf[VlRD] } 505 .foreach { case (sink, cfg) => sink := vlRfRdata(cfg.port) } 506 } 507 } 508 509 val og0_cancel_no_load = VecInit(og0FailedVec2.flatten.zip(params.allExuParams).filter(!_._2.hasLoadFu).map(_._1).toSeq) 510 
val exuParamsNoLoad = fromIQ.flatten.zip(params.allExuParams).filter(!_._2.hasLoadFu) 511 val is_0latency = Wire(Vec(og0_cancel_no_load.size, Bool())) 512 is_0latency := exuParamsNoLoad.map(x => is0latency(x._1.bits.common.fuType)) 513 val og0_cancel_delay = RegNext(VecInit(og0_cancel_no_load.zip(is_0latency).map(x => x._1 && x._2))) 514 val isVfScheduler = VecInit(exuParamsNoLoad.map(x => x._2.schdType.isInstanceOf[VfScheduler].B)) 515 val og0_cancel_delay_for_mem = VecInit(og0_cancel_delay.zip(isVfScheduler).map(x => x._1 && !x._2)) 516 for (i <- fromIQ.indices) { 517 for (j <- fromIQ(i).indices) { 518 // IQ(s0) --[Ctrl]--> s1Reg ---------- begin 519 // refs 520 val s1_valid = s1_toExuValid(i)(j) 521 val s1_ready = s1_toExuReady(i)(j) 522 val s1_data = s1_toExuData(i)(j) 523 val s1_addrOH = s1_addrOHs(i)(j) 524 val s0 = fromIQ(i)(j) // s0 525 526 val srcNotBlock = Wire(Bool()) 527 srcNotBlock := s0.bits.common.dataSources.zip(intRdArbWinner(i)(j) zip fpRdArbWinner(i)(j) zip vfRdArbWinner(i)(j) zip v0RdArbWinner(i)(j) zip vlRdArbWinner(i)(j)).map { 528 case (source, ((((win_int, win_fp), win_vf), win_v0), win_vl)) => 529 !source.readReg || win_int && win_fp && win_vf && win_v0 && win_vl 530 }.fold(true.B)(_ && _) 531 val notBlock = srcNotBlock && intWbNotBlock(i)(j) && fpWbNotBlock(i)(j) && vfWbNotBlock(i)(j) && v0WbNotBlock(i)(j) && vlWbNotBlock(i)(j) 532 val s1_flush = s0.bits.common.robIdx.needFlush(Seq(io.flush, RegNextWithEnable(io.flush))) 533 val s1_cancel = og1FailedVec2(i)(j) 534 val s0_cancel = Wire(Bool()) 535 val og0_cancel_delay_need = if (s0.bits.exuParams.schdType.isInstanceOf[MemScheduler]) og0_cancel_delay_for_mem else og0_cancel_delay 536 if (s0.bits.exuParams.isIQWakeUpSink) { 537 val exuOHNoLoad = s0.bits.common.l1ExuOH.get.map(x => x.asTypeOf(Vec(x.getWidth, Bool())).zip(params.allExuParams).filter(!_._2.hasLoadFu).map(_._1)) 538 s0_cancel := exuOHNoLoad.zip(s0.bits.common.dataSources).map{ 539 case (exuOH, dataSource) => 
// (continuation) last operand of the s0_cancel reduction whose opening lines precede this chunk
            (VecInit(exuOH).asUInt & og0_cancel_delay_need.asUInt).orR && dataSource.readForward
        }.reduce(_ || _) && s0.valid
      } else s0_cancel := false.B
      // The LoadShouldCancel result gates both the s1 capture and s0.ready below.
      val s0_ldCancel = LoadShouldCancel(s0.bits.common.loadDependency, io.ldCancel)
      when (s0.fire && !s1_flush && notBlock && !s1_cancel && !s0_ldCancel && !s0_cancel) {
        s1_valid := s0.valid
        s1_data.fromIssueBundle(s0.bits) // no src data here
        s1_addrOH := s0.bits.addrOH
      }.otherwise {
        s1_valid := false.B
      }
      s0.ready := (s1_ready || !s1_valid) && notBlock && !s1_cancel && !s0_ldCancel && !s0_cancel
      // IQ(s0) --[Ctrl]--> s1Reg ---------- end
    }
  }

  // Per-port handshake results, indexed as (issue queue)(issue unit).
  private val fromIQFire = fromIQ.map(_.map(_.fire))
  private val toExuFire = toExu.map(_.map(_.fire))

  // Drive the OG0 / OG1 responses sent back to every issue unit (IU) of every issue queue.
  toIQs.zipWithIndex.foreach { case (toIQ, iqIdx) =>
    toIQ.zipWithIndex.foreach { case (toIU, iuIdx) =>
      // ---- OG0: the IQ offered a uop this cycle but the handshake did not fire ----
      val issueReq = fromIQ(iqIdx)(iuIdx)
      val og0Failed = og0FailedVec2(iqIdx)(iuIdx)
      val og0resp = toIU.og0resp
      og0Failed := issueReq.valid && (!fromIQFire(iqIdx)(iuIdx))
      og0resp.valid := og0Failed
      og0resp.bits.robIdx := issueReq.bits.common.robIdx
      og0resp.bits.uopIdx.foreach(_ := issueReq.bits.common.vpu.get.vuopIdx)
      og0resp.bits.resp := RespType.block
      og0resp.bits.fuType := issueReq.bits.common.fuType

      // ---- OG1: the s1 register held a valid uop; it fails if the EXU did not take it ----
      val exuValid = s1_toExuValid(iqIdx)(iuIdx)
      val exuData = s1_toExuData(iqIdx)(iuIdx)
      val og1Failed = og1FailedVec2(iqIdx)(iuIdx)
      val og1resp = toIU.og1resp
      og1Failed := exuValid && !toExuFire(iqIdx)(iuIdx)
      og1resp.valid := exuValid
      og1resp.bits.robIdx := exuData.robIdx
      og1resp.bits.uopIdx.foreach(_ := exuData.vpu.get.vuopIdx)
      // respType:  fuIdle      ->IQ entry clear
      //            fuUncertain ->IQ entry no action
      //            fuBusy      ->IQ entry issued set false, then re-issue
      // hyu, lda and sta are fuUncertain at OG1 stage
      // and all vector arith exu should check success in og2 stage
      val iqParams = toIU.issueQueueParams
      // Elaboration-time choice: which response a uop gets when it was NOT blocked at OG1.
      val respWhenNotBlocked =
        if (iqParams.isLdAddrIQ || iqParams.isStAddrIQ || iqParams.isHyAddrIQ ||
            iqParams.isVecLduIQ || iqParams.isVecStuIQ || iqParams.inVfSchd)
          RespType.uncertain
        else
          RespType.success
      og1resp.bits.resp := Mux(og1Failed, RespType.block, respWhenNotBlocked)
      og1resp.bits.fuType := exuData.fuType
    }
  }

  // One bit per flattened port: asserted when a valid request did not fire this cycle.
  io.og0CancelOH := VecInit(fromFlattenIQ.map(req => req.valid && !req.fire)).asUInt
  io.og1CancelOH := VecInit(toFlattenExu.map(exu => exu.valid && !exu.fire)).asUInt

  // Report every OG0-cancelled uop together with its destination write-enables and pdest.
  for (i <- io.cancelToBusyTable.indices) {
    val cancel = io.cancelToBusyTable(i)
    val issueReq = fromFlattenIQ(i)
    val common = issueReq.bits.common
    cancel.valid := issueReq.valid && !issueReq.fire
    // Optional write-enable fields default to false when the port does not have them.
    cancel.bits.rfWen := common.rfWen.getOrElse(false.B)
    cancel.bits.fpWen := common.fpWen.getOrElse(false.B)
    cancel.bits.vecWen := common.vecWen.getOrElse(false.B)
    cancel.bits.v0Wen := common.v0Wen.getOrElse(false.B)
    cancel.bits.vlWen := common.vlWen.getOrElse(false.B)
    cancel.bits.pdest := common.pdest
  }

  if (backendParams.debugEn) {
    dontTouch(og0_cancel_no_load)
    dontTouch(is_0latency)
    dontTouch(og0_cancel_delay)
    dontTouch(isVfScheduler)
    dontTouch(og0_cancel_delay_for_mem)
  }

  for (i <- toExu.indices; j <- toExu(i).indices) {
    // s1Reg --[Ctrl]--> exu(s1) ---------- begin
    val exuPort = toExu(i)(j)
    val sinkData = exuPort.bits
    exuPort.valid := s1_toExuValid(i)(j)
    s1_toExuReady(i)(j) := exuPort.ready
    sinkData := s1_toExuData(i)(j)
    // s1Reg --[Ctrl]--> exu(s1) ---------- end

    // s1Reg --[Data]--> exu(s1) ---------- begin
    // data source1: preg read data
    for (k <- sinkData.src.indices) {
      val srcDataTypeSet: Set[DataConfig] = sinkData.params.getSrcDataType(k)
      // Kept as a def so the lookup happens exactly where the original expression evaluated it.
      def srcType = s1_srcType(i)(j)(k)
      // Source 3 can only come from the V0 file, source 4 only from the Vl file;
      // every other source may come from the Int, Vec or Fp file.
      val candidates: Seq[Option[(Bool, UInt)]] = k match {
        case 3 =>
          Seq(
            OptionWrapper(s1_v0PregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(V0RegSrcDataSet).nonEmpty,
              (SrcType.isV0(srcType) -> s1_v0PregRData(i)(j)(k)))
          )
        case 4 =>
          Seq(
            OptionWrapper(s1_vlPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(VlRegSrcDataSet).nonEmpty,
              (SrcType.isVp(srcType) -> s1_vlPregRData(i)(j)(k)))
          )
        case _ =>
          Seq(
            OptionWrapper(s1_intPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(IntRegSrcDataSet).nonEmpty,
              (SrcType.isXp(srcType) -> s1_intPregRData(i)(j)(k))),
            OptionWrapper(s1_vfPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(VecRegSrcDataSet).nonEmpty,
              (SrcType.isVp(srcType) -> s1_vfPregRData(i)(j)(k))),
            OptionWrapper(s1_fpPregRData(i)(j).isDefinedAt(k) && srcDataTypeSet.intersect(FpRegSrcDataSet).nonEmpty,
              (SrcType.isFp(srcType) -> s1_fpPregRData(i)(j)(k)))
          )
      }
      val readRfMap: Seq[(Bool, UInt)] = candidates.flatten

      // Only override the default connection when at least one register file feeds this source.
      if (readRfMap.nonEmpty)
        sinkData.src(k) := Mux1H(readRfMap)
    }

    // Position of this EXU among the ports that read the PC/target memory.
    def pcReadIndex = pcReadFtqPtrFormIQ.map(_.bits.exuParams).indexOf(sinkData.params)
    if (sinkData.params.hasJmpFu) {
      sinkData.pc.get := pcRdata(pcReadIndex)
    }
    if (sinkData.params.needTarget) {
      sinkData.predictInfo.get.target := targetPCRdata(pcReadIndex)
    }
  }

  // Export architectural register state to difftest (block is closed after the Vec value hookup).
  if (env.AlwaysBasicDiff || env.EnableDifftest) {
    val delayedCnt = 2
    val difftestArchIntRegState = DifftestModule(new DiffArchIntRegState, delay = delayedCnt)
    difftestArchIntRegState.coreid := io.hartId
    difftestArchIntRegState.value := intDebugRead.get._2

    val difftestArchFpRegState = DifftestModule(new DiffArchFpRegState, delay = delayedCnt)
    difftestArchFpRegState.coreid := io.hartId
    difftestArchFpRegState.value := fpDebugReadData.get

    val difftestArchVecRegState = DifftestModule(new DiffArchVecRegState, delay = delayedCnt)
    difftestArchVecRegState.coreid := io.hartId
// Last hookup of the difftest export block opened above, then the register-cache models.
    difftestArchVecRegState.value := vecDebugReadData.get
  }

  // ---- Integer register-cache model (statistics only) ----
  // Records the destination pregs of recent integer RF writes in a circular tag buffer.
  // Within one cycle, write port i lands at enqPtr + (number of enabled ports below i).
  // NOTE(review): the pointer is log2Up(48) = 6 bits wide, so it counts 0..63 while the tag
  // Vec only has 48 entries; indices 48..63 look out of range for the Vec -- confirm intended.
  val int_regcache_size = 48
  val int_regcache_tag = RegInit(VecInit(Seq.fill(int_regcache_size)(0.U(intSchdParams.pregIdxWidth.W))))
  val int_regcache_enqPtr = RegInit(0.U(log2Up(int_regcache_size).W))
  int_regcache_enqPtr := int_regcache_enqPtr + PopCount(intRfWen)
  for (i <- intRfWen.indices) {
    when (intRfWen(i)) {
      int_regcache_tag(int_regcache_enqPtr + PopCount(intRfWen.take(i))) := intRfWaddr(i)
    }
  }

  // ---- Vector register-cache model: same scheme, driven by the first entry of vfRfWen ----
  val vf_regcache_size = 48
  val vf_regcache_tag = RegInit(VecInit(Seq.fill(vf_regcache_size)(0.U(vfSchdParams.pregIdxWidth.W))))
  val vf_regcache_enqPtr = RegInit(0.U(log2Up(vf_regcache_size).W))
  vf_regcache_enqPtr := vf_regcache_enqPtr + PopCount(vfRfWen.head)
  // Iterate the write ports of vfRfWen.head (the collection actually indexed below), not the
  // outer vfRfWen collection, so that every counted write also records its tag.
  for (i <- vfRfWen.head.indices) {
    when (vfRfWen.head(i)) {
      vf_regcache_tag(vf_regcache_enqPtr + PopCount(vfRfWen.head.take(i))) := vfRfWaddr(i)
    }
  }

  // Per-cycle distribution of register-file read requests and write requests.
  XSPerfHistogram(s"IntRegFileRead_hist", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 20, 1)
  XSPerfHistogram(s"FpRegFileRead_hist", PopCount(fpRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 20, 1)
  XSPerfHistogram(s"VfRegFileRead_hist", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 20, 1)
  XSPerfHistogram(s"IntRegFileWrite_hist", PopCount(intRFWriteReq.flatten), true.B, 0, 20, 1)
  XSPerfHistogram(s"FpRegFileWrite_hist", PopCount(fpRFWriteReq.flatten), true.B, 0, 20, 1)
  XSPerfHistogram(s"VfRegFileWrite_hist", PopCount(vfRFWriteReq.flatten), true.B, 0, 20, 1)

  // Windows over the tags at enqPtr - 1 .. enqPtr - N, used to model smaller caches.
  // `1 to N` yields exactly N entries; the 24-entry window previously used `1 until 24`,
  // which only covered 23 entries and under-counted the 24-entry hit statistic.
  val int_regcache_part32 = (1 to 32).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
  val int_regcache_part24 = (1 to 24).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
  val int_regcache_part16 = (1 to 16).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))
  val int_regcache_part8 = (1 to 8).map(i => int_regcache_tag(int_regcache_enqPtr - i.U))

// ---- Integer register-cache hit statistics and RF-read / uop arbitration counters ----
  // Every integer RF read request presented to the read arbiter, flattened over IQ/port/source.
  private val intRegCacheReadReqs = intRFReadArbiter.io.in.flatten.flatten

  /** For each integer read request: valid and its address equals one of the given tags. */
  private def intRegCacheHits(tags: Iterable[UInt]) =
    intRegCacheReadReqs.map { req =>
      val tagMatch = tags.map(_ === req.bits.addr).reduce(_ || _)
      req.valid && tagMatch
    }

  val int_regcache_48_hit_vec = intRegCacheHits(int_regcache_tag)
  val int_regcache_8_hit_vec = intRegCacheHits(int_regcache_part8)
  val int_regcache_16_hit_vec = intRegCacheHits(int_regcache_part16)
  val int_regcache_24_hit_vec = intRegCacheHits(int_regcache_part24)
  val int_regcache_32_hit_vec = intRegCacheHits(int_regcache_part32)

  // Hits per cycle for each modelled cache size.
  XSPerfAccumulate("IntRegCache48Hit", PopCount(int_regcache_48_hit_vec))
  XSPerfAccumulate("IntRegCache8Hit", PopCount(int_regcache_8_hit_vec))
  XSPerfAccumulate("IntRegCache16Hit", PopCount(int_regcache_16_hit_vec))
  XSPerfAccumulate("IntRegCache24Hit", PopCount(int_regcache_24_hit_vec))
  XSPerfAccumulate("IntRegCache32Hit", PopCount(int_regcache_32_hit_vec))
  XSPerfHistogram("IntRegCache48Hit_hist", PopCount(int_regcache_48_hit_vec), true.B, 0, 16, 2)

  // Register-file read requests before (arbiter inputs) and after (arbiter outputs) arbitration.
  XSPerfAccumulate("IntRFReadBeforeArb", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)))
  XSPerfAccumulate("IntRFReadAfterArb", PopCount(intRFReadArbiter.io.out.map(_.valid)))
  XSPerfAccumulate("FpRFReadBeforeArb", PopCount(fpRFReadArbiter.io.in.flatten.flatten.map(_.valid)))
  XSPerfAccumulate("FpRFReadAfterArb", PopCount(fpRFReadArbiter.io.out.map(_.valid)))
  XSPerfAccumulate("VfRFReadBeforeArb", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)))
  XSPerfAccumulate("VfRFReadAfterArb", PopCount(vfRFReadArbiter.io.out.map(_.valid)))
  // Integer uops offered by the IQs (valid) versus accepted by the datapath (fire).
  XSPerfAccumulate("IntUopBeforeArb", PopCount(fromIntIQ.flatten.map(_.valid)))
  XSPerfAccumulate("IntUopAfterArb", PopCount(fromIntIQ.flatten.map(_.fire)))
// ---- Remaining uop arbitration counters, histograms, end of DataPathImp, and DataPathIO ----
  // Uops offered by the issue queues (valid) versus accepted by the datapath (fire).
  // The FP issue queues are counted as well, so that every scheduler feeding the datapath
  // (Int counters are registered just above, then Fp / Mem / Vf here) is covered.
  XSPerfAccumulate(s"FpUopBeforeArb", PopCount(fromFpIQ.flatten.map(_.valid)))
  XSPerfAccumulate(s"FpUopAfterArb", PopCount(fromFpIQ.flatten.map(_.fire)))
  XSPerfAccumulate(s"MemUopBeforeArb", PopCount(fromMemIQ.flatten.map(_.valid)))
  XSPerfAccumulate(s"MemUopAfterArb", PopCount(fromMemIQ.flatten.map(_.fire)))
  XSPerfAccumulate(s"VfUopBeforeArb", PopCount(fromVfIQ.flatten.map(_.valid)))
  XSPerfAccumulate(s"VfUopAfterArb", PopCount(fromVfIQ.flatten.map(_.fire)))

  // Per-cycle distributions of RF read requests before / after read arbitration.
  XSPerfHistogram(s"IntRFReadBeforeArb_hist", PopCount(intRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 16, 2)
  XSPerfHistogram(s"IntRFReadAfterArb_hist", PopCount(intRFReadArbiter.io.out.map(_.valid)), true.B, 0, 16, 2)
  XSPerfHistogram(s"FpRFReadBeforeArb_hist", PopCount(fpRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 16, 2)
  XSPerfHistogram(s"FpRFReadAfterArb_hist", PopCount(fpRFReadArbiter.io.out.map(_.valid)), true.B, 0, 16, 2)
  XSPerfHistogram(s"VfRFReadBeforeArb_hist", PopCount(vfRFReadArbiter.io.in.flatten.flatten.map(_.valid)), true.B, 0, 16, 2)
  XSPerfHistogram(s"VfRFReadAfterArb_hist", PopCount(vfRFReadArbiter.io.out.map(_.valid)), true.B, 0, 16, 2)
  // Per-cycle distributions of offered / accepted uops for each scheduler.
  XSPerfHistogram(s"IntUopBeforeArb_hist", PopCount(fromIntIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
  XSPerfHistogram(s"IntUopAfterArb_hist", PopCount(fromIntIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
  XSPerfHistogram(s"FpUopBeforeArb_hist", PopCount(fromFpIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
  XSPerfHistogram(s"FpUopAfterArb_hist", PopCount(fromFpIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
  XSPerfHistogram(s"MemUopBeforeArb_hist", PopCount(fromMemIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
  XSPerfHistogram(s"MemUopAfterArb_hist", PopCount(fromMemIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
  XSPerfHistogram(s"VfUopBeforeArb_hist", PopCount(fromVfIQ.flatten.map(_.valid)), true.B, 0, 8, 2)
  XSPerfHistogram(s"VfUopAfterArb_hist", PopCount(fromVfIQ.flatten.map(_.fire)), true.B, 0, 8, 2)
}

/**
  * IO bundle of the [[DataPath]] module.
  *
  * Port shapes are derived from the scheduler parameters of the Int, Fp, Vf and Mem
  * schedulers found in `params`. The bundle groups:
  *  - issue requests coming from the issue queues (`from*IQ`, flipped decoupled ports),
  *  - OG0/OG1 responses going back to the issue queues (`to*IQ`),
  *  - issued uops going to the execution units (`to*Exu`),
  *  - cancel information (`og0CancelOH`, `og1CancelOH`, `ldCancel`, `cancelToBusyTable`),
  *  - register-file write-back ports (`from*Wb`),
  *  - PC/target memory access (`fromPcTargetMem`) and optional debug ports.
  *
  * @param p      implicit global configuration
  * @param params implicit backend parameters that determine all port counts
  */
class DataPathIO()(implicit p: Parameters, params: BackendParams) extends XSBundle {
  // params
  private val intSchdParams = params.schdParams(IntScheduler())
  private val fpSchdParams = params.schdParams(FpScheduler())
  private val vfSchdParams = params.schdParams(VfScheduler())
  private val memSchdParams = params.schdParams(MemScheduler())
  // bundles
  val hartId = Input(UInt(8.W))

  val flush: ValidIO[Redirect] = Flipped(ValidIO(new Redirect))

  // One write-back-conflict bundle per issue block of every scheduler (field name kept as-is, sic).
  val wbConfictRead = Input(MixedVec(params.allSchdParams.map(x => MixedVec(x.issueBlockParams.map(x => x.genWbConflictBundle())))))

  // ---- issue requests from the issue queues: one inner MixedVec per issue block ----
  val fromIntIQ: MixedVec[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] =
    Flipped(MixedVec(intSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))

  val fromFpIQ: MixedVec[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] =
    Flipped(MixedVec(fpSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))

  val fromMemIQ: MixedVec[MixedVec[DecoupledIO[IssueQueueIssueBundle]]] =
    Flipped(MixedVec(memSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))

  val fromVfIQ = Flipped(MixedVec(vfSchdParams.issueBlockParams.map(_.genIssueDecoupledBundle)))

  // ---- OG responses back to the issue queues ----
  val toIntIQ = MixedVec(intSchdParams.issueBlockParams.map(_.genOGRespBundle))

  val toFpIQ = MixedVec(fpSchdParams.issueBlockParams.map(_.genOGRespBundle))

  val toMemIQ = MixedVec(memSchdParams.issueBlockParams.map(_.genOGRespBundle))

  val toVfIQ = MixedVec(vfSchdParams.issueBlockParams.map(_.genOGRespBundle))

  // ---- cancel information; the OH vectors and cancelToBusyTable are sized by numExu ----
  val og0CancelOH = Output(ExuOH(backendParams.numExu))

  val og1CancelOH = Output(ExuOH(backendParams.numExu))

  // One load-cancel port per load unit and per hybrid unit.
  val ldCancel = Vec(backendParams.LduCnt + backendParams.HyuCnt, Flipped(new LoadCancelIO))

  val cancelToBusyTable = Vec(backendParams.numExu, ValidIO(new CancelSignal))

  // ---- issued uops to the execution units ----
  val toIntExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = intSchdParams.genExuInputBundle

  val toFpExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = MixedVec(fpSchdParams.genExuInputBundle)

  val toVecExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = MixedVec(vfSchdParams.genExuInputBundle)

  val toMemExu: MixedVec[MixedVec[DecoupledIO[ExuInput]]] = memSchdParams.genExuInputBundle

  // One ImmInfo entry per execution unit.
  val og1ImmInfo: Vec[ImmInfo] = Output(Vec(params.allExuParams.size, new ImmInfo))

  // ---- register-file write-back ports, one group per register file ----
  val fromIntWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genIntWriteBackBundle)

  val fromFpWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genFpWriteBackBundle)

  val fromVfWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genVfWriteBackBundle)

  val fromV0Wb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genV0WriteBackBundle)

  val fromVlWb: MixedVec[RfWritePortWithConfig] = MixedVec(params.genVlWriteBackBundle)

  val fromPcTargetMem = Flipped(new PcToDataPathIO(params))

  // ---- debug-only ports, present only when params.debugEn is set ----
  val debugIntRat = if (params.debugEn) Some(Input(Vec(32, UInt(intSchdParams.pregIdxWidth.W)))) else None
  val debugFpRat = if (params.debugEn) Some(Input(Vec(32, UInt(fpSchdParams.pregIdxWidth.W)))) else None
  // NOTE(review): 31 entries rather than 32 -- presumably because v0 is carried by debugV0Rat; confirm.
  val debugVecRat = if (params.debugEn) Some(Input(Vec(31, UInt(vfSchdParams.pregIdxWidth.W)))) else None
  val debugV0Rat = if (params.debugEn) Some(Input(UInt(log2Up(V0PhyRegs).W))) else None
  val debugVlRat = if (params.debugEn) Some(Input(UInt(log2Up(VlPhyRegs).W))) else None
  val debugVl = if (params.debugEn) Some(Output(UInt(VlData().dataWidth.W))) else None
}
