xref: /XiangShan/src/main/scala/xiangshan/backend/exu/ExeUnit.scala (revision 039cdc35f5f3b68b6295ec5ace90f22a77322e02)
1/***************************************************************************************
2* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3* Copyright (c) 2020-2021 Peng Cheng Laboratory
4*
5* XiangShan is licensed under Mulan PSL v2.
6* You can use this software according to the terms and conditions of the Mulan PSL v2.
7* You may obtain a copy of Mulan PSL v2 at:
8*          http://license.coscl.org.cn/MulanPSL2
9*
10* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13*
14* See the Mulan PSL v2 for more details.
15***************************************************************************************/
16
17package xiangshan.backend.exu
18
19import org.chipsalliance.cde.config.Parameters
20import chisel3._
21import chisel3.experimental.hierarchy.{Definition, instantiable}
22import chisel3.util._
23import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp}
24import utility._
25import xiangshan.backend.fu.{CSRFileIO, FenceIO, FuncUnitInput}
26import xiangshan.backend.Bundles.{ExuInput, ExuOutput, MemExuInput, MemExuOutput}
27import xiangshan.{FPUCtrlSignals, HasXSParameter, Redirect, XSBundle, XSModule}
28import xiangshan.backend.datapath.WbConfig.{PregWB, _}
29import xiangshan.backend.fu.FuType
30import xiangshan.backend.fu.vector.Bundles.{VType, Vxrm}
31import xiangshan.backend.fu.fpu.Bundles.Frm
32
33class ExeUnitIO(params: ExeUnitParams)(implicit p: Parameters) extends XSBundle {
34  val flush = Flipped(ValidIO(new Redirect()))
35  val in = Flipped(DecoupledIO(new ExuInput(params)))
36  val out = DecoupledIO(new ExuOutput(params))
37  val csrio = Option.when(params.hasCSR)(new CSRFileIO)
38  val fenceio = Option.when(params.hasFence)(new FenceIO)
39  val frm = Option.when(params.needSrcFrm)(Input(Frm()))
40  val vxrm = Option.when(params.needSrcVxrm)(Input(Vxrm()))
41  val vtype = Option.when(params.writeVConfig)((Valid(new VType)))
42  val vlIsZero = Option.when(params.writeVConfig)(Output(Bool()))
43  val vlIsVlmax = Option.when(params.writeVConfig)(Output(Bool()))
44}
45
46class ExeUnit(val exuParams: ExeUnitParams)(implicit p: Parameters) extends LazyModule {
47  override def shouldBeInlined: Boolean = false
48
49  lazy val module = new ExeUnitImp(this)(p, exuParams)
50}
51
52class ExeUnitImp(
53  override val wrapper: ExeUnit
54)(implicit
55  p: Parameters, exuParams: ExeUnitParams
56) extends LazyModuleImp(wrapper) with HasXSParameter{
57  private val fuCfgs = exuParams.fuConfigs
58
59  val io = IO(new ExeUnitIO(exuParams))
60
61  val funcUnits = fuCfgs.map(cfg => {
62    assert(cfg.fuGen != null, cfg.name + "Cfg'fuGen is null !!!")
63    val module = cfg.fuGen(p, cfg)
64    module
65  })
66
67  if (EnableClockGate) {
68    fuCfgs.zip(funcUnits).foreach { case (cfg, fu) =>
69      val clk_en = WireInit(false.B)
70      val fuVld_en = WireInit(false.B)
71      val fuVld_en_reg = RegInit(false.B)
72      val uncer_en_reg = RegInit(false.B)
73
74      def latReal: Int = cfg.latency.latencyVal.getOrElse(0)
75      def extralat: Int = cfg.latency.extraLatencyVal.getOrElse(0)
76
77      val uncerLat = cfg.latency.uncertainEnable.nonEmpty
78      val lat0 = (latReal == 0 && !uncerLat).asBool
79      val latN = (latReal >  0 && !uncerLat).asBool
80
81      val fuVldVec = (io.in.valid && latN) +: Seq.fill(latReal)(RegInit(false.B))
82      val fuRdyVec = Seq.fill(latReal)(Wire(Bool())) :+ io.out.ready
83
84      for (i <- 0 until latReal) {
85        fuRdyVec(i) := !fuVldVec(i + 1) || fuRdyVec(i + 1)
86      }
87
88      for (i <- 1 to latReal) {
89        when(fuRdyVec(i - 1) && fuVldVec(i - 1)) {
90          fuVldVec(i) := fuVldVec(i - 1)
91        }.elsewhen(fuRdyVec(i)) {
92          fuVldVec(i) := false.B
93        }
94      }
95      fuVld_en := fuVldVec.map(v => v).reduce(_ || _)
96      fuVld_en_reg := fuVld_en
97
98      when(uncerLat.asBool && io.in.fire) {
99        uncer_en_reg := true.B
100      }.elsewhen(uncerLat.asBool && io.out.fire) {
101        uncer_en_reg := false.B
102      }
103
104      when(lat0 && io.in.fire) {
105        clk_en := true.B
106      }.elsewhen(latN && fuVld_en || fuVld_en_reg) {
107        clk_en := true.B
108      }.elsewhen(uncerLat.asBool && io.in.fire || uncer_en_reg) {
109        clk_en := true.B
110      }
111
112      if (cfg.ckAlwaysEn) {
113        clk_en := true.B
114      }
115
116      fu.clock := ClockGate(false.B, clk_en, clock)
117      XSPerfAccumulate(s"clock_gate_en_${fu.cfg.name}", clk_en)
118    }
119  }
120
121  val busy = RegInit(false.B)
122  if (exuParams.latencyCertain){
123    busy := false.B
124  }
125  else {
126    val robIdx = RegEnable(io.in.bits.robIdx, io.in.fire)
127    when(io.in.fire && io.in.bits.robIdx.needFlush(io.flush)) {
128      busy := false.B
129    }.elsewhen(busy && robIdx.needFlush(io.flush)) {
130      busy := false.B
131    }.elsewhen(io.out.fire) {
132      busy := false.B
133    }.elsewhen(io.in.fire) {
134      busy := true.B
135    }
136  }
137
138  exuParams.wbPortConfigs.map{
139    x => x match {
140      case IntWB(port, priority) => assert(priority >= 0 && priority <= 2,
141        s"${exuParams.name}: WbPort must priority=0 or priority=1")
142      case FpWB(port, priority) => assert(priority >= 0 && priority <= 2,
143        s"${exuParams.name}: WbPort must priority=0 or priority=1")
144      case VfWB (port, priority) => assert(priority >= 0 && priority <= 2,
145        s"${exuParams.name}: WbPort must priority=0 or priority=1")
146      case _ =>
147    }
148  }
149  val intWbPort = exuParams.getIntWBPort
150  if (intWbPort.isDefined){
151    val sameIntPortExuParam = backendParams.allExuParams.filter(_.getIntWBPort.isDefined)
152      .filter(_.getIntWBPort.get.port == intWbPort.get.port)
153    val samePortOneCertainOneUncertain = sameIntPortExuParam.map(_.latencyCertain).contains(true) && sameIntPortExuParam.map(_.latencyCertain).contains(false)
154    if (samePortOneCertainOneUncertain) sameIntPortExuParam.map(samePort =>
155      samePort.wbPortConfigs.map(
156        x => x match {
157          case IntWB(port, priority) => {
158            if (!samePort.latencyCertain) assert(priority == sameIntPortExuParam.size - 1,
159              s"${samePort.name}: IntWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=max(${sameIntPortExuParam.size - 1})")
160            // Certain latency can be handled by WbBusyTable, so there is no need to limit the exu's WB priority
161          }
162          case _ =>
163        }
164      )
165    )
166  }
167  val fpWbPort = exuParams.getFpWBPort
168  if (fpWbPort.isDefined) {
169    val sameFpPortExuParam = backendParams.allExuParams.filter(_.getFpWBPort.isDefined)
170      .filter(_.getFpWBPort.get.port == fpWbPort.get.port)
171    val samePortOneCertainOneUncertain = sameFpPortExuParam.map(_.latencyCertain).contains(true) && sameFpPortExuParam.map(_.latencyCertain).contains(false)
172    if (samePortOneCertainOneUncertain) sameFpPortExuParam.map(samePort =>
173      samePort.wbPortConfigs.map(
174        x => x match {
175          case FpWB(port, priority) => {
176            if (!samePort.latencyCertain) assert(priority == sameFpPortExuParam.size - 1,
177              s"${samePort.name}: FpWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=max(${sameFpPortExuParam.size - 1})")
178            // Certain latency can be handled by WbBusyTable, so there is no need to limit the exu's WB priority
179          }
180          case _ =>
181        }
182      )
183    )
184  }
185  val vfWbPort = exuParams.getVfWBPort
186  if (vfWbPort.isDefined) {
187    val sameVfPortExuParam = backendParams.allExuParams.filter(_.getVfWBPort.isDefined)
188      .filter(_.getVfWBPort.get.port == vfWbPort.get.port)
189    val samePortOneCertainOneUncertain = sameVfPortExuParam.map(_.latencyCertain).contains(true) && sameVfPortExuParam.map(_.latencyCertain).contains(false)
190    if (samePortOneCertainOneUncertain)  sameVfPortExuParam.map(samePort =>
191      samePort.wbPortConfigs.map(
192        x => x match {
193          case VfWB(port, priority) => {
194            if (!samePort.latencyCertain) assert(priority == sameVfPortExuParam.size - 1,
195              s"${samePort.name}: VfWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=max(${sameVfPortExuParam.size - 1})")
196            // Certain latency can be handled by WbBusyTable, so there is no need to limit the exu's WB priority
197          }
198          case _ =>
199        }
200      )
201    )
202  }
203  if(backendParams.debugEn) {
204    dontTouch(io.out.ready)
205  }
206  // rob flush --> funcUnits
207  funcUnits.zipWithIndex.foreach { case (fu, i) =>
208    fu.io.flush <> io.flush
209  }
210
211  def acceptCond(input: ExuInput): Seq[Bool] = {
212    input.params.fuConfigs.map(_.fuSel(input))
213  }
214
215  val in1ToN = Module(new Dispatcher(new ExuInput(exuParams), funcUnits.length, acceptCond))
216
217  // ExeUnit.in <---> Dispatcher.in
218  in1ToN.io.in.valid := io.in.valid && !busy
219  in1ToN.io.in.bits := io.in.bits
220  io.in.ready := !busy && in1ToN.io.in.ready
221
222  // Dispatcher.out <---> FunctionUnits
223  in1ToN.io.out.zip(funcUnits.map(_.io.in)).foreach {
224    case (source: DecoupledIO[ExuInput], sink: DecoupledIO[FuncUnitInput]) =>
225      sink.valid := source.valid
226      source.ready := sink.ready
227
228      sink.bits.data.src.zip(source.bits.src).foreach { case(fuSrc, exuSrc) => fuSrc := exuSrc }
229      sink.bits.data.pc          .foreach(x => x := source.bits.pc.get)
230      sink.bits.data.imm         := source.bits.imm
231      sink.bits.ctrl.fuOpType    := source.bits.fuOpType
232      sink.bits.ctrl.robIdx      := source.bits.robIdx
233      sink.bits.ctrl.pdest       := source.bits.pdest
234      sink.bits.ctrl.rfWen       .foreach(x => x := source.bits.rfWen.get)
235      sink.bits.ctrl.fpWen       .foreach(x => x := source.bits.fpWen.get)
236      sink.bits.ctrl.vecWen      .foreach(x => x := source.bits.vecWen.get)
237      sink.bits.ctrl.v0Wen       .foreach(x => x := source.bits.v0Wen.get)
238      sink.bits.ctrl.vlWen       .foreach(x => x := source.bits.vlWen.get)
239      sink.bits.ctrl.flushPipe   .foreach(x => x := source.bits.flushPipe.get)
240      sink.bits.ctrl.preDecode   .foreach(x => x := source.bits.preDecode.get)
241      sink.bits.ctrl.ftqIdx      .foreach(x => x := source.bits.ftqIdx.get)
242      sink.bits.ctrl.ftqOffset   .foreach(x => x := source.bits.ftqOffset.get)
243      sink.bits.ctrl.predictInfo .foreach(x => x := source.bits.predictInfo.get)
244      sink.bits.ctrl.fpu         .foreach(x => x := source.bits.fpu.get)
245      sink.bits.ctrl.vpu         .foreach(x => x := source.bits.vpu.get)
246      sink.bits.ctrl.vpu         .foreach(x => x.fpu.isFpToVecInst := 0.U)
247      sink.bits.ctrl.vpu         .foreach(x => x.fpu.isFP32Instr   := 0.U)
248      sink.bits.ctrl.vpu         .foreach(x => x.fpu.isFP64Instr   := 0.U)
249      sink.bits.perfDebugInfo    := source.bits.perfDebugInfo
250  }
251
252  private val OutresVecs = funcUnits.map { fu =>
253    def latDiff :Int = fu.cfg.latency.extraLatencyVal.getOrElse(0)
254    val OutresVec = fu.io.out.bits.res +: Seq.fill(latDiff)(Reg(chiselTypeOf(fu.io.out.bits.res)))
255    for (i <- 1 to latDiff) {
256      OutresVec(i) := OutresVec(i - 1)
257    }
258    OutresVec
259  }
260  OutresVecs.foreach(vec => vec.foreach(res =>dontTouch(res)))
261
262  private val fuOutValidOH = funcUnits.map(_.io.out.valid)
263  XSError(PopCount(fuOutValidOH) > 1.U, p"fuOutValidOH ${Binary(VecInit(fuOutValidOH).asUInt)} should be one-hot)\n")
264  private val fuOutBitsVec = funcUnits.map(_.io.out.bits)
265  private val fuOutresVec = OutresVecs.map(_.last)
266  private val fuRedirectVec: Seq[Option[ValidIO[Redirect]]] = fuOutresVec.map(_.redirect)
267
268  // Assume that one fu can only write int or fp or vec,
269  // otherwise, wenVec should be assigned to wen in fu.
270  private val fuIntWenVec = funcUnits.map(x => x.cfg.needIntWen.B && x.io.out.bits.ctrl.rfWen.getOrElse(false.B))
271  private val fuFpWenVec  = funcUnits.map(x => x.cfg.needFpWen.B  && x.io.out.bits.ctrl.fpWen.getOrElse(false.B))
272  private val fuVecWenVec = funcUnits.map(x => x.cfg.needVecWen.B && x.io.out.bits.ctrl.vecWen.getOrElse(false.B))
273  private val fuV0WenVec = funcUnits.map(x => x.cfg.needV0Wen.B && x.io.out.bits.ctrl.v0Wen.getOrElse(false.B))
274  private val fuVlWenVec = funcUnits.map(x => x.cfg.needVlWen.B && x.io.out.bits.ctrl.vlWen.getOrElse(false.B))
275  // FunctionUnits <---> ExeUnit.out
276
277  private val outDataVec = Seq(
278    Some(fuOutresVec.map(_.data)),
279    Option.when(funcUnits.exists(_.cfg.writeIntRf))
280      (funcUnits.zip(fuOutresVec).filter{ case (fu, _) => fu.cfg.writeIntRf}.map{ case(_, fuout) => fuout.data}),
281    Option.when(funcUnits.exists(_.cfg.writeFpRf))
282      (funcUnits.zip(fuOutresVec).filter{ case (fu, _) => fu.cfg.writeFpRf}.map{ case(_, fuout) => fuout.data}),
283    Option.when(funcUnits.exists(_.cfg.writeVecRf))
284      (funcUnits.zip(fuOutresVec).filter{ case (fu, _) => fu.cfg.writeVecRf}.map{ case(_, fuout) => fuout.data}),
285    Option.when(funcUnits.exists(_.cfg.writeV0Rf))
286      (funcUnits.zip(fuOutresVec).filter{ case (fu, _) => fu.cfg.writeV0Rf}.map{ case(_, fuout) => fuout.data}),
287    Option.when(funcUnits.exists(_.cfg.writeVlRf))
288      (funcUnits.zip(fuOutresVec).filter{ case (fu, _) => fu.cfg.writeVlRf}.map{ case(_, fuout) => fuout.data}),
289  ).flatten
290  private val outDataValidOH = Seq(
291    Some(fuOutValidOH),
292    Option.when(funcUnits.exists(_.cfg.writeIntRf))
293      (funcUnits.zip(fuOutValidOH).filter{ case (fu, _) => fu.cfg.writeIntRf}.map{ case(_, fuoutOH) => fuoutOH}),
294    Option.when(funcUnits.exists(_.cfg.writeFpRf))
295      (funcUnits.zip(fuOutValidOH).filter{ case (fu, _) => fu.cfg.writeFpRf}.map{ case(_, fuoutOH) => fuoutOH}),
296    Option.when(funcUnits.exists(_.cfg.writeVecRf))
297      (funcUnits.zip(fuOutValidOH).filter{ case (fu, _) => fu.cfg.writeVecRf}.map{ case(_, fuoutOH) => fuoutOH}),
298    Option.when(funcUnits.exists(_.cfg.writeV0Rf))
299      (funcUnits.zip(fuOutValidOH).filter{ case (fu, _) => fu.cfg.writeV0Rf}.map{ case(_, fuoutOH) => fuoutOH}),
300    Option.when(funcUnits.exists(_.cfg.writeVlRf))
301      (funcUnits.zip(fuOutValidOH).filter{ case (fu, _) => fu.cfg.writeVlRf}.map{ case(_, fuoutOH) => fuoutOH}),
302  ).flatten
303
304  io.out.valid := Cat(fuOutValidOH).orR
305  funcUnits.foreach(fu => fu.io.out.ready := io.out.ready)
306
307  // select one fu's result
308  io.out.bits.data := VecInit(outDataVec.zip(outDataValidOH).map{ case(data, validOH) => Mux1H(validOH, data)})
309  io.out.bits.robIdx := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.robIdx))
310  io.out.bits.pdest := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.pdest))
311  io.out.bits.intWen.foreach(x => x := Mux1H(fuOutValidOH, fuIntWenVec))
312  io.out.bits.fpWen.foreach(x => x := Mux1H(fuOutValidOH, fuFpWenVec))
313  io.out.bits.vecWen.foreach(x => x := Mux1H(fuOutValidOH, fuVecWenVec))
314  io.out.bits.v0Wen.foreach(x => x := Mux1H(fuOutValidOH, fuV0WenVec))
315  io.out.bits.vlWen.foreach(x => x := Mux1H(fuOutValidOH, fuVlWenVec))
316  io.out.bits.redirect.foreach(x => x := Mux1H((fuOutValidOH zip fuRedirectVec).filter(_._2.isDefined).map(x => (x._1, x._2.get))))
317  io.out.bits.fflags.foreach(x => x := Mux1H(fuOutValidOH, fuOutresVec.map(_.fflags.getOrElse(0.U.asTypeOf(io.out.bits.fflags.get)))))
318  io.out.bits.wflags.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.fpu.getOrElse(0.U.asTypeOf(new FPUCtrlSignals)).wflags)))
319  io.out.bits.vxsat.foreach(x => x := Mux1H(fuOutValidOH, fuOutresVec.map(_.vxsat.getOrElse(0.U.asTypeOf(io.out.bits.vxsat.get)))))
320  io.out.bits.exceptionVec.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.exceptionVec.getOrElse(0.U.asTypeOf(io.out.bits.exceptionVec.get)))))
321  io.out.bits.flushPipe.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.flushPipe.getOrElse(0.U.asTypeOf(io.out.bits.flushPipe.get)))))
322  io.out.bits.replay.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.replay.getOrElse(0.U.asTypeOf(io.out.bits.replay.get)))))
323  io.out.bits.predecodeInfo.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.preDecode.getOrElse(0.U.asTypeOf(io.out.bits.predecodeInfo.get)))))
324
325  io.csrio.foreach(exuio => funcUnits.foreach(fu => fu.io.csrio.foreach{
326    fuio =>
327      exuio <> fuio
328      fuio.exception := DelayN(exuio.exception, 2)
329  }))
330
331  io.vtype.foreach(exuio => funcUnits.foreach(fu => fu.io.vtype.foreach(fuio => exuio := fuio)))
332  io.fenceio.foreach(exuio => funcUnits.foreach(fu => fu.io.fenceio.foreach(fuio => fuio <> exuio)))
333  io.frm.foreach(exuio => funcUnits.foreach(fu => fu.io.frm.foreach(fuio => fuio <> exuio)))
334  io.vxrm.foreach(exuio => funcUnits.foreach(fu => fu.io.vxrm.foreach(fuio => fuio <> exuio)))
335  io.vlIsZero.foreach(exuio => funcUnits.foreach(fu => fu.io.vlIsZero.foreach(fuio => exuio := fuio)))
336  io.vlIsVlmax.foreach(exuio => funcUnits.foreach(fu => fu.io.vlIsVlmax.foreach(fuio => exuio := fuio)))
337
338  // debug info
339  io.out.bits.debug     := 0.U.asTypeOf(io.out.bits.debug)
340  io.out.bits.debug.isPerfCnt := funcUnits.map(_.io.csrio.map(_.isPerfCnt)).map(_.getOrElse(false.B)).reduce(_ || _)
341  io.out.bits.debugInfo := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.perfDebugInfo))
342}
343
344class DispatcherIO[T <: Data](private val gen: T, n: Int) extends Bundle {
345  val in = Flipped(DecoupledIO(gen))
346
347  val out = Vec(n, DecoupledIO(gen))
348}
349
350class Dispatcher[T <: Data](private val gen: T, n: Int, acceptCond: T => Seq[Bool])
351  (implicit p: Parameters)
352  extends Module {
353
354  val io = IO(new DispatcherIO(gen, n))
355
356  private val acceptVec: Vec[Bool] = VecInit(acceptCond(io.in.bits))
357
358  XSError(io.in.valid && PopCount(acceptVec) > 1.U, p"[ExeUnit] accept vec should no more than 1, ${Binary(acceptVec.asUInt)} ")
359  XSError(io.in.valid && PopCount(acceptVec) === 0.U, "[ExeUnit] there is a inst not dispatched to any fu")
360
361  io.out.zipWithIndex.foreach { case (out, i) =>
362    out.valid := acceptVec(i) && io.in.valid
363    out.bits := io.in.bits
364  }
365
366  io.in.ready := Cat(io.out.map(_.ready)).andR
367}
368
369class MemExeUnitIO (implicit p: Parameters) extends XSBundle {
370  val flush = Flipped(ValidIO(new Redirect()))
371  val in = Flipped(DecoupledIO(new MemExuInput()))
372  val out = DecoupledIO(new MemExuOutput())
373}
374
375class MemExeUnit(exuParams: ExeUnitParams)(implicit p: Parameters) extends XSModule {
376  val io = IO(new MemExeUnitIO)
377  val fu = exuParams.fuConfigs.head.fuGen(p, exuParams.fuConfigs.head)
378  fu.io.flush             := io.flush
379  fu.io.in.valid          := io.in.valid
380  io.in.ready             := fu.io.in.ready
381
382  fu.io.in.bits.ctrl.robIdx    := io.in.bits.uop.robIdx
383  fu.io.in.bits.ctrl.pdest     := io.in.bits.uop.pdest
384  fu.io.in.bits.ctrl.fuOpType  := io.in.bits.uop.fuOpType
385  fu.io.in.bits.data.imm       := io.in.bits.uop.imm
386  fu.io.in.bits.data.src.zip(io.in.bits.src).foreach(x => x._1 := x._2)
387  fu.io.in.bits.perfDebugInfo := io.in.bits.uop.debugInfo
388
389  io.out.valid            := fu.io.out.valid
390  fu.io.out.ready         := io.out.ready
391
392  io.out.bits             := 0.U.asTypeOf(io.out.bits) // dontCare other fields
393  io.out.bits.data        := fu.io.out.bits.res.data
394  io.out.bits.uop.robIdx  := fu.io.out.bits.ctrl.robIdx
395  io.out.bits.uop.pdest   := fu.io.out.bits.ctrl.pdest
396  io.out.bits.uop.fuType  := io.in.bits.uop.fuType
397  io.out.bits.uop.fuOpType:= io.in.bits.uop.fuOpType
398  io.out.bits.uop.sqIdx   := io.in.bits.uop.sqIdx
399  io.out.bits.uop.debugInfo := fu.io.out.bits.perfDebugInfo
400
401  io.out.bits.debug       := 0.U.asTypeOf(io.out.bits.debug)
402}