xref: /XiangShan/src/main/scala/xiangshan/backend/decode/FPDecoder.scala (revision b189aafaec05caa2f6081d616f1f0daab1fd2ad8)
1c6d43980SLemover/***************************************************************************************
2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
4c6d43980SLemover*
5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
8c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
9c6d43980SLemover*
10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13c6d43980SLemover*
14c6d43980SLemover* See the Mulan PSL v2 for more details.
15c6d43980SLemover***************************************************************************************/
16c6d43980SLemover
172ce29ed6SLinJiaweipackage xiangshan.backend.decode
182ce29ed6SLinJiawei
198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters
202ce29ed6SLinJiaweiimport chisel3._
212ce29ed6SLinJiaweiimport chisel3.util._
222ce29ed6SLinJiaweiimport freechips.rocketchip.rocket.DecodeLogic
23361e6d51SJiuyang Liuimport freechips.rocketchip.rocket.Instructions._
2498cfe81bSxgkiriimport xiangshan.backend.decode.isa.bitfield.XSInstBitFields
25dc597826SJiawei Linimport xiangshan.backend.fu.fpu.FPU
26395c8649SZiyue-Zhangimport xiangshan.backend.fu.vector.Bundles.{VSew, VLmul}
27bdda74fdSxiaofeibao-xjtuimport xiangshan.backend.Bundles.VPUCtrlSignals
282ce29ed6SLinJiaweiimport xiangshan.{FPUCtrlSignals, XSModule}
292ce29ed6SLinJiawei
30bdda74fdSxiaofeibao-xjtuclass FPToVecDecoder(implicit p: Parameters) extends XSModule {
31bdda74fdSxiaofeibao-xjtu  val io = IO(new Bundle() {
32bdda74fdSxiaofeibao-xjtu    val instr = Input(UInt(32.W))
33bdda74fdSxiaofeibao-xjtu    val vpuCtrl = Output(new VPUCtrlSignals)
34bdda74fdSxiaofeibao-xjtu  })
35bdda74fdSxiaofeibao-xjtu
36bdda74fdSxiaofeibao-xjtu  val inst = io.instr.asTypeOf(new XSInstBitFields)
37bdda74fdSxiaofeibao-xjtu  val fpToVecInsts = Seq(
38bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FADD_D, FSUB_D,
39bdda74fdSxiaofeibao-xjtu    FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D,
40bdda74fdSxiaofeibao-xjtu    FMIN_S, FMAX_S, FMIN_D, FMAX_D,
41bdda74fdSxiaofeibao-xjtu    FMUL_S, FMUL_D,
42bdda74fdSxiaofeibao-xjtu    FDIV_S, FDIV_D, FSQRT_S, FSQRT_D,
43bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
44bdda74fdSxiaofeibao-xjtu    FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D,
4534f9ccd0SZiyue Zhang
4634f9ccd0SZiyue Zhang    // scalar cvt inst
4734f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
4834f9ccd0SZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_L_D, FCVT_LU_D, FCVT_S_D, FCVT_D_S,
49*b189aafaSzmx    FCVT_S_H, FCVT_H_S, FCVT_H_D, FCVT_D_H,
50*b189aafaSzmx    FMV_X_W, FMV_X_D, FMV_X_H,
51bdda74fdSxiaofeibao-xjtu  )
52bdda74fdSxiaofeibao-xjtu  val isFpToVecInst = fpToVecInsts.map(io.instr === _).reduce(_ || _)
53bdda74fdSxiaofeibao-xjtu  val isFP32Instrs = Seq(
54bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FEQ_S, FLT_S, FLE_S, FMIN_S, FMAX_S,
55bdda74fdSxiaofeibao-xjtu    FMUL_S, FDIV_S, FSQRT_S,
56bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S,
57bdda74fdSxiaofeibao-xjtu    FCLASS_S, FSGNJ_S, FSGNJX_S, FSGNJN_S,
58bdda74fdSxiaofeibao-xjtu  )
59bdda74fdSxiaofeibao-xjtu  val isFP32Instr = isFP32Instrs.map(io.instr === _).reduce(_ || _)
60bdda74fdSxiaofeibao-xjtu  val isFP64Instrs = Seq(
61bdda74fdSxiaofeibao-xjtu    FADD_D, FSUB_D, FEQ_D, FLT_D, FLE_D, FMIN_D, FMAX_D,
62bdda74fdSxiaofeibao-xjtu    FMUL_D, FDIV_D, FSQRT_D,
63bdda74fdSxiaofeibao-xjtu    FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
64bdda74fdSxiaofeibao-xjtu    FCLASS_D, FSGNJ_D, FSGNJX_D, FSGNJN_D,
65bdda74fdSxiaofeibao-xjtu  )
66bdda74fdSxiaofeibao-xjtu  val isFP64Instr = isFP64Instrs.map(io.instr === _).reduce(_ || _)
6734f9ccd0SZiyue Zhang  // scalar cvt inst
6834f9ccd0SZiyue Zhang  val isSew2Cvts = Seq(
6934f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
7034f9ccd0SZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_S_D, FCVT_D_S,
7134f9ccd0SZiyue Zhang    FMV_X_W,
7234f9ccd0SZiyue Zhang  )
73*b189aafaSzmx  /*
74*b189aafaSzmx  The optype for FCVT_D_H and FCVT_H_D is the same,
75*b189aafaSzmx  so the two instructions are distinguished by sew.
76*b189aafaSzmx  FCVT_H_D:VSew.e64
77*b189aafaSzmx  FCVT_D_H:VSew.e16
78*b189aafaSzmx   */
79*b189aafaSzmx  val isSew2Cvth = Seq(
80*b189aafaSzmx    FCVT_S_H, FCVT_H_S, FCVT_D_H,
81*b189aafaSzmx    FMV_X_H,
82*b189aafaSzmx  )
83*b189aafaSzmx  val isSew2Cvt32 = isSew2Cvts.map(io.instr === _).reduce(_ || _)
84*b189aafaSzmx  val isSew2Cvt16 = isSew2Cvth.map(io.instr === _).reduce(_ || _)
8534f9ccd0SZiyue Zhang  val isLmulMf4Cvts = Seq(
8634f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S,
8734f9ccd0SZiyue Zhang    FMV_X_W,
8834f9ccd0SZiyue Zhang  )
8934f9ccd0SZiyue Zhang  val isLmulMf4Cvt = isLmulMf4Cvts.map(io.instr === _).reduce(_ || _)
904b136a73Ssinsanction  val needReverseInsts = Seq(
914b136a73Ssinsanction    FADD_S, FSUB_S, FADD_D, FSUB_D,
924b136a73Ssinsanction    FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D,
934b136a73Ssinsanction    FMIN_S, FMAX_S, FMIN_D, FMAX_D,
944b136a73Ssinsanction    FMUL_S, FMUL_D,
954b136a73Ssinsanction    FDIV_S, FDIV_D, FSQRT_S, FSQRT_D,
964b136a73Ssinsanction    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
974b136a73Ssinsanction    FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D,
984b136a73Ssinsanction  )
99bdda74fdSxiaofeibao-xjtu  val needReverseInst = needReverseInsts.map(_ === inst.ALL).reduce(_ || _)
100bdda74fdSxiaofeibao-xjtu  io.vpuCtrl := 0.U.asTypeOf(io.vpuCtrl)
101bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFpToVecInst := isFpToVecInst
102bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP32Instr   := isFP32Instr
103bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP64Instr   := isFP64Instr
104bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vill  := false.B
105bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vma   := true.B
106bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vta   := true.B
107*b189aafaSzmx  io.vpuCtrl.vsew  := Mux(isFP32Instr || isSew2Cvt32, VSew.e32, Mux(isSew2Cvt16, VSew.e16, VSew.e64))
10834f9ccd0SZiyue Zhang  io.vpuCtrl.vlmul := Mux(isFP32Instr || isLmulMf4Cvt, VLmul.mf4, VLmul.mf2)
109bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vm    := inst.VM
110bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.nf    := inst.NF
111d9355d3aSZiyue-Zhang  io.vpuCtrl.veew := inst.WIDTH
112bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isReverse := needReverseInst
113bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isExt     := false.B
114bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isNarrow  := false.B
115bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isDstMask := false.B
11630fcc710SZiyue Zhang  io.vpuCtrl.isOpMask  := false.B
117b6279fc6SZiyue Zhang  io.vpuCtrl.isDependOldvd := false.B
118d8ceb649SZiyue Zhang  io.vpuCtrl.isWritePartVd := false.B
119bdda74fdSxiaofeibao-xjtu}
120bdda74fdSxiaofeibao-xjtu
121bdda74fdSxiaofeibao-xjtu
1222225d46eSJiawei Linclass FPDecoder(implicit p: Parameters) extends XSModule{
1232ce29ed6SLinJiawei  val io = IO(new Bundle() {
1242ce29ed6SLinJiawei    val instr = Input(UInt(32.W))
1252ce29ed6SLinJiawei    val fpCtrl = Output(new FPUCtrlSignals)
1262ce29ed6SLinJiawei  })
1272ce29ed6SLinJiawei
12898cfe81bSxgkiri  private val inst: XSInstBitFields = io.instr.asTypeOf(new XSInstBitFields)
12998cfe81bSxgkiri
1302ce29ed6SLinJiawei  def X = BitPat("b?")
1312ce29ed6SLinJiawei  def N = BitPat("b0")
1322ce29ed6SLinJiawei  def Y = BitPat("b1")
133*b189aafaSzmx  val s = BitPat(FPU.S(0))
134*b189aafaSzmx  val d = BitPat(FPU.D(0))
135*b189aafaSzmx  val i = BitPat(FPU.D(0))
1362ce29ed6SLinJiawei
137fe73f692SLinJiawei  val default = List(X,X,X,N,N,N,X,X,X)
1382ce29ed6SLinJiawei
1392ce29ed6SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
1402ce29ed6SLinJiawei  val single: Array[(BitPat, List[BitPat])] = Array(
141dc597826SJiawei Lin    // IntToFP
142dc597826SJiawei Lin    FMV_W_X  -> List(N,i,s,Y,N,Y,N,N,N),
143dc597826SJiawei Lin    FCVT_S_W -> List(N,i,s,Y,Y,Y,N,N,Y),
144dc597826SJiawei Lin    FCVT_S_WU-> List(N,i,s,Y,Y,Y,N,N,Y),
145dc597826SJiawei Lin    FCVT_S_L -> List(N,i,s,Y,Y,Y,N,N,Y),
146dc597826SJiawei Lin    FCVT_S_LU-> List(N,i,s,Y,Y,Y,N,N,Y),
147dc597826SJiawei Lin    // FPToInt
148dc597826SJiawei Lin    FMV_X_W  -> List(N,d,i,N,N,N,N,N,N), // dont box result of fmv.fp.int
1498cc1ac81SLinJiawei    FCLASS_S -> List(N,s,i,N,N,N,N,N,N),
1508cc1ac81SLinJiawei    FCVT_W_S -> List(N,s,i,N,Y,N,N,N,Y),
1518cc1ac81SLinJiawei    FCVT_WU_S-> List(N,s,i,N,Y,N,N,N,Y),
1528cc1ac81SLinJiawei    FCVT_L_S -> List(N,s,i,N,Y,N,N,N,Y),
1538cc1ac81SLinJiawei    FCVT_LU_S-> List(N,s,i,N,Y,N,N,N,Y),
1548cc1ac81SLinJiawei    FEQ_S    -> List(N,s,i,N,Y,N,N,N,N),
1558cc1ac81SLinJiawei    FLT_S    -> List(N,s,i,N,Y,N,N,N,N),
1568cc1ac81SLinJiawei    FLE_S    -> List(N,s,i,N,Y,N,N,N,N),
157dc597826SJiawei Lin    // FPToFP
1582ce29ed6SLinJiawei    FSGNJ_S  -> List(N,s,s,N,N,Y,N,N,N),
1592ce29ed6SLinJiawei    FSGNJN_S -> List(N,s,s,N,N,Y,N,N,N),
1602ce29ed6SLinJiawei    FSGNJX_S -> List(N,s,s,N,N,Y,N,N,N),
1612ce29ed6SLinJiawei    FMIN_S   -> List(N,s,s,N,Y,Y,N,N,N),
1622ce29ed6SLinJiawei    FMAX_S   -> List(N,s,s,N,Y,Y,N,N,N),
1632ce29ed6SLinJiawei    FADD_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1642ce29ed6SLinJiawei    FSUB_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1652ce29ed6SLinJiawei    FMUL_S   -> List(N,s,s,N,Y,Y,N,N,N),
1662ce29ed6SLinJiawei    FMADD_S  -> List(N,s,s,N,Y,Y,N,N,N),
1672ce29ed6SLinJiawei    FMSUB_S  -> List(N,s,s,N,Y,Y,N,N,N),
1682ce29ed6SLinJiawei    FNMADD_S -> List(N,s,s,N,Y,Y,N,N,N),
1692ce29ed6SLinJiawei    FNMSUB_S -> List(N,s,s,N,Y,Y,N,N,N),
1702ce29ed6SLinJiawei    FDIV_S   -> List(N,s,s,N,Y,Y,Y,N,N),
1712ce29ed6SLinJiawei    FSQRT_S  -> List(N,s,s,N,Y,Y,N,Y,N)
1722ce29ed6SLinJiawei  )
1732ce29ed6SLinJiawei
174e50fb2d7SLinJiawei
175e50fb2d7SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
176e50fb2d7SLinJiawei  val double: Array[(BitPat, List[BitPat])] = Array(
177dc597826SJiawei Lin    FMV_D_X  -> List(N,i,d,Y,N,Y,N,N,N),
178dc597826SJiawei Lin    FCVT_D_W -> List(N,i,d,Y,Y,Y,N,N,Y),
179dc597826SJiawei Lin    FCVT_D_WU-> List(N,i,d,Y,Y,Y,N,N,Y),
180dc597826SJiawei Lin    FCVT_D_L -> List(N,i,d,Y,Y,Y,N,N,Y),
181dc597826SJiawei Lin    FCVT_D_LU-> List(N,i,d,Y,Y,Y,N,N,Y),
1828cc1ac81SLinJiawei    FMV_X_D  -> List(N,d,i,N,N,N,N,N,N),
1838cc1ac81SLinJiawei    FCLASS_D -> List(N,d,i,N,N,N,N,N,N),
1848cc1ac81SLinJiawei    FCVT_W_D -> List(N,d,i,N,Y,N,N,N,Y),
1858cc1ac81SLinJiawei    FCVT_WU_D-> List(N,d,i,N,Y,N,N,N,Y),
1868cc1ac81SLinJiawei    FCVT_L_D -> List(N,d,i,N,Y,N,N,N,Y),
1878cc1ac81SLinJiawei    FCVT_LU_D-> List(N,d,i,N,Y,N,N,N,Y),
188e50fb2d7SLinJiawei    FCVT_S_D -> List(N,d,s,N,Y,Y,N,N,Y),
189e50fb2d7SLinJiawei    FCVT_D_S -> List(N,s,d,N,Y,Y,N,N,Y),
1908cc1ac81SLinJiawei    FEQ_D    -> List(N,d,i,N,Y,N,N,N,N),
1918cc1ac81SLinJiawei    FLT_D    -> List(N,d,i,N,Y,N,N,N,N),
1928cc1ac81SLinJiawei    FLE_D    -> List(N,d,i,N,Y,N,N,N,N),
193e50fb2d7SLinJiawei    FSGNJ_D  -> List(N,d,d,N,N,Y,N,N,N),
194e50fb2d7SLinJiawei    FSGNJN_D -> List(N,d,d,N,N,Y,N,N,N),
195e50fb2d7SLinJiawei    FSGNJX_D -> List(N,d,d,N,N,Y,N,N,N),
196e50fb2d7SLinJiawei    FMIN_D   -> List(N,d,d,N,Y,Y,N,N,N),
197e50fb2d7SLinJiawei    FMAX_D   -> List(N,d,d,N,Y,Y,N,N,N),
198e50fb2d7SLinJiawei    FADD_D   -> List(Y,d,d,N,Y,Y,N,N,N),
199e50fb2d7SLinJiawei    FSUB_D   -> List(Y,d,d,N,Y,Y,N,N,N),
200e50fb2d7SLinJiawei    FMUL_D   -> List(N,d,d,N,Y,Y,N,N,N),
201e50fb2d7SLinJiawei    FMADD_D  -> List(N,d,d,N,Y,Y,N,N,N),
202e50fb2d7SLinJiawei    FMSUB_D  -> List(N,d,d,N,Y,Y,N,N,N),
203e50fb2d7SLinJiawei    FNMADD_D -> List(N,d,d,N,Y,Y,N,N,N),
204e50fb2d7SLinJiawei    FNMSUB_D -> List(N,d,d,N,Y,Y,N,N,N),
205e50fb2d7SLinJiawei    FDIV_D   -> List(N,d,d,N,Y,Y,Y,N,N),
206e50fb2d7SLinJiawei    FSQRT_D  -> List(N,d,d,N,Y,Y,N,Y,N)
207e50fb2d7SLinJiawei  )
208e50fb2d7SLinJiawei
209e50fb2d7SLinJiawei  val table = single ++ double
2102ce29ed6SLinJiawei
2112ce29ed6SLinJiawei  val decoder = DecodeLogic(io.instr, default, table)
2122ce29ed6SLinJiawei
2132ce29ed6SLinJiawei  val ctrl = io.fpCtrl
2142ce29ed6SLinJiawei  val sigs = Seq(
2152ce29ed6SLinJiawei    ctrl.isAddSub, ctrl.typeTagIn, ctrl.typeTagOut,
2162ce29ed6SLinJiawei    ctrl.fromInt, ctrl.wflags, ctrl.fpWen,
2172ce29ed6SLinJiawei    ctrl.div, ctrl.sqrt, ctrl.fcvt
2182ce29ed6SLinJiawei  )
2192ce29ed6SLinJiawei  sigs.zip(decoder).foreach({case (s, d) => s := d})
22098cfe81bSxgkiri  ctrl.typ := inst.TYP
22198cfe81bSxgkiri  ctrl.fmt := inst.FMT
22298cfe81bSxgkiri  ctrl.rm := inst.RM
2232ce29ed6SLinJiawei
2242ce29ed6SLinJiawei  val fmaTable: Array[(BitPat, List[BitPat])] = Array(
225e50fb2d7SLinJiawei    FADD_S  -> List(BitPat("b00"),N),
226e50fb2d7SLinJiawei    FADD_D  -> List(BitPat("b00"),N),
227e50fb2d7SLinJiawei    FSUB_S  -> List(BitPat("b01"),N),
228e50fb2d7SLinJiawei    FSUB_D  -> List(BitPat("b01"),N),
229e50fb2d7SLinJiawei    FMUL_S  -> List(BitPat("b00"),N),
230e50fb2d7SLinJiawei    FMUL_D  -> List(BitPat("b00"),N),
231e50fb2d7SLinJiawei    FMADD_S -> List(BitPat("b00"),Y),
232e50fb2d7SLinJiawei    FMADD_D -> List(BitPat("b00"),Y),
233e50fb2d7SLinJiawei    FMSUB_S -> List(BitPat("b01"),Y),
234e50fb2d7SLinJiawei    FMSUB_D -> List(BitPat("b01"),Y),
235e50fb2d7SLinJiawei    FNMADD_S-> List(BitPat("b11"),Y),
236e50fb2d7SLinJiawei    FNMADD_D-> List(BitPat("b11"),Y),
237e50fb2d7SLinJiawei    FNMSUB_S-> List(BitPat("b10"),Y),
238e50fb2d7SLinJiawei    FNMSUB_D-> List(BitPat("b10"),Y)
2392ce29ed6SLinJiawei  )
240e50fb2d7SLinJiawei  val fmaDefault = List(BitPat("b??"), N)
241e50fb2d7SLinJiawei  Seq(ctrl.fmaCmd, ctrl.ren3).zip(
2422ce29ed6SLinJiawei    DecodeLogic(io.instr, fmaDefault, fmaTable)
2432ce29ed6SLinJiawei  ).foreach({
2442ce29ed6SLinJiawei    case (s, d) => s := d
2452ce29ed6SLinJiawei  })
2462ce29ed6SLinJiawei}
247