xref: /XiangShan/src/main/scala/xiangshan/backend/decode/FPDecoder.scala (revision 34f9ccd0e235272c39ecb1ab5320cef847d56a8a)
1c6d43980SLemover/***************************************************************************************
2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
4c6d43980SLemover*
5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
8c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
9c6d43980SLemover*
10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13c6d43980SLemover*
14c6d43980SLemover* See the Mulan PSL v2 for more details.
15c6d43980SLemover***************************************************************************************/
16c6d43980SLemover
172ce29ed6SLinJiaweipackage xiangshan.backend.decode
182ce29ed6SLinJiawei
198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters
202ce29ed6SLinJiaweiimport chisel3._
212ce29ed6SLinJiaweiimport chisel3.util._
222ce29ed6SLinJiaweiimport freechips.rocketchip.rocket.DecodeLogic
23361e6d51SJiuyang Liuimport freechips.rocketchip.rocket.Instructions._
2498cfe81bSxgkiriimport xiangshan.backend.decode.isa.bitfield.XSInstBitFields
25dc597826SJiawei Linimport xiangshan.backend.fu.fpu.FPU
26395c8649SZiyue-Zhangimport xiangshan.backend.fu.vector.Bundles.{VSew, VLmul}
27bdda74fdSxiaofeibao-xjtuimport xiangshan.backend.Bundles.VPUCtrlSignals
282ce29ed6SLinJiaweiimport xiangshan.{FPUCtrlSignals, XSModule}
292ce29ed6SLinJiawei
30bdda74fdSxiaofeibao-xjtuclass FPToVecDecoder(implicit p: Parameters) extends XSModule {
31bdda74fdSxiaofeibao-xjtu  val io = IO(new Bundle() {
32bdda74fdSxiaofeibao-xjtu    val instr = Input(UInt(32.W))
33bdda74fdSxiaofeibao-xjtu    val vpuCtrl = Output(new VPUCtrlSignals)
34bdda74fdSxiaofeibao-xjtu  })
35bdda74fdSxiaofeibao-xjtu
36bdda74fdSxiaofeibao-xjtu  val inst = io.instr.asTypeOf(new XSInstBitFields)
37bdda74fdSxiaofeibao-xjtu  val fpToVecInsts = Seq(
38bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FADD_D, FSUB_D,
39bdda74fdSxiaofeibao-xjtu    FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D,
40bdda74fdSxiaofeibao-xjtu    FMIN_S, FMAX_S, FMIN_D, FMAX_D,
41bdda74fdSxiaofeibao-xjtu    FMUL_S, FMUL_D,
42bdda74fdSxiaofeibao-xjtu    FDIV_S, FDIV_D, FSQRT_S, FSQRT_D,
43bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
44bdda74fdSxiaofeibao-xjtu    FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D,
45*34f9ccd0SZiyue Zhang
46*34f9ccd0SZiyue Zhang    // scalar cvt inst
47*34f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
48*34f9ccd0SZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_L_D, FCVT_LU_D, FCVT_S_D, FCVT_D_S,
49*34f9ccd0SZiyue Zhang    FMV_X_W, FMV_X_D,
50bdda74fdSxiaofeibao-xjtu  )
51bdda74fdSxiaofeibao-xjtu  val isFpToVecInst = fpToVecInsts.map(io.instr === _).reduce(_ || _)
52bdda74fdSxiaofeibao-xjtu  val isFP32Instrs = Seq(
53bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FEQ_S, FLT_S, FLE_S, FMIN_S, FMAX_S,
54bdda74fdSxiaofeibao-xjtu    FMUL_S, FDIV_S, FSQRT_S,
55bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S,
56bdda74fdSxiaofeibao-xjtu    FCLASS_S, FSGNJ_S, FSGNJX_S, FSGNJN_S,
57bdda74fdSxiaofeibao-xjtu  )
58bdda74fdSxiaofeibao-xjtu  val isFP32Instr = isFP32Instrs.map(io.instr === _).reduce(_ || _)
59bdda74fdSxiaofeibao-xjtu  val isFP64Instrs = Seq(
60bdda74fdSxiaofeibao-xjtu    FADD_D, FSUB_D, FEQ_D, FLT_D, FLE_D, FMIN_D, FMAX_D,
61bdda74fdSxiaofeibao-xjtu    FMUL_D, FDIV_D, FSQRT_D,
62bdda74fdSxiaofeibao-xjtu    FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
63bdda74fdSxiaofeibao-xjtu    FCLASS_D, FSGNJ_D, FSGNJX_D, FSGNJN_D,
64bdda74fdSxiaofeibao-xjtu  )
65bdda74fdSxiaofeibao-xjtu  val isFP64Instr = isFP64Instrs.map(io.instr === _).reduce(_ || _)
66*34f9ccd0SZiyue Zhang  // scalar cvt inst
67*34f9ccd0SZiyue Zhang  val isSew2Cvts = Seq(
68*34f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
69*34f9ccd0SZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_S_D, FCVT_D_S,
70*34f9ccd0SZiyue Zhang    FMV_X_W,
71*34f9ccd0SZiyue Zhang  )
72*34f9ccd0SZiyue Zhang  val isSew2Cvt = isSew2Cvts.map(io.instr === _).reduce(_ || _)
73*34f9ccd0SZiyue Zhang  val isLmulMf4Cvts = Seq(
74*34f9ccd0SZiyue Zhang    FCVT_W_S, FCVT_WU_S,
75*34f9ccd0SZiyue Zhang    FMV_X_W,
76*34f9ccd0SZiyue Zhang  )
77*34f9ccd0SZiyue Zhang  val isLmulMf4Cvt = isLmulMf4Cvts.map(io.instr === _).reduce(_ || _)
78bdda74fdSxiaofeibao-xjtu  val needReverseInsts = fpToVecInsts
79bdda74fdSxiaofeibao-xjtu  val needReverseInst = needReverseInsts.map(_ === inst.ALL).reduce(_ || _)
80bdda74fdSxiaofeibao-xjtu  io.vpuCtrl := 0.U.asTypeOf(io.vpuCtrl)
81bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFpToVecInst := isFpToVecInst
82bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP32Instr   := isFP32Instr
83bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP64Instr   := isFP64Instr
84bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vill  := false.B
85bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vma   := true.B
86bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vta   := true.B
87*34f9ccd0SZiyue Zhang  io.vpuCtrl.vsew  := Mux(isFP32Instr || isSew2Cvt, VSew.e32, VSew.e64)
88*34f9ccd0SZiyue Zhang  io.vpuCtrl.vlmul := Mux(isFP32Instr || isLmulMf4Cvt, VLmul.mf4, VLmul.mf2)
89bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vm    := inst.VM
90bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.nf    := inst.NF
91d9355d3aSZiyue-Zhang  io.vpuCtrl.veew := inst.WIDTH
92bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isReverse := needReverseInst
93bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isExt     := false.B
94bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isNarrow  := false.B
95bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isDstMask := false.B
9630fcc710SZiyue Zhang  io.vpuCtrl.isOpMask  := false.B
97bdda74fdSxiaofeibao-xjtu}
98bdda74fdSxiaofeibao-xjtu
99bdda74fdSxiaofeibao-xjtu
1002225d46eSJiawei Linclass FPDecoder(implicit p: Parameters) extends XSModule{
1012ce29ed6SLinJiawei  val io = IO(new Bundle() {
1022ce29ed6SLinJiawei    val instr = Input(UInt(32.W))
1032ce29ed6SLinJiawei    val fpCtrl = Output(new FPUCtrlSignals)
1042ce29ed6SLinJiawei  })
1052ce29ed6SLinJiawei
10698cfe81bSxgkiri  private val inst: XSInstBitFields = io.instr.asTypeOf(new XSInstBitFields)
10798cfe81bSxgkiri
1082ce29ed6SLinJiawei  def X = BitPat("b?")
1092ce29ed6SLinJiawei  def N = BitPat("b0")
1102ce29ed6SLinJiawei  def Y = BitPat("b1")
111dc597826SJiawei Lin  val s = BitPat(FPU.S)
112dc597826SJiawei Lin  val d = BitPat(FPU.D)
113dc597826SJiawei Lin  val i = BitPat(FPU.D)
1142ce29ed6SLinJiawei
115fe73f692SLinJiawei  val default = List(X,X,X,N,N,N,X,X,X)
1162ce29ed6SLinJiawei
1172ce29ed6SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
1182ce29ed6SLinJiawei  val single: Array[(BitPat, List[BitPat])] = Array(
119dc597826SJiawei Lin    // IntToFP
120dc597826SJiawei Lin    FMV_W_X  -> List(N,i,s,Y,N,Y,N,N,N),
121dc597826SJiawei Lin    FCVT_S_W -> List(N,i,s,Y,Y,Y,N,N,Y),
122dc597826SJiawei Lin    FCVT_S_WU-> List(N,i,s,Y,Y,Y,N,N,Y),
123dc597826SJiawei Lin    FCVT_S_L -> List(N,i,s,Y,Y,Y,N,N,Y),
124dc597826SJiawei Lin    FCVT_S_LU-> List(N,i,s,Y,Y,Y,N,N,Y),
125dc597826SJiawei Lin    // FPToInt
126dc597826SJiawei Lin    FMV_X_W  -> List(N,d,i,N,N,N,N,N,N), // dont box result of fmv.fp.int
1278cc1ac81SLinJiawei    FCLASS_S -> List(N,s,i,N,N,N,N,N,N),
1288cc1ac81SLinJiawei    FCVT_W_S -> List(N,s,i,N,Y,N,N,N,Y),
1298cc1ac81SLinJiawei    FCVT_WU_S-> List(N,s,i,N,Y,N,N,N,Y),
1308cc1ac81SLinJiawei    FCVT_L_S -> List(N,s,i,N,Y,N,N,N,Y),
1318cc1ac81SLinJiawei    FCVT_LU_S-> List(N,s,i,N,Y,N,N,N,Y),
1328cc1ac81SLinJiawei    FEQ_S    -> List(N,s,i,N,Y,N,N,N,N),
1338cc1ac81SLinJiawei    FLT_S    -> List(N,s,i,N,Y,N,N,N,N),
1348cc1ac81SLinJiawei    FLE_S    -> List(N,s,i,N,Y,N,N,N,N),
135dc597826SJiawei Lin    // FPToFP
1362ce29ed6SLinJiawei    FSGNJ_S  -> List(N,s,s,N,N,Y,N,N,N),
1372ce29ed6SLinJiawei    FSGNJN_S -> List(N,s,s,N,N,Y,N,N,N),
1382ce29ed6SLinJiawei    FSGNJX_S -> List(N,s,s,N,N,Y,N,N,N),
1392ce29ed6SLinJiawei    FMIN_S   -> List(N,s,s,N,Y,Y,N,N,N),
1402ce29ed6SLinJiawei    FMAX_S   -> List(N,s,s,N,Y,Y,N,N,N),
1412ce29ed6SLinJiawei    FADD_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1422ce29ed6SLinJiawei    FSUB_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1432ce29ed6SLinJiawei    FMUL_S   -> List(N,s,s,N,Y,Y,N,N,N),
1442ce29ed6SLinJiawei    FMADD_S  -> List(N,s,s,N,Y,Y,N,N,N),
1452ce29ed6SLinJiawei    FMSUB_S  -> List(N,s,s,N,Y,Y,N,N,N),
1462ce29ed6SLinJiawei    FNMADD_S -> List(N,s,s,N,Y,Y,N,N,N),
1472ce29ed6SLinJiawei    FNMSUB_S -> List(N,s,s,N,Y,Y,N,N,N),
1482ce29ed6SLinJiawei    FDIV_S   -> List(N,s,s,N,Y,Y,Y,N,N),
1492ce29ed6SLinJiawei    FSQRT_S  -> List(N,s,s,N,Y,Y,N,Y,N)
1502ce29ed6SLinJiawei  )
1512ce29ed6SLinJiawei
152e50fb2d7SLinJiawei
153e50fb2d7SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
154e50fb2d7SLinJiawei  val double: Array[(BitPat, List[BitPat])] = Array(
155dc597826SJiawei Lin    FMV_D_X  -> List(N,i,d,Y,N,Y,N,N,N),
156dc597826SJiawei Lin    FCVT_D_W -> List(N,i,d,Y,Y,Y,N,N,Y),
157dc597826SJiawei Lin    FCVT_D_WU-> List(N,i,d,Y,Y,Y,N,N,Y),
158dc597826SJiawei Lin    FCVT_D_L -> List(N,i,d,Y,Y,Y,N,N,Y),
159dc597826SJiawei Lin    FCVT_D_LU-> List(N,i,d,Y,Y,Y,N,N,Y),
1608cc1ac81SLinJiawei    FMV_X_D  -> List(N,d,i,N,N,N,N,N,N),
1618cc1ac81SLinJiawei    FCLASS_D -> List(N,d,i,N,N,N,N,N,N),
1628cc1ac81SLinJiawei    FCVT_W_D -> List(N,d,i,N,Y,N,N,N,Y),
1638cc1ac81SLinJiawei    FCVT_WU_D-> List(N,d,i,N,Y,N,N,N,Y),
1648cc1ac81SLinJiawei    FCVT_L_D -> List(N,d,i,N,Y,N,N,N,Y),
1658cc1ac81SLinJiawei    FCVT_LU_D-> List(N,d,i,N,Y,N,N,N,Y),
166e50fb2d7SLinJiawei    FCVT_S_D -> List(N,d,s,N,Y,Y,N,N,Y),
167e50fb2d7SLinJiawei    FCVT_D_S -> List(N,s,d,N,Y,Y,N,N,Y),
1688cc1ac81SLinJiawei    FEQ_D    -> List(N,d,i,N,Y,N,N,N,N),
1698cc1ac81SLinJiawei    FLT_D    -> List(N,d,i,N,Y,N,N,N,N),
1708cc1ac81SLinJiawei    FLE_D    -> List(N,d,i,N,Y,N,N,N,N),
171e50fb2d7SLinJiawei    FSGNJ_D  -> List(N,d,d,N,N,Y,N,N,N),
172e50fb2d7SLinJiawei    FSGNJN_D -> List(N,d,d,N,N,Y,N,N,N),
173e50fb2d7SLinJiawei    FSGNJX_D -> List(N,d,d,N,N,Y,N,N,N),
174e50fb2d7SLinJiawei    FMIN_D   -> List(N,d,d,N,Y,Y,N,N,N),
175e50fb2d7SLinJiawei    FMAX_D   -> List(N,d,d,N,Y,Y,N,N,N),
176e50fb2d7SLinJiawei    FADD_D   -> List(Y,d,d,N,Y,Y,N,N,N),
177e50fb2d7SLinJiawei    FSUB_D   -> List(Y,d,d,N,Y,Y,N,N,N),
178e50fb2d7SLinJiawei    FMUL_D   -> List(N,d,d,N,Y,Y,N,N,N),
179e50fb2d7SLinJiawei    FMADD_D  -> List(N,d,d,N,Y,Y,N,N,N),
180e50fb2d7SLinJiawei    FMSUB_D  -> List(N,d,d,N,Y,Y,N,N,N),
181e50fb2d7SLinJiawei    FNMADD_D -> List(N,d,d,N,Y,Y,N,N,N),
182e50fb2d7SLinJiawei    FNMSUB_D -> List(N,d,d,N,Y,Y,N,N,N),
183e50fb2d7SLinJiawei    FDIV_D   -> List(N,d,d,N,Y,Y,Y,N,N),
184e50fb2d7SLinJiawei    FSQRT_D  -> List(N,d,d,N,Y,Y,N,Y,N)
185e50fb2d7SLinJiawei  )
186e50fb2d7SLinJiawei
187e50fb2d7SLinJiawei  val table = single ++ double
1882ce29ed6SLinJiawei
1892ce29ed6SLinJiawei  val decoder = DecodeLogic(io.instr, default, table)
1902ce29ed6SLinJiawei
1912ce29ed6SLinJiawei  val ctrl = io.fpCtrl
1922ce29ed6SLinJiawei  val sigs = Seq(
1932ce29ed6SLinJiawei    ctrl.isAddSub, ctrl.typeTagIn, ctrl.typeTagOut,
1942ce29ed6SLinJiawei    ctrl.fromInt, ctrl.wflags, ctrl.fpWen,
1952ce29ed6SLinJiawei    ctrl.div, ctrl.sqrt, ctrl.fcvt
1962ce29ed6SLinJiawei  )
1972ce29ed6SLinJiawei  sigs.zip(decoder).foreach({case (s, d) => s := d})
19898cfe81bSxgkiri  ctrl.typ := inst.TYP
19998cfe81bSxgkiri  ctrl.fmt := inst.FMT
20098cfe81bSxgkiri  ctrl.rm := inst.RM
2012ce29ed6SLinJiawei
2022ce29ed6SLinJiawei  val fmaTable: Array[(BitPat, List[BitPat])] = Array(
203e50fb2d7SLinJiawei    FADD_S  -> List(BitPat("b00"),N),
204e50fb2d7SLinJiawei    FADD_D  -> List(BitPat("b00"),N),
205e50fb2d7SLinJiawei    FSUB_S  -> List(BitPat("b01"),N),
206e50fb2d7SLinJiawei    FSUB_D  -> List(BitPat("b01"),N),
207e50fb2d7SLinJiawei    FMUL_S  -> List(BitPat("b00"),N),
208e50fb2d7SLinJiawei    FMUL_D  -> List(BitPat("b00"),N),
209e50fb2d7SLinJiawei    FMADD_S -> List(BitPat("b00"),Y),
210e50fb2d7SLinJiawei    FMADD_D -> List(BitPat("b00"),Y),
211e50fb2d7SLinJiawei    FMSUB_S -> List(BitPat("b01"),Y),
212e50fb2d7SLinJiawei    FMSUB_D -> List(BitPat("b01"),Y),
213e50fb2d7SLinJiawei    FNMADD_S-> List(BitPat("b11"),Y),
214e50fb2d7SLinJiawei    FNMADD_D-> List(BitPat("b11"),Y),
215e50fb2d7SLinJiawei    FNMSUB_S-> List(BitPat("b10"),Y),
216e50fb2d7SLinJiawei    FNMSUB_D-> List(BitPat("b10"),Y)
2172ce29ed6SLinJiawei  )
218e50fb2d7SLinJiawei  val fmaDefault = List(BitPat("b??"), N)
219e50fb2d7SLinJiawei  Seq(ctrl.fmaCmd, ctrl.ren3).zip(
2202ce29ed6SLinJiawei    DecodeLogic(io.instr, fmaDefault, fmaTable)
2212ce29ed6SLinJiawei  ).foreach({
2222ce29ed6SLinJiawei    case (s, d) => s := d
2232ce29ed6SLinJiawei  })
2242ce29ed6SLinJiawei}
225