xref: /XiangShan/src/main/scala/xiangshan/backend/decode/FPDecoder.scala (revision 4b136a73e676909c30db26a961579ca6b925f7f8)
1c6d43980SLemover/***************************************************************************************
2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
4c6d43980SLemover*
5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
8c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
9c6d43980SLemover*
10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13c6d43980SLemover*
14c6d43980SLemover* See the Mulan PSL v2 for more details.
15c6d43980SLemover***************************************************************************************/
16c6d43980SLemover
172ce29ed6SLinJiaweipackage xiangshan.backend.decode
182ce29ed6SLinJiawei
198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters
202ce29ed6SLinJiaweiimport chisel3._
212ce29ed6SLinJiaweiimport chisel3.util._
222ce29ed6SLinJiaweiimport freechips.rocketchip.rocket.DecodeLogic
23361e6d51SJiuyang Liuimport freechips.rocketchip.rocket.Instructions._
2498cfe81bSxgkiriimport xiangshan.backend.decode.isa.bitfield.XSInstBitFields
25dc597826SJiawei Linimport xiangshan.backend.fu.fpu.FPU
26395c8649SZiyue-Zhangimport xiangshan.backend.fu.vector.Bundles.{VSew, VLmul}
27bdda74fdSxiaofeibao-xjtuimport xiangshan.backend.Bundles.VPUCtrlSignals
282ce29ed6SLinJiaweiimport xiangshan.{FPUCtrlSignals, XSModule}
292ce29ed6SLinJiawei
30bdda74fdSxiaofeibao-xjtuclass FPToVecDecoder(implicit p: Parameters) extends XSModule {
31bdda74fdSxiaofeibao-xjtu  val io = IO(new Bundle() {
32bdda74fdSxiaofeibao-xjtu    val instr = Input(UInt(32.W))
33bdda74fdSxiaofeibao-xjtu    val vpuCtrl = Output(new VPUCtrlSignals)
34bdda74fdSxiaofeibao-xjtu  })
35bdda74fdSxiaofeibao-xjtu
36bdda74fdSxiaofeibao-xjtu  val inst = io.instr.asTypeOf(new XSInstBitFields)
37bdda74fdSxiaofeibao-xjtu  val fpToVecInsts = Seq(
38bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FADD_D, FSUB_D,
39bdda74fdSxiaofeibao-xjtu    FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D,
40bdda74fdSxiaofeibao-xjtu    FMIN_S, FMAX_S, FMIN_D, FMAX_D,
41bdda74fdSxiaofeibao-xjtu    FMUL_S, FMUL_D,
42bdda74fdSxiaofeibao-xjtu    FDIV_S, FDIV_D, FSQRT_S, FSQRT_D,
43bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
44bdda74fdSxiaofeibao-xjtu    FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D,
45572278faSZiyue Zhang
46572278faSZiyue Zhang    // scalar cvt inst
47572278faSZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
48572278faSZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_L_D, FCVT_LU_D, FCVT_S_D, FCVT_D_S,
49572278faSZiyue Zhang    FMV_X_W, FMV_X_D,
50bdda74fdSxiaofeibao-xjtu  )
51bdda74fdSxiaofeibao-xjtu  val isFpToVecInst = fpToVecInsts.map(io.instr === _).reduce(_ || _)
52bdda74fdSxiaofeibao-xjtu  val isFP32Instrs = Seq(
53bdda74fdSxiaofeibao-xjtu    FADD_S, FSUB_S, FEQ_S, FLT_S, FLE_S, FMIN_S, FMAX_S,
54bdda74fdSxiaofeibao-xjtu    FMUL_S, FDIV_S, FSQRT_S,
55bdda74fdSxiaofeibao-xjtu    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S,
56bdda74fdSxiaofeibao-xjtu    FCLASS_S, FSGNJ_S, FSGNJX_S, FSGNJN_S,
57bdda74fdSxiaofeibao-xjtu  )
58bdda74fdSxiaofeibao-xjtu  val isFP32Instr = isFP32Instrs.map(io.instr === _).reduce(_ || _)
59bdda74fdSxiaofeibao-xjtu  val isFP64Instrs = Seq(
60bdda74fdSxiaofeibao-xjtu    FADD_D, FSUB_D, FEQ_D, FLT_D, FLE_D, FMIN_D, FMAX_D,
61bdda74fdSxiaofeibao-xjtu    FMUL_D, FDIV_D, FSQRT_D,
62bdda74fdSxiaofeibao-xjtu    FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
63bdda74fdSxiaofeibao-xjtu    FCLASS_D, FSGNJ_D, FSGNJX_D, FSGNJN_D,
64bdda74fdSxiaofeibao-xjtu  )
65bdda74fdSxiaofeibao-xjtu  val isFP64Instr = isFP64Instrs.map(io.instr === _).reduce(_ || _)
66572278faSZiyue Zhang  // scalar cvt inst
67572278faSZiyue Zhang  val isSew2Cvts = Seq(
68572278faSZiyue Zhang    FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S,
69572278faSZiyue Zhang    FCVT_W_D, FCVT_WU_D, FCVT_S_D, FCVT_D_S,
70572278faSZiyue Zhang    FMV_X_W,
71572278faSZiyue Zhang  )
72572278faSZiyue Zhang  val isSew2Cvt = isSew2Cvts.map(io.instr === _).reduce(_ || _)
73572278faSZiyue Zhang  val isLmulMf4Cvts = Seq(
74572278faSZiyue Zhang    FCVT_W_S, FCVT_WU_S,
75572278faSZiyue Zhang    FMV_X_W,
76572278faSZiyue Zhang  )
77572278faSZiyue Zhang  val isLmulMf4Cvt = isLmulMf4Cvts.map(io.instr === _).reduce(_ || _)
78*4b136a73Ssinsanction  val needReverseInsts = Seq(
79*4b136a73Ssinsanction    FADD_S, FSUB_S, FADD_D, FSUB_D,
80*4b136a73Ssinsanction    FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D,
81*4b136a73Ssinsanction    FMIN_S, FMAX_S, FMIN_D, FMAX_D,
82*4b136a73Ssinsanction    FMUL_S, FMUL_D,
83*4b136a73Ssinsanction    FDIV_S, FDIV_D, FSQRT_S, FSQRT_D,
84*4b136a73Ssinsanction    FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D,
85*4b136a73Ssinsanction    FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D,
86*4b136a73Ssinsanction  )
87bdda74fdSxiaofeibao-xjtu  val needReverseInst = needReverseInsts.map(_ === inst.ALL).reduce(_ || _)
88bdda74fdSxiaofeibao-xjtu  io.vpuCtrl := 0.U.asTypeOf(io.vpuCtrl)
89bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFpToVecInst := isFpToVecInst
90bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP32Instr   := isFP32Instr
91bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.fpu.isFP64Instr   := isFP64Instr
92bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vill  := false.B
93bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vma   := true.B
94bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vta   := true.B
95572278faSZiyue Zhang  io.vpuCtrl.vsew  := Mux(isFP32Instr || isSew2Cvt, VSew.e32, VSew.e64)
96572278faSZiyue Zhang  io.vpuCtrl.vlmul := Mux(isFP32Instr || isLmulMf4Cvt, VLmul.mf4, VLmul.mf2)
97bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.vm    := inst.VM
98bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.nf    := inst.NF
99d9355d3aSZiyue-Zhang  io.vpuCtrl.veew := inst.WIDTH
100bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isReverse := needReverseInst
101bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isExt     := false.B
102bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isNarrow  := false.B
103bdda74fdSxiaofeibao-xjtu  io.vpuCtrl.isDstMask := false.B
10430fcc710SZiyue Zhang  io.vpuCtrl.isOpMask  := false.B
105bdda74fdSxiaofeibao-xjtu}
106bdda74fdSxiaofeibao-xjtu
107bdda74fdSxiaofeibao-xjtu
1082225d46eSJiawei Linclass FPDecoder(implicit p: Parameters) extends XSModule{
1092ce29ed6SLinJiawei  val io = IO(new Bundle() {
1102ce29ed6SLinJiawei    val instr = Input(UInt(32.W))
1112ce29ed6SLinJiawei    val fpCtrl = Output(new FPUCtrlSignals)
1122ce29ed6SLinJiawei  })
1132ce29ed6SLinJiawei
11498cfe81bSxgkiri  private val inst: XSInstBitFields = io.instr.asTypeOf(new XSInstBitFields)
11598cfe81bSxgkiri
1162ce29ed6SLinJiawei  def X = BitPat("b?")
1172ce29ed6SLinJiawei  def N = BitPat("b0")
1182ce29ed6SLinJiawei  def Y = BitPat("b1")
119dc597826SJiawei Lin  val s = BitPat(FPU.S)
120dc597826SJiawei Lin  val d = BitPat(FPU.D)
121dc597826SJiawei Lin  val i = BitPat(FPU.D)
1222ce29ed6SLinJiawei
123fe73f692SLinJiawei  val default = List(X,X,X,N,N,N,X,X,X)
1242ce29ed6SLinJiawei
1252ce29ed6SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
1262ce29ed6SLinJiawei  val single: Array[(BitPat, List[BitPat])] = Array(
127dc597826SJiawei Lin    // IntToFP
128dc597826SJiawei Lin    FMV_W_X  -> List(N,i,s,Y,N,Y,N,N,N),
129dc597826SJiawei Lin    FCVT_S_W -> List(N,i,s,Y,Y,Y,N,N,Y),
130dc597826SJiawei Lin    FCVT_S_WU-> List(N,i,s,Y,Y,Y,N,N,Y),
131dc597826SJiawei Lin    FCVT_S_L -> List(N,i,s,Y,Y,Y,N,N,Y),
132dc597826SJiawei Lin    FCVT_S_LU-> List(N,i,s,Y,Y,Y,N,N,Y),
133dc597826SJiawei Lin    // FPToInt
134dc597826SJiawei Lin    FMV_X_W  -> List(N,d,i,N,N,N,N,N,N), // dont box result of fmv.fp.int
1358cc1ac81SLinJiawei    FCLASS_S -> List(N,s,i,N,N,N,N,N,N),
1368cc1ac81SLinJiawei    FCVT_W_S -> List(N,s,i,N,Y,N,N,N,Y),
1378cc1ac81SLinJiawei    FCVT_WU_S-> List(N,s,i,N,Y,N,N,N,Y),
1388cc1ac81SLinJiawei    FCVT_L_S -> List(N,s,i,N,Y,N,N,N,Y),
1398cc1ac81SLinJiawei    FCVT_LU_S-> List(N,s,i,N,Y,N,N,N,Y),
1408cc1ac81SLinJiawei    FEQ_S    -> List(N,s,i,N,Y,N,N,N,N),
1418cc1ac81SLinJiawei    FLT_S    -> List(N,s,i,N,Y,N,N,N,N),
1428cc1ac81SLinJiawei    FLE_S    -> List(N,s,i,N,Y,N,N,N,N),
143dc597826SJiawei Lin    // FPToFP
1442ce29ed6SLinJiawei    FSGNJ_S  -> List(N,s,s,N,N,Y,N,N,N),
1452ce29ed6SLinJiawei    FSGNJN_S -> List(N,s,s,N,N,Y,N,N,N),
1462ce29ed6SLinJiawei    FSGNJX_S -> List(N,s,s,N,N,Y,N,N,N),
1472ce29ed6SLinJiawei    FMIN_S   -> List(N,s,s,N,Y,Y,N,N,N),
1482ce29ed6SLinJiawei    FMAX_S   -> List(N,s,s,N,Y,Y,N,N,N),
1492ce29ed6SLinJiawei    FADD_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1502ce29ed6SLinJiawei    FSUB_S   -> List(Y,s,s,N,Y,Y,N,N,N),
1512ce29ed6SLinJiawei    FMUL_S   -> List(N,s,s,N,Y,Y,N,N,N),
1522ce29ed6SLinJiawei    FMADD_S  -> List(N,s,s,N,Y,Y,N,N,N),
1532ce29ed6SLinJiawei    FMSUB_S  -> List(N,s,s,N,Y,Y,N,N,N),
1542ce29ed6SLinJiawei    FNMADD_S -> List(N,s,s,N,Y,Y,N,N,N),
1552ce29ed6SLinJiawei    FNMSUB_S -> List(N,s,s,N,Y,Y,N,N,N),
1562ce29ed6SLinJiawei    FDIV_S   -> List(N,s,s,N,Y,Y,Y,N,N),
1572ce29ed6SLinJiawei    FSQRT_S  -> List(N,s,s,N,Y,Y,N,Y,N)
1582ce29ed6SLinJiawei  )
1592ce29ed6SLinJiawei
160e50fb2d7SLinJiawei
161e50fb2d7SLinJiawei  // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt
162e50fb2d7SLinJiawei  val double: Array[(BitPat, List[BitPat])] = Array(
163dc597826SJiawei Lin    FMV_D_X  -> List(N,i,d,Y,N,Y,N,N,N),
164dc597826SJiawei Lin    FCVT_D_W -> List(N,i,d,Y,Y,Y,N,N,Y),
165dc597826SJiawei Lin    FCVT_D_WU-> List(N,i,d,Y,Y,Y,N,N,Y),
166dc597826SJiawei Lin    FCVT_D_L -> List(N,i,d,Y,Y,Y,N,N,Y),
167dc597826SJiawei Lin    FCVT_D_LU-> List(N,i,d,Y,Y,Y,N,N,Y),
1688cc1ac81SLinJiawei    FMV_X_D  -> List(N,d,i,N,N,N,N,N,N),
1698cc1ac81SLinJiawei    FCLASS_D -> List(N,d,i,N,N,N,N,N,N),
1708cc1ac81SLinJiawei    FCVT_W_D -> List(N,d,i,N,Y,N,N,N,Y),
1718cc1ac81SLinJiawei    FCVT_WU_D-> List(N,d,i,N,Y,N,N,N,Y),
1728cc1ac81SLinJiawei    FCVT_L_D -> List(N,d,i,N,Y,N,N,N,Y),
1738cc1ac81SLinJiawei    FCVT_LU_D-> List(N,d,i,N,Y,N,N,N,Y),
174e50fb2d7SLinJiawei    FCVT_S_D -> List(N,d,s,N,Y,Y,N,N,Y),
175e50fb2d7SLinJiawei    FCVT_D_S -> List(N,s,d,N,Y,Y,N,N,Y),
1768cc1ac81SLinJiawei    FEQ_D    -> List(N,d,i,N,Y,N,N,N,N),
1778cc1ac81SLinJiawei    FLT_D    -> List(N,d,i,N,Y,N,N,N,N),
1788cc1ac81SLinJiawei    FLE_D    -> List(N,d,i,N,Y,N,N,N,N),
179e50fb2d7SLinJiawei    FSGNJ_D  -> List(N,d,d,N,N,Y,N,N,N),
180e50fb2d7SLinJiawei    FSGNJN_D -> List(N,d,d,N,N,Y,N,N,N),
181e50fb2d7SLinJiawei    FSGNJX_D -> List(N,d,d,N,N,Y,N,N,N),
182e50fb2d7SLinJiawei    FMIN_D   -> List(N,d,d,N,Y,Y,N,N,N),
183e50fb2d7SLinJiawei    FMAX_D   -> List(N,d,d,N,Y,Y,N,N,N),
184e50fb2d7SLinJiawei    FADD_D   -> List(Y,d,d,N,Y,Y,N,N,N),
185e50fb2d7SLinJiawei    FSUB_D   -> List(Y,d,d,N,Y,Y,N,N,N),
186e50fb2d7SLinJiawei    FMUL_D   -> List(N,d,d,N,Y,Y,N,N,N),
187e50fb2d7SLinJiawei    FMADD_D  -> List(N,d,d,N,Y,Y,N,N,N),
188e50fb2d7SLinJiawei    FMSUB_D  -> List(N,d,d,N,Y,Y,N,N,N),
189e50fb2d7SLinJiawei    FNMADD_D -> List(N,d,d,N,Y,Y,N,N,N),
190e50fb2d7SLinJiawei    FNMSUB_D -> List(N,d,d,N,Y,Y,N,N,N),
191e50fb2d7SLinJiawei    FDIV_D   -> List(N,d,d,N,Y,Y,Y,N,N),
192e50fb2d7SLinJiawei    FSQRT_D  -> List(N,d,d,N,Y,Y,N,Y,N)
193e50fb2d7SLinJiawei  )
194e50fb2d7SLinJiawei
195e50fb2d7SLinJiawei  val table = single ++ double
1962ce29ed6SLinJiawei
1972ce29ed6SLinJiawei  val decoder = DecodeLogic(io.instr, default, table)
1982ce29ed6SLinJiawei
1992ce29ed6SLinJiawei  val ctrl = io.fpCtrl
2002ce29ed6SLinJiawei  val sigs = Seq(
2012ce29ed6SLinJiawei    ctrl.isAddSub, ctrl.typeTagIn, ctrl.typeTagOut,
2022ce29ed6SLinJiawei    ctrl.fromInt, ctrl.wflags, ctrl.fpWen,
2032ce29ed6SLinJiawei    ctrl.div, ctrl.sqrt, ctrl.fcvt
2042ce29ed6SLinJiawei  )
2052ce29ed6SLinJiawei  sigs.zip(decoder).foreach({case (s, d) => s := d})
20698cfe81bSxgkiri  ctrl.typ := inst.TYP
20798cfe81bSxgkiri  ctrl.fmt := inst.FMT
20898cfe81bSxgkiri  ctrl.rm := inst.RM
2092ce29ed6SLinJiawei
2102ce29ed6SLinJiawei  val fmaTable: Array[(BitPat, List[BitPat])] = Array(
211e50fb2d7SLinJiawei    FADD_S  -> List(BitPat("b00"),N),
212e50fb2d7SLinJiawei    FADD_D  -> List(BitPat("b00"),N),
213e50fb2d7SLinJiawei    FSUB_S  -> List(BitPat("b01"),N),
214e50fb2d7SLinJiawei    FSUB_D  -> List(BitPat("b01"),N),
215e50fb2d7SLinJiawei    FMUL_S  -> List(BitPat("b00"),N),
216e50fb2d7SLinJiawei    FMUL_D  -> List(BitPat("b00"),N),
217e50fb2d7SLinJiawei    FMADD_S -> List(BitPat("b00"),Y),
218e50fb2d7SLinJiawei    FMADD_D -> List(BitPat("b00"),Y),
219e50fb2d7SLinJiawei    FMSUB_S -> List(BitPat("b01"),Y),
220e50fb2d7SLinJiawei    FMSUB_D -> List(BitPat("b01"),Y),
221e50fb2d7SLinJiawei    FNMADD_S-> List(BitPat("b11"),Y),
222e50fb2d7SLinJiawei    FNMADD_D-> List(BitPat("b11"),Y),
223e50fb2d7SLinJiawei    FNMSUB_S-> List(BitPat("b10"),Y),
224e50fb2d7SLinJiawei    FNMSUB_D-> List(BitPat("b10"),Y)
2252ce29ed6SLinJiawei  )
226e50fb2d7SLinJiawei  val fmaDefault = List(BitPat("b??"), N)
227e50fb2d7SLinJiawei  Seq(ctrl.fmaCmd, ctrl.ren3).zip(
2282ce29ed6SLinJiawei    DecodeLogic(io.instr, fmaDefault, fmaTable)
2292ce29ed6SLinJiawei  ).foreach({
2302ce29ed6SLinJiawei    case (s, d) => s := d
2312ce29ed6SLinJiawei  })
2322ce29ed6SLinJiawei}
233