1c6d43980SLemover/*************************************************************************************** 2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory 4c6d43980SLemover* 5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2. 6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at: 8c6d43980SLemover* http://license.coscl.org.cn/MulanPSL2 9c6d43980SLemover* 10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13c6d43980SLemover* 14c6d43980SLemover* See the Mulan PSL v2 for more details. 15c6d43980SLemover***************************************************************************************/ 16c6d43980SLemover 172ce29ed6SLinJiaweipackage xiangshan.backend.decode 182ce29ed6SLinJiawei 198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters 202ce29ed6SLinJiaweiimport chisel3._ 212ce29ed6SLinJiaweiimport chisel3.util._ 222ce29ed6SLinJiaweiimport freechips.rocketchip.rocket.DecodeLogic 23361e6d51SJiuyang Liuimport freechips.rocketchip.rocket.Instructions._ 2498cfe81bSxgkiriimport xiangshan.backend.decode.isa.bitfield.XSInstBitFields 25dc597826SJiawei Linimport xiangshan.backend.fu.fpu.FPU 26395c8649SZiyue-Zhangimport xiangshan.backend.fu.vector.Bundles.{VSew, VLmul} 27bdda74fdSxiaofeibao-xjtuimport xiangshan.backend.Bundles.VPUCtrlSignals 282ce29ed6SLinJiaweiimport xiangshan.{FPUCtrlSignals, XSModule} 292ce29ed6SLinJiawei 30bdda74fdSxiaofeibao-xjtuclass FPToVecDecoder(implicit p: Parameters) extends XSModule { 31bdda74fdSxiaofeibao-xjtu val io = IO(new Bundle() { 32bdda74fdSxiaofeibao-xjtu val instr = Input(UInt(32.W)) 33bdda74fdSxiaofeibao-xjtu val vpuCtrl = Output(new VPUCtrlSignals) 34bdda74fdSxiaofeibao-xjtu }) 35bdda74fdSxiaofeibao-xjtu 36bdda74fdSxiaofeibao-xjtu val inst = io.instr.asTypeOf(new XSInstBitFields) 37bdda74fdSxiaofeibao-xjtu val fpToVecInsts = Seq( 38bdda74fdSxiaofeibao-xjtu FADD_S, FSUB_S, FADD_D, FSUB_D, 39bdda74fdSxiaofeibao-xjtu FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D, 40bdda74fdSxiaofeibao-xjtu FMIN_S, FMAX_S, FMIN_D, FMAX_D, 41bdda74fdSxiaofeibao-xjtu FMUL_S, FMUL_D, 42bdda74fdSxiaofeibao-xjtu FDIV_S, FDIV_D, FSQRT_S, FSQRT_D, 43bdda74fdSxiaofeibao-xjtu FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D, 44bdda74fdSxiaofeibao-xjtu FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D, 45*34f9ccd0SZiyue Zhang 46*34f9ccd0SZiyue Zhang // scalar cvt inst 47*34f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S, 48*34f9ccd0SZiyue Zhang FCVT_W_D, FCVT_WU_D, FCVT_L_D, FCVT_LU_D, FCVT_S_D, FCVT_D_S, 49*34f9ccd0SZiyue Zhang FMV_X_W, FMV_X_D, 50bdda74fdSxiaofeibao-xjtu ) 51bdda74fdSxiaofeibao-xjtu val isFpToVecInst = fpToVecInsts.map(io.instr === _).reduce(_ || _) 52bdda74fdSxiaofeibao-xjtu val isFP32Instrs = Seq( 53bdda74fdSxiaofeibao-xjtu FADD_S, FSUB_S, FEQ_S, FLT_S, FLE_S, FMIN_S, FMAX_S, 54bdda74fdSxiaofeibao-xjtu FMUL_S, FDIV_S, FSQRT_S, 55bdda74fdSxiaofeibao-xjtu FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, 56bdda74fdSxiaofeibao-xjtu FCLASS_S, FSGNJ_S, FSGNJX_S, FSGNJN_S, 57bdda74fdSxiaofeibao-xjtu ) 58bdda74fdSxiaofeibao-xjtu val isFP32Instr = isFP32Instrs.map(io.instr === _).reduce(_ || _) 59bdda74fdSxiaofeibao-xjtu val isFP64Instrs = Seq( 60bdda74fdSxiaofeibao-xjtu FADD_D, FSUB_D, FEQ_D, FLT_D, FLE_D, FMIN_D, FMAX_D, 61bdda74fdSxiaofeibao-xjtu FMUL_D, FDIV_D, FSQRT_D, 62bdda74fdSxiaofeibao-xjtu FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D, 63bdda74fdSxiaofeibao-xjtu FCLASS_D, FSGNJ_D, FSGNJX_D, FSGNJN_D, 64bdda74fdSxiaofeibao-xjtu ) 65bdda74fdSxiaofeibao-xjtu val isFP64Instr = isFP64Instrs.map(io.instr === _).reduce(_ || _) 66*34f9ccd0SZiyue Zhang // scalar cvt inst 67*34f9ccd0SZiyue Zhang val isSew2Cvts = Seq( 68*34f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S, 69*34f9ccd0SZiyue Zhang FCVT_W_D, FCVT_WU_D, FCVT_S_D, FCVT_D_S, 70*34f9ccd0SZiyue Zhang FMV_X_W, 71*34f9ccd0SZiyue Zhang ) 72*34f9ccd0SZiyue Zhang val isSew2Cvt = isSew2Cvts.map(io.instr === _).reduce(_ || _) 73*34f9ccd0SZiyue Zhang val isLmulMf4Cvts = Seq( 74*34f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, 75*34f9ccd0SZiyue Zhang FMV_X_W, 76*34f9ccd0SZiyue Zhang ) 77*34f9ccd0SZiyue Zhang val isLmulMf4Cvt = isLmulMf4Cvts.map(io.instr === _).reduce(_ || _) 78bdda74fdSxiaofeibao-xjtu val needReverseInsts = fpToVecInsts 79bdda74fdSxiaofeibao-xjtu val needReverseInst = needReverseInsts.map(_ === inst.ALL).reduce(_ || _) 80bdda74fdSxiaofeibao-xjtu io.vpuCtrl := 0.U.asTypeOf(io.vpuCtrl) 81bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFpToVecInst := isFpToVecInst 82bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFP32Instr := isFP32Instr 83bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFP64Instr := isFP64Instr 84bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vill := false.B 85bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vma := true.B 86bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vta := true.B 87*34f9ccd0SZiyue Zhang io.vpuCtrl.vsew := Mux(isFP32Instr || isSew2Cvt, VSew.e32, VSew.e64) 88*34f9ccd0SZiyue Zhang io.vpuCtrl.vlmul := Mux(isFP32Instr || isLmulMf4Cvt, VLmul.mf4, VLmul.mf2) 89bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vm := inst.VM 90bdda74fdSxiaofeibao-xjtu io.vpuCtrl.nf := inst.NF 91d9355d3aSZiyue-Zhang io.vpuCtrl.veew := inst.WIDTH 92bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isReverse := needReverseInst 93bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isExt := false.B 94bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isNarrow := false.B 95bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isDstMask := false.B 9630fcc710SZiyue Zhang io.vpuCtrl.isOpMask := false.B 97bdda74fdSxiaofeibao-xjtu} 98bdda74fdSxiaofeibao-xjtu 99bdda74fdSxiaofeibao-xjtu 1002225d46eSJiawei Linclass FPDecoder(implicit p: Parameters) extends XSModule{ 1012ce29ed6SLinJiawei val io = IO(new Bundle() { 1022ce29ed6SLinJiawei val instr = Input(UInt(32.W)) 1032ce29ed6SLinJiawei val fpCtrl = Output(new FPUCtrlSignals) 1042ce29ed6SLinJiawei }) 1052ce29ed6SLinJiawei 10698cfe81bSxgkiri private val inst: XSInstBitFields = io.instr.asTypeOf(new XSInstBitFields) 10798cfe81bSxgkiri 1082ce29ed6SLinJiawei def X = BitPat("b?") 1092ce29ed6SLinJiawei def N = BitPat("b0") 1102ce29ed6SLinJiawei def Y = BitPat("b1") 111dc597826SJiawei Lin val s = BitPat(FPU.S) 112dc597826SJiawei Lin val d = BitPat(FPU.D) 113dc597826SJiawei Lin val i = BitPat(FPU.D) 1142ce29ed6SLinJiawei 115fe73f692SLinJiawei val default = List(X,X,X,N,N,N,X,X,X) 1162ce29ed6SLinJiawei 1172ce29ed6SLinJiawei // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt 1182ce29ed6SLinJiawei val single: Array[(BitPat, List[BitPat])] = Array( 119dc597826SJiawei Lin // IntToFP 120dc597826SJiawei Lin FMV_W_X -> List(N,i,s,Y,N,Y,N,N,N), 121dc597826SJiawei Lin FCVT_S_W -> List(N,i,s,Y,Y,Y,N,N,Y), 122dc597826SJiawei Lin FCVT_S_WU-> List(N,i,s,Y,Y,Y,N,N,Y), 123dc597826SJiawei Lin FCVT_S_L -> List(N,i,s,Y,Y,Y,N,N,Y), 124dc597826SJiawei Lin FCVT_S_LU-> List(N,i,s,Y,Y,Y,N,N,Y), 125dc597826SJiawei Lin // FPToInt 126dc597826SJiawei Lin FMV_X_W -> List(N,d,i,N,N,N,N,N,N), // dont box result of fmv.fp.int 1278cc1ac81SLinJiawei FCLASS_S -> List(N,s,i,N,N,N,N,N,N), 1288cc1ac81SLinJiawei FCVT_W_S -> List(N,s,i,N,Y,N,N,N,Y), 1298cc1ac81SLinJiawei FCVT_WU_S-> List(N,s,i,N,Y,N,N,N,Y), 1308cc1ac81SLinJiawei FCVT_L_S -> List(N,s,i,N,Y,N,N,N,Y), 1318cc1ac81SLinJiawei FCVT_LU_S-> List(N,s,i,N,Y,N,N,N,Y), 1328cc1ac81SLinJiawei FEQ_S -> List(N,s,i,N,Y,N,N,N,N), 1338cc1ac81SLinJiawei FLT_S -> List(N,s,i,N,Y,N,N,N,N), 1348cc1ac81SLinJiawei FLE_S -> List(N,s,i,N,Y,N,N,N,N), 135dc597826SJiawei Lin // FPToFP 1362ce29ed6SLinJiawei FSGNJ_S -> List(N,s,s,N,N,Y,N,N,N), 1372ce29ed6SLinJiawei FSGNJN_S -> List(N,s,s,N,N,Y,N,N,N), 1382ce29ed6SLinJiawei FSGNJX_S -> List(N,s,s,N,N,Y,N,N,N), 1392ce29ed6SLinJiawei FMIN_S -> List(N,s,s,N,Y,Y,N,N,N), 1402ce29ed6SLinJiawei FMAX_S -> List(N,s,s,N,Y,Y,N,N,N), 1412ce29ed6SLinJiawei FADD_S -> List(Y,s,s,N,Y,Y,N,N,N), 1422ce29ed6SLinJiawei FSUB_S -> List(Y,s,s,N,Y,Y,N,N,N), 1432ce29ed6SLinJiawei FMUL_S -> List(N,s,s,N,Y,Y,N,N,N), 1442ce29ed6SLinJiawei FMADD_S -> List(N,s,s,N,Y,Y,N,N,N), 1452ce29ed6SLinJiawei FMSUB_S -> List(N,s,s,N,Y,Y,N,N,N), 1462ce29ed6SLinJiawei FNMADD_S -> List(N,s,s,N,Y,Y,N,N,N), 1472ce29ed6SLinJiawei FNMSUB_S -> List(N,s,s,N,Y,Y,N,N,N), 1482ce29ed6SLinJiawei FDIV_S -> List(N,s,s,N,Y,Y,Y,N,N), 1492ce29ed6SLinJiawei FSQRT_S -> List(N,s,s,N,Y,Y,N,Y,N) 1502ce29ed6SLinJiawei ) 1512ce29ed6SLinJiawei 152e50fb2d7SLinJiawei 153e50fb2d7SLinJiawei // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt 154e50fb2d7SLinJiawei val double: Array[(BitPat, List[BitPat])] = Array( 155dc597826SJiawei Lin FMV_D_X -> List(N,i,d,Y,N,Y,N,N,N), 156dc597826SJiawei Lin FCVT_D_W -> List(N,i,d,Y,Y,Y,N,N,Y), 157dc597826SJiawei Lin FCVT_D_WU-> List(N,i,d,Y,Y,Y,N,N,Y), 158dc597826SJiawei Lin FCVT_D_L -> List(N,i,d,Y,Y,Y,N,N,Y), 159dc597826SJiawei Lin FCVT_D_LU-> List(N,i,d,Y,Y,Y,N,N,Y), 1608cc1ac81SLinJiawei FMV_X_D -> List(N,d,i,N,N,N,N,N,N), 1618cc1ac81SLinJiawei FCLASS_D -> List(N,d,i,N,N,N,N,N,N), 1628cc1ac81SLinJiawei FCVT_W_D -> List(N,d,i,N,Y,N,N,N,Y), 1638cc1ac81SLinJiawei FCVT_WU_D-> List(N,d,i,N,Y,N,N,N,Y), 1648cc1ac81SLinJiawei FCVT_L_D -> List(N,d,i,N,Y,N,N,N,Y), 1658cc1ac81SLinJiawei FCVT_LU_D-> List(N,d,i,N,Y,N,N,N,Y), 166e50fb2d7SLinJiawei FCVT_S_D -> List(N,d,s,N,Y,Y,N,N,Y), 167e50fb2d7SLinJiawei FCVT_D_S -> List(N,s,d,N,Y,Y,N,N,Y), 1688cc1ac81SLinJiawei FEQ_D -> List(N,d,i,N,Y,N,N,N,N), 1698cc1ac81SLinJiawei FLT_D -> List(N,d,i,N,Y,N,N,N,N), 1708cc1ac81SLinJiawei FLE_D -> List(N,d,i,N,Y,N,N,N,N), 171e50fb2d7SLinJiawei FSGNJ_D -> List(N,d,d,N,N,Y,N,N,N), 172e50fb2d7SLinJiawei FSGNJN_D -> List(N,d,d,N,N,Y,N,N,N), 173e50fb2d7SLinJiawei FSGNJX_D -> List(N,d,d,N,N,Y,N,N,N), 174e50fb2d7SLinJiawei FMIN_D -> List(N,d,d,N,Y,Y,N,N,N), 175e50fb2d7SLinJiawei FMAX_D -> List(N,d,d,N,Y,Y,N,N,N), 176e50fb2d7SLinJiawei FADD_D -> List(Y,d,d,N,Y,Y,N,N,N), 177e50fb2d7SLinJiawei FSUB_D -> List(Y,d,d,N,Y,Y,N,N,N), 178e50fb2d7SLinJiawei FMUL_D -> List(N,d,d,N,Y,Y,N,N,N), 179e50fb2d7SLinJiawei FMADD_D -> List(N,d,d,N,Y,Y,N,N,N), 180e50fb2d7SLinJiawei FMSUB_D -> List(N,d,d,N,Y,Y,N,N,N), 181e50fb2d7SLinJiawei FNMADD_D -> List(N,d,d,N,Y,Y,N,N,N), 182e50fb2d7SLinJiawei FNMSUB_D -> List(N,d,d,N,Y,Y,N,N,N), 183e50fb2d7SLinJiawei FDIV_D -> List(N,d,d,N,Y,Y,Y,N,N), 184e50fb2d7SLinJiawei FSQRT_D -> List(N,d,d,N,Y,Y,N,Y,N) 185e50fb2d7SLinJiawei ) 186e50fb2d7SLinJiawei 187e50fb2d7SLinJiawei val table = single ++ double 1882ce29ed6SLinJiawei 1892ce29ed6SLinJiawei val decoder = DecodeLogic(io.instr, default, table) 1902ce29ed6SLinJiawei 1912ce29ed6SLinJiawei val ctrl = io.fpCtrl 1922ce29ed6SLinJiawei val sigs = Seq( 1932ce29ed6SLinJiawei ctrl.isAddSub, ctrl.typeTagIn, ctrl.typeTagOut, 1942ce29ed6SLinJiawei ctrl.fromInt, ctrl.wflags, ctrl.fpWen, 1952ce29ed6SLinJiawei ctrl.div, ctrl.sqrt, ctrl.fcvt 1962ce29ed6SLinJiawei ) 1972ce29ed6SLinJiawei sigs.zip(decoder).foreach({case (s, d) => s := d}) 19898cfe81bSxgkiri ctrl.typ := inst.TYP 19998cfe81bSxgkiri ctrl.fmt := inst.FMT 20098cfe81bSxgkiri ctrl.rm := inst.RM 2012ce29ed6SLinJiawei 2022ce29ed6SLinJiawei val fmaTable: Array[(BitPat, List[BitPat])] = Array( 203e50fb2d7SLinJiawei FADD_S -> List(BitPat("b00"),N), 204e50fb2d7SLinJiawei FADD_D -> List(BitPat("b00"),N), 205e50fb2d7SLinJiawei FSUB_S -> List(BitPat("b01"),N), 206e50fb2d7SLinJiawei FSUB_D -> List(BitPat("b01"),N), 207e50fb2d7SLinJiawei FMUL_S -> List(BitPat("b00"),N), 208e50fb2d7SLinJiawei FMUL_D -> List(BitPat("b00"),N), 209e50fb2d7SLinJiawei FMADD_S -> List(BitPat("b00"),Y), 210e50fb2d7SLinJiawei FMADD_D -> List(BitPat("b00"),Y), 211e50fb2d7SLinJiawei FMSUB_S -> List(BitPat("b01"),Y), 212e50fb2d7SLinJiawei FMSUB_D -> List(BitPat("b01"),Y), 213e50fb2d7SLinJiawei FNMADD_S-> List(BitPat("b11"),Y), 214e50fb2d7SLinJiawei FNMADD_D-> List(BitPat("b11"),Y), 215e50fb2d7SLinJiawei FNMSUB_S-> List(BitPat("b10"),Y), 216e50fb2d7SLinJiawei FNMSUB_D-> List(BitPat("b10"),Y) 2172ce29ed6SLinJiawei ) 218e50fb2d7SLinJiawei val fmaDefault = List(BitPat("b??"), N) 219e50fb2d7SLinJiawei Seq(ctrl.fmaCmd, ctrl.ren3).zip( 2202ce29ed6SLinJiawei DecodeLogic(io.instr, fmaDefault, fmaTable) 2212ce29ed6SLinJiawei ).foreach({ 2222ce29ed6SLinJiawei case (s, d) => s := d 2232ce29ed6SLinJiawei }) 2242ce29ed6SLinJiawei} 225