1c6d43980SLemover/*************************************************************************************** 2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory 4c6d43980SLemover* 5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2. 6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at: 8c6d43980SLemover* http://license.coscl.org.cn/MulanPSL2 9c6d43980SLemover* 10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13c6d43980SLemover* 14c6d43980SLemover* See the Mulan PSL v2 for more details. 15c6d43980SLemover***************************************************************************************/ 16c6d43980SLemover 172ce29ed6SLinJiaweipackage xiangshan.backend.decode 182ce29ed6SLinJiawei 198891a219SYinan Xuimport org.chipsalliance.cde.config.Parameters 202ce29ed6SLinJiaweiimport chisel3._ 212ce29ed6SLinJiaweiimport chisel3.util._ 222ce29ed6SLinJiaweiimport freechips.rocketchip.rocket.DecodeLogic 23361e6d51SJiuyang Liuimport freechips.rocketchip.rocket.Instructions._ 2498cfe81bSxgkiriimport xiangshan.backend.decode.isa.bitfield.XSInstBitFields 25dc597826SJiawei Linimport xiangshan.backend.fu.fpu.FPU 26395c8649SZiyue-Zhangimport xiangshan.backend.fu.vector.Bundles.{VSew, VLmul} 27bdda74fdSxiaofeibao-xjtuimport xiangshan.backend.Bundles.VPUCtrlSignals 282ce29ed6SLinJiaweiimport xiangshan.{FPUCtrlSignals, XSModule} 292ce29ed6SLinJiawei 30bdda74fdSxiaofeibao-xjtuclass FPToVecDecoder(implicit p: Parameters) extends XSModule { 31bdda74fdSxiaofeibao-xjtu val io = IO(new Bundle() { 32bdda74fdSxiaofeibao-xjtu val instr = Input(UInt(32.W)) 33bdda74fdSxiaofeibao-xjtu val vpuCtrl = Output(new VPUCtrlSignals) 34bdda74fdSxiaofeibao-xjtu }) 35bdda74fdSxiaofeibao-xjtu 36bdda74fdSxiaofeibao-xjtu val inst = io.instr.asTypeOf(new XSInstBitFields) 37bdda74fdSxiaofeibao-xjtu val fpToVecInsts = Seq( 38bdda74fdSxiaofeibao-xjtu FADD_S, FSUB_S, FADD_D, FSUB_D, 39bdda74fdSxiaofeibao-xjtu FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D, 40bdda74fdSxiaofeibao-xjtu FMIN_S, FMAX_S, FMIN_D, FMAX_D, 41bdda74fdSxiaofeibao-xjtu FMUL_S, FMUL_D, 42bdda74fdSxiaofeibao-xjtu FDIV_S, FDIV_D, FSQRT_S, FSQRT_D, 43bdda74fdSxiaofeibao-xjtu FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D, 44bdda74fdSxiaofeibao-xjtu FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D, 4534f9ccd0SZiyue Zhang 4634f9ccd0SZiyue Zhang // scalar cvt inst 4734f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S, 4834f9ccd0SZiyue Zhang FCVT_W_D, FCVT_WU_D, FCVT_L_D, FCVT_LU_D, FCVT_S_D, FCVT_D_S, 49*b189aafaSzmx FCVT_S_H, FCVT_H_S, FCVT_H_D, FCVT_D_H, 50*b189aafaSzmx FMV_X_W, FMV_X_D, FMV_X_H, 51bdda74fdSxiaofeibao-xjtu ) 52bdda74fdSxiaofeibao-xjtu val isFpToVecInst = fpToVecInsts.map(io.instr === _).reduce(_ || _) 53bdda74fdSxiaofeibao-xjtu val isFP32Instrs = Seq( 54bdda74fdSxiaofeibao-xjtu FADD_S, FSUB_S, FEQ_S, FLT_S, FLE_S, FMIN_S, FMAX_S, 55bdda74fdSxiaofeibao-xjtu FMUL_S, FDIV_S, FSQRT_S, 56bdda74fdSxiaofeibao-xjtu FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, 57bdda74fdSxiaofeibao-xjtu FCLASS_S, FSGNJ_S, FSGNJX_S, FSGNJN_S, 58bdda74fdSxiaofeibao-xjtu ) 59bdda74fdSxiaofeibao-xjtu val isFP32Instr = isFP32Instrs.map(io.instr === _).reduce(_ || _) 60bdda74fdSxiaofeibao-xjtu val isFP64Instrs = Seq( 61bdda74fdSxiaofeibao-xjtu FADD_D, FSUB_D, FEQ_D, FLT_D, FLE_D, FMIN_D, FMAX_D, 62bdda74fdSxiaofeibao-xjtu FMUL_D, FDIV_D, FSQRT_D, 63bdda74fdSxiaofeibao-xjtu FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D, 64bdda74fdSxiaofeibao-xjtu FCLASS_D, FSGNJ_D, FSGNJX_D, FSGNJN_D, 65bdda74fdSxiaofeibao-xjtu ) 66bdda74fdSxiaofeibao-xjtu val isFP64Instr = isFP64Instrs.map(io.instr === _).reduce(_ || _) 6734f9ccd0SZiyue Zhang // scalar cvt inst 6834f9ccd0SZiyue Zhang val isSew2Cvts = Seq( 6934f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, FCVT_L_S, FCVT_LU_S, 7034f9ccd0SZiyue Zhang FCVT_W_D, FCVT_WU_D, FCVT_S_D, FCVT_D_S, 7134f9ccd0SZiyue Zhang FMV_X_W, 7234f9ccd0SZiyue Zhang ) 73*b189aafaSzmx /* 74*b189aafaSzmx The optype for FCVT_D_H and FCVT_H_D is the same, 75*b189aafaSzmx so the two instructions are distinguished by sew. 76*b189aafaSzmx FCVT_H_D:VSew.e64 77*b189aafaSzmx FCVT_D_H:VSew.e16 78*b189aafaSzmx */ 79*b189aafaSzmx val isSew2Cvth = Seq( 80*b189aafaSzmx FCVT_S_H, FCVT_H_S, FCVT_D_H, 81*b189aafaSzmx FMV_X_H, 82*b189aafaSzmx ) 83*b189aafaSzmx val isSew2Cvt32 = isSew2Cvts.map(io.instr === _).reduce(_ || _) 84*b189aafaSzmx val isSew2Cvt16 = isSew2Cvth.map(io.instr === _).reduce(_ || _) 8534f9ccd0SZiyue Zhang val isLmulMf4Cvts = Seq( 8634f9ccd0SZiyue Zhang FCVT_W_S, FCVT_WU_S, 8734f9ccd0SZiyue Zhang FMV_X_W, 8834f9ccd0SZiyue Zhang ) 8934f9ccd0SZiyue Zhang val isLmulMf4Cvt = isLmulMf4Cvts.map(io.instr === _).reduce(_ || _) 904b136a73Ssinsanction val needReverseInsts = Seq( 914b136a73Ssinsanction FADD_S, FSUB_S, FADD_D, FSUB_D, 924b136a73Ssinsanction FEQ_S, FLT_S, FLE_S, FEQ_D, FLT_D, FLE_D, 934b136a73Ssinsanction FMIN_S, FMAX_S, FMIN_D, FMAX_D, 944b136a73Ssinsanction FMUL_S, FMUL_D, 954b136a73Ssinsanction FDIV_S, FDIV_D, FSQRT_S, FSQRT_D, 964b136a73Ssinsanction FMADD_S, FMSUB_S, FNMADD_S, FNMSUB_S, FMADD_D, FMSUB_D, FNMADD_D, FNMSUB_D, 974b136a73Ssinsanction FCLASS_S, FCLASS_D, FSGNJ_S, FSGNJ_D, FSGNJX_S, FSGNJX_D, FSGNJN_S, FSGNJN_D, 984b136a73Ssinsanction ) 99bdda74fdSxiaofeibao-xjtu val needReverseInst = needReverseInsts.map(_ === inst.ALL).reduce(_ || _) 100bdda74fdSxiaofeibao-xjtu io.vpuCtrl := 0.U.asTypeOf(io.vpuCtrl) 101bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFpToVecInst := isFpToVecInst 102bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFP32Instr := isFP32Instr 103bdda74fdSxiaofeibao-xjtu io.vpuCtrl.fpu.isFP64Instr := isFP64Instr 104bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vill := false.B 105bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vma := true.B 106bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vta := true.B 107*b189aafaSzmx io.vpuCtrl.vsew := Mux(isFP32Instr || isSew2Cvt32, VSew.e32, Mux(isSew2Cvt16, VSew.e16, VSew.e64)) 10834f9ccd0SZiyue Zhang io.vpuCtrl.vlmul := Mux(isFP32Instr || isLmulMf4Cvt, VLmul.mf4, VLmul.mf2) 109bdda74fdSxiaofeibao-xjtu io.vpuCtrl.vm := inst.VM 110bdda74fdSxiaofeibao-xjtu io.vpuCtrl.nf := inst.NF 111d9355d3aSZiyue-Zhang io.vpuCtrl.veew := inst.WIDTH 112bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isReverse := needReverseInst 113bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isExt := false.B 114bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isNarrow := false.B 115bdda74fdSxiaofeibao-xjtu io.vpuCtrl.isDstMask := false.B 11630fcc710SZiyue Zhang io.vpuCtrl.isOpMask := false.B 117b6279fc6SZiyue Zhang io.vpuCtrl.isDependOldvd := false.B 118d8ceb649SZiyue Zhang io.vpuCtrl.isWritePartVd := false.B 119bdda74fdSxiaofeibao-xjtu} 120bdda74fdSxiaofeibao-xjtu 121bdda74fdSxiaofeibao-xjtu 1222225d46eSJiawei Linclass FPDecoder(implicit p: Parameters) extends XSModule{ 1232ce29ed6SLinJiawei val io = IO(new Bundle() { 1242ce29ed6SLinJiawei val instr = Input(UInt(32.W)) 1252ce29ed6SLinJiawei val fpCtrl = Output(new FPUCtrlSignals) 1262ce29ed6SLinJiawei }) 1272ce29ed6SLinJiawei 12898cfe81bSxgkiri private val inst: XSInstBitFields = io.instr.asTypeOf(new XSInstBitFields) 12998cfe81bSxgkiri 1302ce29ed6SLinJiawei def X = BitPat("b?") 1312ce29ed6SLinJiawei def N = BitPat("b0") 1322ce29ed6SLinJiawei def Y = BitPat("b1") 133*b189aafaSzmx val s = BitPat(FPU.S(0)) 134*b189aafaSzmx val d = BitPat(FPU.D(0)) 135*b189aafaSzmx val i = BitPat(FPU.D(0)) 1362ce29ed6SLinJiawei 137fe73f692SLinJiawei val default = List(X,X,X,N,N,N,X,X,X) 1382ce29ed6SLinJiawei 1392ce29ed6SLinJiawei // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt 1402ce29ed6SLinJiawei val single: Array[(BitPat, List[BitPat])] = Array( 141dc597826SJiawei Lin // IntToFP 142dc597826SJiawei Lin FMV_W_X -> List(N,i,s,Y,N,Y,N,N,N), 143dc597826SJiawei Lin FCVT_S_W -> List(N,i,s,Y,Y,Y,N,N,Y), 144dc597826SJiawei Lin FCVT_S_WU-> List(N,i,s,Y,Y,Y,N,N,Y), 145dc597826SJiawei Lin FCVT_S_L -> List(N,i,s,Y,Y,Y,N,N,Y), 146dc597826SJiawei Lin FCVT_S_LU-> List(N,i,s,Y,Y,Y,N,N,Y), 147dc597826SJiawei Lin // FPToInt 148dc597826SJiawei Lin FMV_X_W -> List(N,d,i,N,N,N,N,N,N), // dont box result of fmv.fp.int 1498cc1ac81SLinJiawei FCLASS_S -> List(N,s,i,N,N,N,N,N,N), 1508cc1ac81SLinJiawei FCVT_W_S -> List(N,s,i,N,Y,N,N,N,Y), 1518cc1ac81SLinJiawei FCVT_WU_S-> List(N,s,i,N,Y,N,N,N,Y), 1528cc1ac81SLinJiawei FCVT_L_S -> List(N,s,i,N,Y,N,N,N,Y), 1538cc1ac81SLinJiawei FCVT_LU_S-> List(N,s,i,N,Y,N,N,N,Y), 1548cc1ac81SLinJiawei FEQ_S -> List(N,s,i,N,Y,N,N,N,N), 1558cc1ac81SLinJiawei FLT_S -> List(N,s,i,N,Y,N,N,N,N), 1568cc1ac81SLinJiawei FLE_S -> List(N,s,i,N,Y,N,N,N,N), 157dc597826SJiawei Lin // FPToFP 1582ce29ed6SLinJiawei FSGNJ_S -> List(N,s,s,N,N,Y,N,N,N), 1592ce29ed6SLinJiawei FSGNJN_S -> List(N,s,s,N,N,Y,N,N,N), 1602ce29ed6SLinJiawei FSGNJX_S -> List(N,s,s,N,N,Y,N,N,N), 1612ce29ed6SLinJiawei FMIN_S -> List(N,s,s,N,Y,Y,N,N,N), 1622ce29ed6SLinJiawei FMAX_S -> List(N,s,s,N,Y,Y,N,N,N), 1632ce29ed6SLinJiawei FADD_S -> List(Y,s,s,N,Y,Y,N,N,N), 1642ce29ed6SLinJiawei FSUB_S -> List(Y,s,s,N,Y,Y,N,N,N), 1652ce29ed6SLinJiawei FMUL_S -> List(N,s,s,N,Y,Y,N,N,N), 1662ce29ed6SLinJiawei FMADD_S -> List(N,s,s,N,Y,Y,N,N,N), 1672ce29ed6SLinJiawei FMSUB_S -> List(N,s,s,N,Y,Y,N,N,N), 1682ce29ed6SLinJiawei FNMADD_S -> List(N,s,s,N,Y,Y,N,N,N), 1692ce29ed6SLinJiawei FNMSUB_S -> List(N,s,s,N,Y,Y,N,N,N), 1702ce29ed6SLinJiawei FDIV_S -> List(N,s,s,N,Y,Y,Y,N,N), 1712ce29ed6SLinJiawei FSQRT_S -> List(N,s,s,N,Y,Y,N,Y,N) 1722ce29ed6SLinJiawei ) 1732ce29ed6SLinJiawei 174e50fb2d7SLinJiawei 175e50fb2d7SLinJiawei // isAddSub tagIn tagOut fromInt wflags fpWen div sqrt fcvt 176e50fb2d7SLinJiawei val double: Array[(BitPat, List[BitPat])] = Array( 177dc597826SJiawei Lin FMV_D_X -> List(N,i,d,Y,N,Y,N,N,N), 178dc597826SJiawei Lin FCVT_D_W -> List(N,i,d,Y,Y,Y,N,N,Y), 179dc597826SJiawei Lin FCVT_D_WU-> List(N,i,d,Y,Y,Y,N,N,Y), 180dc597826SJiawei Lin FCVT_D_L -> List(N,i,d,Y,Y,Y,N,N,Y), 181dc597826SJiawei Lin FCVT_D_LU-> List(N,i,d,Y,Y,Y,N,N,Y), 1828cc1ac81SLinJiawei FMV_X_D -> List(N,d,i,N,N,N,N,N,N), 1838cc1ac81SLinJiawei FCLASS_D -> List(N,d,i,N,N,N,N,N,N), 1848cc1ac81SLinJiawei FCVT_W_D -> List(N,d,i,N,Y,N,N,N,Y), 1858cc1ac81SLinJiawei FCVT_WU_D-> List(N,d,i,N,Y,N,N,N,Y), 1868cc1ac81SLinJiawei FCVT_L_D -> List(N,d,i,N,Y,N,N,N,Y), 1878cc1ac81SLinJiawei FCVT_LU_D-> List(N,d,i,N,Y,N,N,N,Y), 188e50fb2d7SLinJiawei FCVT_S_D -> List(N,d,s,N,Y,Y,N,N,Y), 189e50fb2d7SLinJiawei FCVT_D_S -> List(N,s,d,N,Y,Y,N,N,Y), 1908cc1ac81SLinJiawei FEQ_D -> List(N,d,i,N,Y,N,N,N,N), 1918cc1ac81SLinJiawei FLT_D -> List(N,d,i,N,Y,N,N,N,N), 1928cc1ac81SLinJiawei FLE_D -> List(N,d,i,N,Y,N,N,N,N), 193e50fb2d7SLinJiawei FSGNJ_D -> List(N,d,d,N,N,Y,N,N,N), 194e50fb2d7SLinJiawei FSGNJN_D -> List(N,d,d,N,N,Y,N,N,N), 195e50fb2d7SLinJiawei FSGNJX_D -> List(N,d,d,N,N,Y,N,N,N), 196e50fb2d7SLinJiawei FMIN_D -> List(N,d,d,N,Y,Y,N,N,N), 197e50fb2d7SLinJiawei FMAX_D -> List(N,d,d,N,Y,Y,N,N,N), 198e50fb2d7SLinJiawei FADD_D -> List(Y,d,d,N,Y,Y,N,N,N), 199e50fb2d7SLinJiawei FSUB_D -> List(Y,d,d,N,Y,Y,N,N,N), 200e50fb2d7SLinJiawei FMUL_D -> List(N,d,d,N,Y,Y,N,N,N), 201e50fb2d7SLinJiawei FMADD_D -> List(N,d,d,N,Y,Y,N,N,N), 202e50fb2d7SLinJiawei FMSUB_D -> List(N,d,d,N,Y,Y,N,N,N), 203e50fb2d7SLinJiawei FNMADD_D -> List(N,d,d,N,Y,Y,N,N,N), 204e50fb2d7SLinJiawei FNMSUB_D -> List(N,d,d,N,Y,Y,N,N,N), 205e50fb2d7SLinJiawei FDIV_D -> List(N,d,d,N,Y,Y,Y,N,N), 206e50fb2d7SLinJiawei FSQRT_D -> List(N,d,d,N,Y,Y,N,Y,N) 207e50fb2d7SLinJiawei ) 208e50fb2d7SLinJiawei 209e50fb2d7SLinJiawei val table = single ++ double 2102ce29ed6SLinJiawei 2112ce29ed6SLinJiawei val decoder = DecodeLogic(io.instr, default, table) 2122ce29ed6SLinJiawei 2132ce29ed6SLinJiawei val ctrl = io.fpCtrl 2142ce29ed6SLinJiawei val sigs = Seq( 2152ce29ed6SLinJiawei ctrl.isAddSub, ctrl.typeTagIn, ctrl.typeTagOut, 2162ce29ed6SLinJiawei ctrl.fromInt, ctrl.wflags, ctrl.fpWen, 2172ce29ed6SLinJiawei ctrl.div, ctrl.sqrt, ctrl.fcvt 2182ce29ed6SLinJiawei ) 2192ce29ed6SLinJiawei sigs.zip(decoder).foreach({case (s, d) => s := d}) 22098cfe81bSxgkiri ctrl.typ := inst.TYP 22198cfe81bSxgkiri ctrl.fmt := inst.FMT 22298cfe81bSxgkiri ctrl.rm := inst.RM 2232ce29ed6SLinJiawei 2242ce29ed6SLinJiawei val fmaTable: Array[(BitPat, List[BitPat])] = Array( 225e50fb2d7SLinJiawei FADD_S -> List(BitPat("b00"),N), 226e50fb2d7SLinJiawei FADD_D -> List(BitPat("b00"),N), 227e50fb2d7SLinJiawei FSUB_S -> List(BitPat("b01"),N), 228e50fb2d7SLinJiawei FSUB_D -> List(BitPat("b01"),N), 229e50fb2d7SLinJiawei FMUL_S -> List(BitPat("b00"),N), 230e50fb2d7SLinJiawei FMUL_D -> List(BitPat("b00"),N), 231e50fb2d7SLinJiawei FMADD_S -> List(BitPat("b00"),Y), 232e50fb2d7SLinJiawei FMADD_D -> List(BitPat("b00"),Y), 233e50fb2d7SLinJiawei FMSUB_S -> List(BitPat("b01"),Y), 234e50fb2d7SLinJiawei FMSUB_D -> List(BitPat("b01"),Y), 235e50fb2d7SLinJiawei FNMADD_S-> List(BitPat("b11"),Y), 236e50fb2d7SLinJiawei FNMADD_D-> List(BitPat("b11"),Y), 237e50fb2d7SLinJiawei FNMSUB_S-> List(BitPat("b10"),Y), 238e50fb2d7SLinJiawei FNMSUB_D-> List(BitPat("b10"),Y) 2392ce29ed6SLinJiawei ) 240e50fb2d7SLinJiawei val fmaDefault = List(BitPat("b??"), N) 241e50fb2d7SLinJiawei Seq(ctrl.fmaCmd, ctrl.ren3).zip( 2422ce29ed6SLinJiawei DecodeLogic(io.instr, fmaDefault, fmaTable) 2432ce29ed6SLinJiawei ).foreach({ 2442ce29ed6SLinJiawei case (s, d) => s := d 2452ce29ed6SLinJiawei }) 2462ce29ed6SLinJiawei} 247