xref: /XiangShan/src/main/scala/xiangshan/backend/decode/UopInfoGen.scala (revision 3d4459fa987cd6da9aa9a4fa78361b2be313fda8)
17f9f0a79SzhanglyGit/***************************************************************************************
27f9f0a79SzhanglyGit  * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
37f9f0a79SzhanglyGit  * Copyright (c) 2020-2021 Peng Cheng Laboratory
47f9f0a79SzhanglyGit  *
57f9f0a79SzhanglyGit  * XiangShan is licensed under Mulan PSL v2.
67f9f0a79SzhanglyGit  * You can use this software according to the terms and conditions of the Mulan PSL v2.
77f9f0a79SzhanglyGit  * You may obtain a copy of Mulan PSL v2 at:
87f9f0a79SzhanglyGit  *          http://license.coscl.org.cn/MulanPSL2
97f9f0a79SzhanglyGit  *
107f9f0a79SzhanglyGit  * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
117f9f0a79SzhanglyGit  * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
127f9f0a79SzhanglyGit  * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
137f9f0a79SzhanglyGit  *
147f9f0a79SzhanglyGit  * See the Mulan PSL v2 for more details.
157f9f0a79SzhanglyGit  ***************************************************************************************/
167f9f0a79SzhanglyGit
177f9f0a79SzhanglyGitpackage xiangshan.backend.decode
187f9f0a79SzhanglyGit
1983ba63b3SXuan Huimport org.chipsalliance.cde.config.Parameters
207f9f0a79SzhanglyGitimport chisel3._
217f9f0a79SzhanglyGitimport chisel3.util._
227f9f0a79SzhanglyGitimport freechips.rocketchip.rocket.Instructions
237f9f0a79SzhanglyGitimport freechips.rocketchip.util.uintToBitPat
247f9f0a79SzhanglyGitimport utils._
257f9f0a79SzhanglyGitimport utility._
267f9f0a79SzhanglyGitimport xiangshan.ExceptionNO.illegalInstr
277f9f0a79SzhanglyGitimport xiangshan._
287f9f0a79SzhanglyGitimport xiangshan.backend.fu.fpu.FPU
297f9f0a79SzhanglyGitimport xiangshan.backend.fu.FuType
307f9f0a79SzhanglyGitimport freechips.rocketchip.rocket.Instructions._
317f9f0a79SzhanglyGitimport xiangshan.backend.Bundles.{DecodedInst, StaticInst}
327f9f0a79SzhanglyGitimport xiangshan.backend.fu.vector.Bundles.{VType, VLmul, VSew}
337f9f0a79SzhanglyGitimport yunsuan.VpermType
34c4501a6fSZiyue-Zhangimport chisel3.util.experimental.decode.{QMCMinimizer, TruthTable, decoder}
35c4501a6fSZiyue-Zhang
36c4501a6fSZiyue-Zhangclass strdiedLSNumOfUopTable() extends Module {
37c4501a6fSZiyue-Zhang  val src = IO(Input(UInt(5.W)))
38c4501a6fSZiyue-Zhang  val out = IO(Output(UInt(4.W)))
39c4501a6fSZiyue-Zhang  // strided load/store
40c4501a6fSZiyue-Zhang  var combVemulNf : Seq[(Int, Int, Int)] = Seq()
41c4501a6fSZiyue-Zhang  for (emul <- 0 until 4) {
42c4501a6fSZiyue-Zhang    for (nf <- 0 until 8) {
43c4501a6fSZiyue-Zhang      if ((1 << emul) * (nf + 1) <= 8) {
44c4501a6fSZiyue-Zhang        combVemulNf :+= (emul, nf, (1 << emul) * (nf + 1))
45c4501a6fSZiyue-Zhang      } else {
46c4501a6fSZiyue-Zhang        combVemulNf :+= (emul, nf, 0)
47c4501a6fSZiyue-Zhang      }
48c4501a6fSZiyue-Zhang    }
49c4501a6fSZiyue-Zhang  }
50c4501a6fSZiyue-Zhang  out := decoder(QMCMinimizer, src, TruthTable(combVemulNf.map {
51c4501a6fSZiyue-Zhang    case (emul, nf, uopNum) => (BitPat((emul << 3 | nf).U(5.W)), BitPat(uopNum.U(4.W)))
52c4501a6fSZiyue-Zhang  }, BitPat.N(4)))
53c4501a6fSZiyue-Zhang}
54c4501a6fSZiyue-Zhang
55c4501a6fSZiyue-Zhangclass indexedLSNumOfUopTable() extends Module {
56c4501a6fSZiyue-Zhang  val src = IO(Input(UInt(7.W)))
57c4501a6fSZiyue-Zhang  val out = IO(Output(UInt(7.W)))
58c4501a6fSZiyue-Zhang  // strided load/store
59c4501a6fSZiyue-Zhang  var combVemulNf : Seq[(Int, Int, Int, Int)] = Seq()
60c4501a6fSZiyue-Zhang  for (emul <- 0 until 4) {
61c4501a6fSZiyue-Zhang    for (lmul <- 0 until 4) {
6255f7bedaSZiyue Zhang      var emul_val = 1 << emul
6355f7bedaSZiyue Zhang      var lmul_val = 1 << lmul
6455f7bedaSZiyue Zhang      var mul_max = if (emul_val > lmul_val) emul_val else lmul_val
6555f7bedaSZiyue Zhang      // nf = 0, number of uop = Max(lmul, emul)
6655f7bedaSZiyue Zhang      if ((1 << lmul) <= 8) {    // indexed load/store must ensure that the lmul * nf is less or equal to 8
6755f7bedaSZiyue Zhang        combVemulNf :+= (emul, lmul, 0, mul_max)
6855f7bedaSZiyue Zhang      } else {
6955f7bedaSZiyue Zhang        combVemulNf :+= (emul, lmul, 0, 0)
7055f7bedaSZiyue Zhang      }
7155f7bedaSZiyue Zhang      // nf > 0, number of uop = Max(lmul * nf, emul)
7255f7bedaSZiyue Zhang      for (nf <- 1 until 8) {
7355f7bedaSZiyue Zhang        var uop_num = if (lmul_val * (nf + 1) > emul_val) lmul_val * (nf + 1) else emul_val
7455f7bedaSZiyue Zhang        if (lmul_val * (nf + 1) <= 8) {    // indexed load/store must ensure that the lmul * nf is less or equal to 8
7555f7bedaSZiyue Zhang          combVemulNf :+= (emul, lmul, nf, uop_num)
76c4501a6fSZiyue-Zhang        } else {
77c4501a6fSZiyue-Zhang          combVemulNf :+= (emul, lmul, nf, 0)
78c4501a6fSZiyue-Zhang        }
79c4501a6fSZiyue-Zhang      }
80c4501a6fSZiyue-Zhang    }
81c4501a6fSZiyue-Zhang  }
82c4501a6fSZiyue-Zhang  out := decoder(QMCMinimizer, src, TruthTable(combVemulNf.map {
8355f7bedaSZiyue Zhang    case (emul, lmul, nf, uopNum) => (BitPat((emul << 5 | lmul << 3 | nf).U(7.W)), BitPat(uopNum.U(4.W)))
8455f7bedaSZiyue Zhang  }, BitPat.N(4)))
85c4501a6fSZiyue-Zhang}
867f9f0a79SzhanglyGit
877f9f0a79SzhanglyGitclass UopInfoGen (implicit p: Parameters) extends XSModule {
887f9f0a79SzhanglyGit  val io = IO(new UopInfoGenIO)
897f9f0a79SzhanglyGit
90c4501a6fSZiyue-Zhang  val stridedLSTable = Module(new strdiedLSNumOfUopTable)     // decoder for strided load/store
91c4501a6fSZiyue-Zhang  val indexedLSTable = Module(new indexedLSNumOfUopTable)     // decoder for indexed load/store
92c4501a6fSZiyue-Zhang
9387dd4e0dSzhanglyGit  val typeOfSplit = io.in.preInfo.typeOfSplit
9487dd4e0dSzhanglyGit  val vsew = Cat(0.U(1.W), io.in.preInfo.vsew)
9587dd4e0dSzhanglyGit  val veew = Cat(0.U(1.W), io.in.preInfo.vwidth(1, 0))
960a34fc22SZiyue Zhang  val vmvn = io.in.preInfo.vmvn
9706cb2bc1Sweidingliu  val isVlsr = io.in.preInfo.isVlsr
98c90e3eacSZiyue Zhang  val isVlsm = io.in.preInfo.isVlsm
9987dd4e0dSzhanglyGit  val vlmul = io.in.preInfo.vlmul
100c4501a6fSZiyue-Zhang  val nf = io.in.preInfo.nf
1017f9f0a79SzhanglyGit  val isComplex = io.out.isComplex
1027f9f0a79SzhanglyGit
10319d66d7fSXuan Hu  val lmul = MuxLookup(vlmul, 1.U(4.W))(Array(
1047f9f0a79SzhanglyGit    "b001".U -> 2.U,
1057f9f0a79SzhanglyGit    "b010".U -> 4.U,
1067f9f0a79SzhanglyGit    "b011".U -> 8.U
1077f9f0a79SzhanglyGit  ))
10819d66d7fSXuan Hu  val simple_lmul = MuxLookup(vlmul, 0.U(2.W))(Array(
109c4501a6fSZiyue-Zhang    "b001".U -> 1.U,
110c4501a6fSZiyue-Zhang    "b010".U -> 2.U,
111c4501a6fSZiyue-Zhang    "b011".U -> 3.U
112c4501a6fSZiyue-Zhang  ))
1137f9f0a79SzhanglyGit
1147f9f0a79SzhanglyGit  val vemul: UInt = veew.asUInt + 1.U + vlmul.asUInt + ~vsew.asUInt
1157f9f0a79SzhanglyGit
11619d66d7fSXuan Hu  val emul = MuxLookup(vemul, 1.U(4.W))(Array(
1177f9f0a79SzhanglyGit    "b001".U -> 2.U,
1187f9f0a79SzhanglyGit    "b010".U -> 4.U,
1197f9f0a79SzhanglyGit    "b011".U -> 8.U
1207f9f0a79SzhanglyGit  ))                                                              //TODO : eew and emul illegal exception need to be handled
12119d66d7fSXuan Hu  val simple_emul = MuxLookup(vemul, 0.U(2.W))(Array(
122c4501a6fSZiyue-Zhang    "b001".U -> 1.U,
123c4501a6fSZiyue-Zhang    "b010".U -> 2.U,
124c4501a6fSZiyue-Zhang    "b011".U -> 3.U
125c4501a6fSZiyue-Zhang  ))
1267f9f0a79SzhanglyGit
12719d66d7fSXuan Hu  val numOfUopVslide = MuxLookup(vlmul, 1.U(log2Up(MaxUopSize + 1).W))(Array(
1287f9f0a79SzhanglyGit    "b001".U -> 3.U,
1297f9f0a79SzhanglyGit    "b010".U -> 10.U,
1307f9f0a79SzhanglyGit    "b011".U -> 36.U
1317f9f0a79SzhanglyGit  ))
13219d66d7fSXuan Hu  val numOfUopVrgather = MuxLookup(vlmul, 1.U(log2Up(MaxUopSize + 1).W))(Array(
1337f9f0a79SzhanglyGit    "b001".U -> 4.U,
1347f9f0a79SzhanglyGit    "b010".U -> 16.U,
1357f9f0a79SzhanglyGit    "b011".U -> 64.U
1367f9f0a79SzhanglyGit  ))
1377f9f0a79SzhanglyGit  val numOfUopVrgatherei16 = Mux((!vsew.orR) && (vlmul =/= "b011".U),
1387f9f0a79SzhanglyGit    Cat(numOfUopVrgather, 0.U(1.W)),
1397f9f0a79SzhanglyGit    numOfUopVrgather
1407f9f0a79SzhanglyGit  )
14119d66d7fSXuan Hu  val numOfUopVcompress = MuxLookup(vlmul, 1.U(4.W))(Array(
1427f9f0a79SzhanglyGit    "b001".U -> 4.U,
1437f9f0a79SzhanglyGit    "b010".U -> 13.U,
1447f9f0a79SzhanglyGit    "b011".U -> 43.U
1457f9f0a79SzhanglyGit  ))
146582849ffSxiaofeibao-xjtu  val numOfUopVFRED = {
147582849ffSxiaofeibao-xjtu    // addTime include add frs1
14819d66d7fSXuan Hu     val addTime = MuxLookup(vlmul, 1.U(4.W))(Array(
149582849ffSxiaofeibao-xjtu       VLmul.m2 -> 2.U,
150582849ffSxiaofeibao-xjtu       VLmul.m4 -> 4.U,
151582849ffSxiaofeibao-xjtu       VLmul.m8 -> 8.U,
152582849ffSxiaofeibao-xjtu     ))
15319d66d7fSXuan Hu    val foldLastVlmul = MuxLookup(vsew, "b000".U)(Array(
154582849ffSxiaofeibao-xjtu      VSew.e16 -> VLmul.mf8,
155582849ffSxiaofeibao-xjtu      VSew.e32 -> VLmul.mf4,
156582849ffSxiaofeibao-xjtu      VSew.e64 -> VLmul.mf2,
157582849ffSxiaofeibao-xjtu    ))
158582849ffSxiaofeibao-xjtu    // lmul < 1, foldTime = vlmul - foldFastVlmul
159582849ffSxiaofeibao-xjtu    // lmul >= 1, foldTime = 0.U - foldFastVlmul
160582849ffSxiaofeibao-xjtu    val foldTime = Mux(vlmul(2), vlmul, 0.U) - foldLastVlmul
161582849ffSxiaofeibao-xjtu    addTime + foldTime
162582849ffSxiaofeibao-xjtu  }
163b94b1889Sxiaofeibao-xjtu  val numOfUopVFREDOSUM = {
16419d66d7fSXuan Hu    val uvlMax = MuxLookup(vsew, 0.U)(Array(
165b94b1889Sxiaofeibao-xjtu      VSew.e16 -> 8.U,
166b94b1889Sxiaofeibao-xjtu      VSew.e32 -> 4.U,
167b94b1889Sxiaofeibao-xjtu      VSew.e64 -> 2.U,
168b94b1889Sxiaofeibao-xjtu    ))
169b94b1889Sxiaofeibao-xjtu    val vlMax = Wire(UInt(7.W))
170b94b1889Sxiaofeibao-xjtu    vlMax := Mux(vlmul(2), uvlMax >> (-vlmul)(1,0), uvlMax << vlmul(1,0)).asUInt
171b94b1889Sxiaofeibao-xjtu    vlMax
172b94b1889Sxiaofeibao-xjtu  }
173904d2184SZiyue Zhang  /*
174904d2184SZiyue Zhang   * when 1 <= lmul <= 4, numOfUopWV = 2 * lmul, otherwise numOfUopWV = 1
175904d2184SZiyue Zhang   */
17619d66d7fSXuan Hu  val numOfUopWV = MuxLookup(vlmul, 1.U(4.W))(Array(
177904d2184SZiyue Zhang    "b000".U -> 2.U,
178904d2184SZiyue Zhang    "b001".U -> 4.U,
179904d2184SZiyue Zhang    "b010".U -> 8.U,
180904d2184SZiyue Zhang  ))
181904d2184SZiyue Zhang  /*
182904d2184SZiyue Zhang   * need an extra move instruction
183904d2184SZiyue Zhang   * when 1 <= lmul <= 4, numOfUopWX = 2 * lmul + 1, otherwise numOfUopWX = 2
184904d2184SZiyue Zhang   */
18519d66d7fSXuan Hu  val numOfUopWX = MuxLookup(vlmul, 2.U(4.W))(Array(
186904d2184SZiyue Zhang    "b000".U -> 3.U,
187904d2184SZiyue Zhang    "b001".U -> 5.U,
188904d2184SZiyue Zhang    "b010".U -> 9.U,
189904d2184SZiyue Zhang  ))
1907f9f0a79SzhanglyGit
191c4501a6fSZiyue-Zhang  stridedLSTable.src := Cat(simple_emul, nf)
192c4501a6fSZiyue-Zhang  val numOfUopVLoadStoreStrided = stridedLSTable.out
193c4501a6fSZiyue-Zhang  indexedLSTable.src := Cat(simple_emul, simple_lmul, nf)
194c4501a6fSZiyue-Zhang  val numOfUopVLoadStoreIndexed = indexedLSTable.out
195c4501a6fSZiyue-Zhang
1967f9f0a79SzhanglyGit  //number of uop
19719d66d7fSXuan Hu  val numOfUop = MuxLookup(typeOfSplit, 1.U(log2Up(MaxUopSize + 1).W))(Array(
198e25c13faSXuan Hu    UopSplitType.VSET -> 2.U,
1997f9f0a79SzhanglyGit    UopSplitType.VEC_0XV -> 2.U,
2007f9f0a79SzhanglyGit    UopSplitType.VEC_VVV -> lmul,
201395c8649SZiyue-Zhang    UopSplitType.VEC_VFV -> (lmul +& 1.U),
2027f9f0a79SzhanglyGit    UopSplitType.VEC_EXT2 -> lmul,
2037f9f0a79SzhanglyGit    UopSplitType.VEC_EXT4 -> lmul,
2047f9f0a79SzhanglyGit    UopSplitType.VEC_EXT8 -> lmul,
2057f9f0a79SzhanglyGit    UopSplitType.VEC_VVM -> lmul,
206395c8649SZiyue-Zhang    UopSplitType.VEC_VFM -> (lmul +& 1.U),
207582849ffSxiaofeibao-xjtu    UopSplitType.VEC_VFRED -> numOfUopVFRED,
208b94b1889Sxiaofeibao-xjtu    UopSplitType.VEC_VFREDOSUM -> numOfUopVFREDOSUM,
2097f9f0a79SzhanglyGit    UopSplitType.VEC_VXM -> (lmul +& 1.U),
2107f9f0a79SzhanglyGit    UopSplitType.VEC_VXV -> (lmul +& 1.U),
211395c8649SZiyue-Zhang    UopSplitType.VEC_VFW -> numOfUopWX, // lmul <= 4
212395c8649SZiyue-Zhang    UopSplitType.VEC_WFW -> numOfUopWX, // lmul <= 4
213904d2184SZiyue Zhang    UopSplitType.VEC_VVW -> numOfUopWV, // lmul <= 4
214904d2184SZiyue Zhang    UopSplitType.VEC_WVW -> numOfUopWV, // lmul <= 4
215904d2184SZiyue Zhang    UopSplitType.VEC_VXW -> numOfUopWX, // lmul <= 4
216904d2184SZiyue Zhang    UopSplitType.VEC_WXW -> numOfUopWX, // lmul <= 4
217904d2184SZiyue Zhang    UopSplitType.VEC_WVV -> numOfUopWV, // lmul <= 4
218904d2184SZiyue Zhang    UopSplitType.VEC_WXV -> numOfUopWX, // lmul <= 4
2197f9f0a79SzhanglyGit    UopSplitType.VEC_SLIDE1UP -> (lmul +& 1.U),
220395c8649SZiyue-Zhang    UopSplitType.VEC_FSLIDE1UP -> (lmul +& 1.U),
2217f9f0a79SzhanglyGit    UopSplitType.VEC_SLIDE1DOWN -> Cat(lmul, 0.U(1.W)),
222395c8649SZiyue-Zhang    UopSplitType.VEC_FSLIDE1DOWN -> Cat(lmul, 0.U(1.W)),
2237f9f0a79SzhanglyGit    UopSplitType.VEC_VRED -> lmul,
2247f9f0a79SzhanglyGit    UopSplitType.VEC_SLIDEUP -> (numOfUopVslide + 1.U),
2257f9f0a79SzhanglyGit    UopSplitType.VEC_SLIDEDOWN -> (numOfUopVslide + 1.U),
226cd2c45feSZiyue Zhang    UopSplitType.VEC_M0X -> lmul,
2277f9f0a79SzhanglyGit    UopSplitType.VEC_MVV -> (Cat(lmul, 0.U(1.W)) - 1.U),
2283bb22d12SZiyue Zhang    UopSplitType.VEC_VWW -> Cat(lmul, 0.U(1.W)), // lmul <= 4
2297f9f0a79SzhanglyGit    UopSplitType.VEC_RGATHER -> numOfUopVrgather,
2307f9f0a79SzhanglyGit    UopSplitType.VEC_RGATHER_VX -> (numOfUopVrgather +& 1.U),
2317f9f0a79SzhanglyGit    UopSplitType.VEC_RGATHEREI16 -> numOfUopVrgatherei16,
2325da52072SsinceforYy    UopSplitType.VEC_COMPRESS -> numOfUopVcompress,
2330a34fc22SZiyue Zhang    UopSplitType.VEC_MVNR -> (vmvn +& 1.U),
234c90e3eacSZiyue Zhang    UopSplitType.VEC_US_LDST -> Mux(isVlsr, nf +& 2.U, Mux(isVlsm, 2.U, (numOfUopVLoadStoreStrided +& 1.U))),   // with one move instruction
235c4501a6fSZiyue-Zhang    UopSplitType.VEC_S_LDST -> (numOfUopVLoadStoreStrided +& 2.U),    // with two move instructions
236c4501a6fSZiyue-Zhang    UopSplitType.VEC_I_LDST -> (numOfUopVLoadStoreIndexed +& 1.U),
2377f9f0a79SzhanglyGit  ))
2387f9f0a79SzhanglyGit
2393235a9d8SZiyue-Zhang  // number of writeback num
240792b1339SAnzooooo  val numOfWB = numOfUop
2413235a9d8SZiyue-Zhang
2427e4f0b19SZiyue-Zhang  // vector instruction's uop UopSplitType are not SCA_SIM, and when the number of uop is 1, we can regard it as a simple instruction
243*3d4459faSxiaofeibao-xjtu  isComplex := typeOfSplit =/= UopSplitType.SCA_SIM
2447f9f0a79SzhanglyGit  io.out.uopInfo.numOfUop := numOfUop
2453235a9d8SZiyue-Zhang  io.out.uopInfo.numOfWB := numOfWB
2467f9f0a79SzhanglyGit  io.out.uopInfo.lmul := lmul
2477f9f0a79SzhanglyGit
2487f9f0a79SzhanglyGit}
2497f9f0a79SzhanglyGit
2507f9f0a79SzhanglyGitclass UopInfoGenIO(implicit p: Parameters) extends XSBundle {
2517f9f0a79SzhanglyGit  val in = new Bundle {
25287dd4e0dSzhanglyGit    val preInfo = Input(new PreInfo)
2537f9f0a79SzhanglyGit  }
2547f9f0a79SzhanglyGit  val out = new Bundle {
2557f9f0a79SzhanglyGit    val isComplex = Output(Bool())
2567f9f0a79SzhanglyGit    val uopInfo = Output(new UopInfo)
2577f9f0a79SzhanglyGit  }
2587f9f0a79SzhanglyGit}
2597f9f0a79SzhanglyGit
26087dd4e0dSzhanglyGitclass PreInfo(implicit p: Parameters) extends XSBundle {
2617f9f0a79SzhanglyGit  val typeOfSplit = UopSplitType()
2627f9f0a79SzhanglyGit  val vsew = VSew()          //2 bit
2637f9f0a79SzhanglyGit  val vlmul = VLmul()
2647f9f0a79SzhanglyGit  val vwidth = UInt(3.W)     //eew
265c4501a6fSZiyue-Zhang  val nf = UInt(3.W)
2660a34fc22SZiyue Zhang  val vmvn = UInt(3.W)       // vmvnr
26706cb2bc1Sweidingliu  val isVlsr = Bool()        // is vector whole register load/store
268c90e3eacSZiyue Zhang  val isVlsm = Bool()        // is vector mask load/store
2697f9f0a79SzhanglyGit}
2707f9f0a79SzhanglyGit
2717f9f0a79SzhanglyGitclass UopInfo(implicit p: Parameters) extends XSBundle {
2727f9f0a79SzhanglyGit  val numOfUop = UInt(log2Up(MaxUopSize + 1).W)
2733235a9d8SZiyue-Zhang  val numOfWB = UInt(log2Up(MaxUopSize + 1).W)
2747f9f0a79SzhanglyGit  val lmul = UInt(4.W)
2757f9f0a79SzhanglyGit}