xref: /XiangShan/src/main/scala/xiangshan/backend/rename/RenameTable.scala (revision a8db15d829fbeffc63c1e3101725a2131cedc087)
1c6d43980SLemover/***************************************************************************************
2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
4c6d43980SLemover*
5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
8c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
9c6d43980SLemover*
10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13c6d43980SLemover*
14c6d43980SLemover* See the Mulan PSL v2 for more details.
15c6d43980SLemover***************************************************************************************/
16c6d43980SLemover
17b034d3b9SLinJiaweipackage xiangshan.backend.rename
18b034d3b9SLinJiawei
192225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters
20b034d3b9SLinJiaweiimport chisel3._
21b034d3b9SLinJiaweiimport chisel3.util._
223c02ee8fSwakafaimport utility.ParallelPriorityMux
233c02ee8fSwakafaimport utils.XSError
24b034d3b9SLinJiaweiimport xiangshan._
25b034d3b9SLinJiawei
26a7a8a6ccSHaojin Tangabstract class RegType
27a7a8a6ccSHaojin Tangcase object Reg_I extends RegType
28a7a8a6ccSHaojin Tangcase object Reg_F extends RegType
29a7a8a6ccSHaojin Tangcase object Reg_V extends RegType
30a7a8a6ccSHaojin Tang
312225d46eSJiawei Linclass RatReadPort(implicit p: Parameters) extends XSBundle {
327fa2c198SYinan Xu  val hold = Input(Bool())
33a7a8a6ccSHaojin Tang  val addr = Input(UInt(6.W))
347fa2c198SYinan Xu  val data = Output(UInt(PhyRegIdxWidth.W))
35b034d3b9SLinJiawei}
36b034d3b9SLinJiawei
372225d46eSJiawei Linclass RatWritePort(implicit p: Parameters) extends XSBundle {
387fa2c198SYinan Xu  val wen = Bool()
39a7a8a6ccSHaojin Tang  val addr = UInt(6.W)
407fa2c198SYinan Xu  val data = UInt(PhyRegIdxWidth.W)
41b034d3b9SLinJiawei}
42b034d3b9SLinJiawei
43a7a8a6ccSHaojin Tangclass RenameTable(reg_t: RegType)(implicit p: Parameters) extends XSModule {
44a7a8a6ccSHaojin Tang  val readPortsNum = reg_t match {
45a7a8a6ccSHaojin Tang    case Reg_I => 3
46a7a8a6ccSHaojin Tang    case Reg_F => 4
47a7a8a6ccSHaojin Tang    case Reg_V => 5
48a7a8a6ccSHaojin Tang  }
4966b2c4a4SYinan Xu  val io = IO(new Bundle {
50ccfddc82SHaojin Tang    val redirect = Input(Bool())
51a7a8a6ccSHaojin Tang    val readPorts = Vec(readPortsNum * RenameWidth, new RatReadPort)
527fa2c198SYinan Xu    val specWritePorts = Vec(CommitWidth, Input(new RatWritePort))
537fa2c198SYinan Xu    val archWritePorts = Vec(CommitWidth, Input(new RatWritePort))
54*a8db15d8Sfdy    val diffWritePorts = Vec(CommitWidth * MaxUopSize, Input(new RatWritePort))
552225d46eSJiawei Lin    val debug_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
56a7a8a6ccSHaojin Tang    val debug_vconfig = reg_t match { // vconfig is implemented as int reg[32]
57*a8db15d8Sfdy      case Reg_V => Some(Output(UInt(PhyRegIdxWidth.W)))
58*a8db15d8Sfdy      case _     => None
59*a8db15d8Sfdy    }
60*a8db15d8Sfdy    val diff_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
61*a8db15d8Sfdy    val diff_vconfig = reg_t match {
62*a8db15d8Sfdy      case Reg_V => Some(Output(UInt(PhyRegIdxWidth.W)))
63a7a8a6ccSHaojin Tang      case _ => None
64a7a8a6ccSHaojin Tang    }
65b034d3b9SLinJiawei  })
66b034d3b9SLinJiawei
67b034d3b9SLinJiawei  // speculative rename table
68a7a8a6ccSHaojin Tang  // fp and vec share the same free list, so the first init value of vecRAT is 32
69a7a8a6ccSHaojin Tang  val rename_table_init = reg_t match {
70d91483a6Sfdy    case Reg_I => VecInit.fill    (IntLogicRegs)(0.U(PhyRegIdxWidth.W))
71d91483a6Sfdy    case Reg_F => VecInit.tabulate(FpLogicRegs)(_.U(PhyRegIdxWidth.W))
72d91483a6Sfdy    case Reg_V => VecInit.tabulate(VecLogicRegs)(x => (x + FpLogicRegs).U(PhyRegIdxWidth.W))
73a7a8a6ccSHaojin Tang  }
7466b2c4a4SYinan Xu  val spec_table = RegInit(rename_table_init)
757fa2c198SYinan Xu  val spec_table_next = WireInit(spec_table)
76b034d3b9SLinJiawei  // arch state rename table
7766b2c4a4SYinan Xu  val arch_table = RegInit(rename_table_init)
78ccfddc82SHaojin Tang  val arch_table_next = WireDefault(arch_table)
79b034d3b9SLinJiawei
80*a8db15d8Sfdy  val difftest_table = RegInit(rename_table_init)
81*a8db15d8Sfdy  val difftest_table_next = WireDefault(difftest_table)
82*a8db15d8Sfdy
837fa2c198SYinan Xu  // For better timing, we optimize reading and writing to RenameTable as follows:
847fa2c198SYinan Xu  // (1) Writing at T0 will be actually processed at T1.
857fa2c198SYinan Xu  // (2) Reading is synchronous now.
867fa2c198SYinan Xu  // (3) RAddr at T0 will be used to access the table and get data at T0.
877fa2c198SYinan Xu  // (4) WData at T0 is bypassed to RData at T1.
88ccfddc82SHaojin Tang  val t1_redirect = RegNext(io.redirect, false.B)
897fa2c198SYinan Xu  val t1_rdata = io.readPorts.map(p => RegNext(Mux(p.hold, p.data, spec_table_next(p.addr))))
907fa2c198SYinan Xu  val t1_raddr = io.readPorts.map(p => RegEnable(p.addr, !p.hold))
91ccfddc82SHaojin Tang  val t1_wSpec = RegNext(Mux(io.redirect, 0.U.asTypeOf(io.specWritePorts), io.specWritePorts))
92b034d3b9SLinJiawei
937fa2c198SYinan Xu  // WRITE: when instruction commits or walking
947fa2c198SYinan Xu  val t1_wSpec_addr = t1_wSpec.map(w => Mux(w.wen, UIntToOH(w.addr), 0.U))
957fa2c198SYinan Xu  for ((next, i) <- spec_table_next.zipWithIndex) {
967fa2c198SYinan Xu    val matchVec = t1_wSpec_addr.map(w => w(i))
977fa2c198SYinan Xu    val wMatch = ParallelPriorityMux(matchVec.reverse, t1_wSpec.map(_.data).reverse)
987fa2c198SYinan Xu    // When there's a flush, we use arch_table to update spec_table.
99ccfddc82SHaojin Tang    next := Mux(t1_redirect, arch_table(i), Mux(VecInit(matchVec).asUInt.orR, wMatch, spec_table(i)))
1007fa2c198SYinan Xu  }
1017fa2c198SYinan Xu  spec_table := spec_table_next
1027fa2c198SYinan Xu
1037fa2c198SYinan Xu  // READ: decode-rename stage
104b034d3b9SLinJiawei  for ((r, i) <- io.readPorts.zipWithIndex) {
1057fa2c198SYinan Xu    // We use two comparisons here because r.hold has bad timing but addrs have better timing.
1067fa2c198SYinan Xu    val t0_bypass = io.specWritePorts.map(w => w.wen && Mux(r.hold, w.addr === t1_raddr(i), w.addr === r.addr))
107ccfddc82SHaojin Tang    val t1_bypass = RegNext(Mux(io.redirect, 0.U.asTypeOf(VecInit(t0_bypass)), VecInit(t0_bypass)))
1087fa2c198SYinan Xu    val bypass_data = ParallelPriorityMux(t1_bypass.reverse, t1_wSpec.map(_.data).reverse)
1097fa2c198SYinan Xu    r.data := Mux(t1_bypass.asUInt.orR, bypass_data, t1_rdata(i))
110b034d3b9SLinJiawei  }
111b034d3b9SLinJiawei
112b034d3b9SLinJiawei  for (w <- io.archWritePorts) {
1137fa2c198SYinan Xu    when (w.wen) {
114ccfddc82SHaojin Tang      arch_table_next(w.addr) := w.data
115ce4949a0SYinan Xu    }
116b034d3b9SLinJiawei  }
117ccfddc82SHaojin Tang  arch_table := arch_table_next
118b034d3b9SLinJiawei
119*a8db15d8Sfdy  for (w <- io.diffWritePorts) {
120*a8db15d8Sfdy    when(w.wen) {
121*a8db15d8Sfdy      difftest_table_next(w.addr) := w.data
122*a8db15d8Sfdy    }
123*a8db15d8Sfdy  }
124*a8db15d8Sfdy  difftest_table := difftest_table_next
125*a8db15d8Sfdy
126a7a8a6ccSHaojin Tang  io.debug_rdata := arch_table.take(32)
127a7a8a6ccSHaojin Tang  io.debug_vconfig match {
128a7a8a6ccSHaojin Tang    case None => Unit
129a7a8a6ccSHaojin Tang    case x    => x.get := arch_table.last
130a7a8a6ccSHaojin Tang  }
131*a8db15d8Sfdy
132*a8db15d8Sfdy  io.diff_rdata := difftest_table.take(32)
133*a8db15d8Sfdy  io.diff_vconfig match {
134*a8db15d8Sfdy    case None => Unit
135*a8db15d8Sfdy    case x => x.get := difftest_table.last
136*a8db15d8Sfdy  }
13744dead2fSZhangZifei}
1387fa2c198SYinan Xu
1397fa2c198SYinan Xuclass RenameTableWrapper(implicit p: Parameters) extends XSModule {
1407fa2c198SYinan Xu  val io = IO(new Bundle() {
141ccfddc82SHaojin Tang    val redirect = Input(Bool())
142ccfddc82SHaojin Tang    val robCommits = Input(new RobCommitIO)
143*a8db15d8Sfdy    val diffCommits = Input(new DiffCommitIO)
1447fa2c198SYinan Xu    val intReadPorts = Vec(RenameWidth, Vec(3, new RatReadPort))
1457fa2c198SYinan Xu    val intRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
1467fa2c198SYinan Xu    val fpReadPorts = Vec(RenameWidth, Vec(4, new RatReadPort))
1477fa2c198SYinan Xu    val fpRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
148a7a8a6ccSHaojin Tang    val vecReadPorts = Vec(RenameWidth, Vec(5, new RatReadPort))
149deb6421eSHaojin Tang    val vecRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
1507fa2c198SYinan Xu    // for debug printing
1517fa2c198SYinan Xu    val debug_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
1527fa2c198SYinan Xu    val debug_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
153deb6421eSHaojin Tang    val debug_vec_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
154a7a8a6ccSHaojin Tang    val debug_vconfig_rat = Output(UInt(PhyRegIdxWidth.W))
155*a8db15d8Sfdy
156*a8db15d8Sfdy    val diff_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
157*a8db15d8Sfdy    val diff_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
158*a8db15d8Sfdy    val diff_vec_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
159*a8db15d8Sfdy    val diff_vconfig_rat = Output(UInt(PhyRegIdxWidth.W))
1607fa2c198SYinan Xu  })
1617fa2c198SYinan Xu
162a7a8a6ccSHaojin Tang  val intRat = Module(new RenameTable(Reg_I))
163a7a8a6ccSHaojin Tang  val fpRat  = Module(new RenameTable(Reg_F))
164a7a8a6ccSHaojin Tang  val vecRat = Module(new RenameTable(Reg_V))
1657fa2c198SYinan Xu
166a7a8a6ccSHaojin Tang  io.debug_int_rat := intRat.io.debug_rdata
167*a8db15d8Sfdy  io.diff_int_rat := intRat.io.diff_rdata
1687fa2c198SYinan Xu  intRat.io.readPorts <> io.intReadPorts.flatten
169ccfddc82SHaojin Tang  intRat.io.redirect := io.redirect
170c3abb8b6SYinan Xu  val intDestValid = io.robCommits.info.map(_.rfWen)
1717fa2c198SYinan Xu  for ((arch, i) <- intRat.io.archWritePorts.zipWithIndex) {
1726474c47fSYinan Xu    arch.wen  := io.robCommits.isCommit && io.robCommits.commitValid(i) && intDestValid(i)
1737fa2c198SYinan Xu    arch.addr := io.robCommits.info(i).ldest
1747fa2c198SYinan Xu    arch.data := io.robCommits.info(i).pdest
175c3abb8b6SYinan Xu    XSError(arch.wen && arch.addr === 0.U && arch.data =/= 0.U, "pdest for $0 should be 0\n")
1767fa2c198SYinan Xu  }
1777fa2c198SYinan Xu  for ((spec, i) <- intRat.io.specWritePorts.zipWithIndex) {
1786474c47fSYinan Xu    spec.wen  := io.robCommits.isWalk && io.robCommits.walkValid(i) && intDestValid(i)
1797fa2c198SYinan Xu    spec.addr := io.robCommits.info(i).ldest
180ccfddc82SHaojin Tang    spec.data := io.robCommits.info(i).pdest
181c3abb8b6SYinan Xu    XSError(spec.wen && spec.addr === 0.U && spec.data =/= 0.U, "pdest for $0 should be 0\n")
1827fa2c198SYinan Xu  }
1837fa2c198SYinan Xu  for ((spec, rename) <- intRat.io.specWritePorts.zip(io.intRenamePorts)) {
1847fa2c198SYinan Xu    when (rename.wen) {
1857fa2c198SYinan Xu      spec.wen  := true.B
1867fa2c198SYinan Xu      spec.addr := rename.addr
1877fa2c198SYinan Xu      spec.data := rename.data
1887fa2c198SYinan Xu    }
1897fa2c198SYinan Xu  }
190*a8db15d8Sfdy  for ((diff, i) <- intRat.io.diffWritePorts.zipWithIndex) {
191*a8db15d8Sfdy    diff.wen := io.diffCommits.isCommit && io.diffCommits.commitValid(i) && io.diffCommits.info(i).rfWen
192*a8db15d8Sfdy    diff.addr := io.diffCommits.info(i).ldest
193*a8db15d8Sfdy    diff.data := io.diffCommits.info(i).pdest
194*a8db15d8Sfdy  }
1957fa2c198SYinan Xu
1967fa2c198SYinan Xu  // debug read ports for difftest
197a7a8a6ccSHaojin Tang  io.debug_fp_rat := fpRat.io.debug_rdata
198*a8db15d8Sfdy  io.diff_fp_rat := fpRat.io.diff_rdata
1997fa2c198SYinan Xu  fpRat.io.readPorts <> io.fpReadPorts.flatten
200deb6421eSHaojin Tang  fpRat.io.redirect := io.redirect
2017fa2c198SYinan Xu  for ((arch, i) <- fpRat.io.archWritePorts.zipWithIndex) {
2026474c47fSYinan Xu    arch.wen  := io.robCommits.isCommit && io.robCommits.commitValid(i) && io.robCommits.info(i).fpWen
2037fa2c198SYinan Xu    arch.addr := io.robCommits.info(i).ldest
2047fa2c198SYinan Xu    arch.data := io.robCommits.info(i).pdest
2057fa2c198SYinan Xu  }
2067fa2c198SYinan Xu  for ((spec, i) <- fpRat.io.specWritePorts.zipWithIndex) {
2076474c47fSYinan Xu    spec.wen  := io.robCommits.isWalk && io.robCommits.walkValid(i) && io.robCommits.info(i).fpWen
2087fa2c198SYinan Xu    spec.addr := io.robCommits.info(i).ldest
209ccfddc82SHaojin Tang    spec.data := io.robCommits.info(i).pdest
2107fa2c198SYinan Xu  }
2117fa2c198SYinan Xu  for ((spec, rename) <- fpRat.io.specWritePorts.zip(io.fpRenamePorts)) {
2127fa2c198SYinan Xu    when (rename.wen) {
2137fa2c198SYinan Xu      spec.wen  := true.B
2147fa2c198SYinan Xu      spec.addr := rename.addr
2157fa2c198SYinan Xu      spec.data := rename.data
2167fa2c198SYinan Xu    }
2177fa2c198SYinan Xu  }
218*a8db15d8Sfdy  for ((diff, i) <- fpRat.io.diffWritePorts.zipWithIndex) {
219*a8db15d8Sfdy    diff.wen := io.diffCommits.isCommit && io.diffCommits.commitValid(i) && io.diffCommits.info(i).fpWen
220*a8db15d8Sfdy    diff.addr := io.diffCommits.info(i).ldest
221*a8db15d8Sfdy    diff.data := io.diffCommits.info(i).pdest
222*a8db15d8Sfdy  }
2237fa2c198SYinan Xu
224deb6421eSHaojin Tang  // debug read ports for difftest
225a7a8a6ccSHaojin Tang  io.debug_vec_rat := vecRat.io.debug_rdata
226*a8db15d8Sfdy  io.debug_vconfig_rat := vecRat.io.debug_vconfig.get
227*a8db15d8Sfdy  io.diff_vec_rat := vecRat.io.diff_rdata
228*a8db15d8Sfdy  io.diff_vconfig_rat := vecRat.io.diff_vconfig.get
229deb6421eSHaojin Tang  vecRat.io.readPorts <> io.vecReadPorts.flatten
230deb6421eSHaojin Tang  vecRat.io.redirect := io.redirect
23140a70bd6SZhangZifei  //TODO: RM the donTouch
23240a70bd6SZhangZifei  dontTouch(vecRat.io)
233deb6421eSHaojin Tang  for ((arch, i) <- vecRat.io.archWritePorts.zipWithIndex) {
234deb6421eSHaojin Tang    arch.wen  := io.robCommits.isCommit && io.robCommits.commitValid(i) && io.robCommits.info(i).vecWen
235deb6421eSHaojin Tang    arch.addr := io.robCommits.info(i).ldest
236deb6421eSHaojin Tang    arch.data := io.robCommits.info(i).pdest
237deb6421eSHaojin Tang  }
238deb6421eSHaojin Tang  for ((spec, i) <- vecRat.io.specWritePorts.zipWithIndex) {
239deb6421eSHaojin Tang    spec.wen  := io.robCommits.isWalk && io.robCommits.walkValid(i) && io.robCommits.info(i).vecWen
240deb6421eSHaojin Tang    spec.addr := io.robCommits.info(i).ldest
241deb6421eSHaojin Tang    spec.data := io.robCommits.info(i).pdest
242deb6421eSHaojin Tang  }
243deb6421eSHaojin Tang  for ((spec, rename) <- vecRat.io.specWritePorts.zip(io.vecRenamePorts)) {
244deb6421eSHaojin Tang    when (rename.wen) {
245deb6421eSHaojin Tang      spec.wen  := true.B
246deb6421eSHaojin Tang      spec.addr := rename.addr
247deb6421eSHaojin Tang      spec.data := rename.data
248deb6421eSHaojin Tang    }
249deb6421eSHaojin Tang  }
250*a8db15d8Sfdy  for ((diff, i) <- vecRat.io.diffWritePorts.zipWithIndex) {
251*a8db15d8Sfdy    diff.wen := io.diffCommits.isCommit && io.diffCommits.commitValid(i) && io.diffCommits.info(i).vecWen
252*a8db15d8Sfdy    diff.addr := io.diffCommits.info(i).ldest
253*a8db15d8Sfdy    diff.data := io.diffCommits.info(i).pdest
254*a8db15d8Sfdy  }
255deb6421eSHaojin Tang
2567fa2c198SYinan Xu}
257