xref: /XiangShan/src/main/scala/xiangshan/backend/rename/RenameTable.scala (revision dcf3a679f6184717f135ce501be8114afed527af)
/***************************************************************************************
* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
* Copyright (c) 2020-2021 Peng Cheng Laboratory
*
* XiangShan is licensed under Mulan PSL v2.
* You can use this software according to the terms and conditions of the Mulan PSL v2.
* You may obtain a copy of Mulan PSL v2 at:
*          http://license.coscl.org.cn/MulanPSL2
*
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
*
* See the Mulan PSL v2 for more details.
***************************************************************************************/
16c6d43980SLemover
17b034d3b9SLinJiaweipackage xiangshan.backend.rename
18b034d3b9SLinJiawei
192225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters
20b034d3b9SLinJiaweiimport chisel3._
21b034d3b9SLinJiaweiimport chisel3.util._
223c02ee8fSwakafaimport utility.ParallelPriorityMux
233c02ee8fSwakafaimport utils.XSError
24b034d3b9SLinJiaweiimport xiangshan._
25b034d3b9SLinJiawei
/** One read port of a [[RenameTable]].
  *
  * The table registers its answer, so `data` reflects the address presented in the
  * previous cycle. While `hold` is asserted the table recirculates the previous `data`
  * and keeps the previously captured address instead of sampling `addr`.
  */
class RatReadPort(implicit p: Parameters) extends XSBundle {
  /** Request to keep the previously returned mapping instead of looking up `addr`. */
  val hold = Input(Bool())

  /** Logical register index to look up (5 bits, i.e. 32 logical registers). */
  val addr = Input(UInt(5.W))

  /** Physical register index currently mapped to the requested logical register. */
  val data = Output(UInt(PhyRegIdxWidth.W))
}
31b034d3b9SLinJiawei
/** One write request to a [[RenameTable]].
  *
  * The fields carry no direction of their own; the instantiating site wraps the whole
  * bundle (e.g. `Input(new RatWritePort)`).
  */
class RatWritePort(implicit p: Parameters) extends XSBundle {
  /** Write enable: the request is ignored unless this is asserted. */
  val wen = Bool()

  /** Logical register index whose mapping is updated (5 bits). */
  val addr = UInt(5.W)

  /** New physical register index for `addr`. */
  val data = UInt(PhyRegIdxWidth.W)
}
37b034d3b9SLinJiawei
/** Register alias table mapping the 32 logical registers to physical register indices.
  *
  * Two copies are kept: a speculative table updated through `specWritePorts` and an
  * architectural table updated through `archWritePorts`. One cycle after `redirect`
  * is asserted the speculative table is reloaded from the architectural one.
  *
  * @param float when true the table has four read ports per rename slot and resets to the
  *              identity mapping (entry i holds i); when false it has three read ports per
  *              rename slot and every entry resets to 0.
  */
class RenameTable(float: Boolean)(implicit p: Parameters) extends XSModule {
  val io = IO(new Bundle {
    val redirect = Input(Bool())
    val readPorts = Vec((if (float) 4 else 3) * RenameWidth, new RatReadPort)
    val specWritePorts = Vec(CommitWidth, Input(new RatWritePort))
    val archWritePorts = Vec(CommitWidth, Input(new RatWritePort))
    val old_pdest = Vec(CommitWidth, Output(UInt(PhyRegIdxWidth.W)))
    val need_free = Vec(CommitWidth, Output(Bool()))
    val debug_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
  })

  // Reset contents shared by both tables.
  val rename_table_init = VecInit(Seq.tabulate(32) { lreg =>
    val resetPreg = if (float) lreg else 0
    resetPreg.U(PhyRegIdxWidth.W)
  })

  // Speculative table and the value it takes on the next clock edge.
  val spec_table = RegInit(rename_table_init)
  val spec_table_next = WireDefault(spec_table)

  // Architectural table and the value it takes on the next clock edge.
  val arch_table = RegInit(rename_table_init)
  val arch_table_next = WireDefault(arch_table)

  // Mapping displaced by each architectural write, and whether it may be released.
  val old_pdest = RegInit(VecInit.fill(CommitWidth)(0.U(PhyRegIdxWidth.W)))
  val need_free = RegInit(VecInit.fill(CommitWidth)(false.B))

  // Timing scheme (T0 = cycle in which a request is presented, T1 = the following cycle):
  //   * a speculative write presented at T0 is applied to the table at T1;
  //   * a read address presented at T0 indexes the table at T0 and the result is registered;
  //   * write data presented at T0 is bypassed onto the read data visible at T1.
  val t1_redirect = RegNext(io.redirect, false.B)
  val t1_rdata =
    for (port <- io.readPorts)
      yield RegNext(Mux(port.hold, port.data, spec_table_next(port.addr)))
  val t1_raddr =
    for (port <- io.readPorts)
      yield RegEnable(port.addr, !port.hold)
  // Speculative writes presented together with a redirect are dropped.
  val t1_wSpec = RegNext(Mux(io.redirect, 0.U.asTypeOf(io.specWritePorts), io.specWritePorts))

  // WRITE: apply the registered speculative writes.
  // Each enabled write is turned into a one-hot vector over the logical registers.
  val t1_wSpec_addr = t1_wSpec.map(wr => Mux(wr.wen, UIntToOH(wr.addr), 0.U))
  spec_table_next.zipWithIndex.foreach { case (entryNext, lreg) =>
    val hits = t1_wSpec_addr.map(_(lreg))
    // Ports are reversed so that the highest-indexed matching write wins.
    val newestData = ParallelPriorityMux(hits.reverse, t1_wSpec.map(_.data).reverse)
    val anyHit = VecInit(hits).asUInt.orR
    val written = Mux(anyHit, newestData, spec_table(lreg))
    // A redirect seen in the previous cycle restores the architectural mapping.
    entryNext := Mux(t1_redirect, arch_table(lreg), written)
  }
  spec_table := spec_table_next

  // READ: registered lookup plus bypass from the writes that were in flight at T0.
  io.readPorts.zipWithIndex.foreach { case (rd, idx) =>
    // Both address comparisons are formed before `hold` selects between them, because
    // `hold` has worse timing than the addresses.
    val t0Bypass = VecInit(io.specWritePorts.map { wr =>
      val hitsHeldAddr = wr.addr === t1_raddr(idx)
      val hitsNewAddr = wr.addr === rd.addr
      wr.wen && Mux(rd.hold, hitsHeldAddr, hitsNewAddr)
    })
    val t1Bypass = RegNext(Mux(io.redirect, 0.U.asTypeOf(t0Bypass), t0Bypass))
    val bypassData = ParallelPriorityMux(t1Bypass.reverse, t1_wSpec.map(_.data).reverse)
    val useBypass = t1Bypass.asUInt.orR
    rd.data := Mux(useBypass, bypassData, t1_rdata(idx))
  }

  // Architectural writes. Ports are visited in ascending order, so a higher-indexed port
  // overrides a lower-indexed one that targets the same logical register.
  io.archWritePorts.zipWithIndex.foreach { case (commit, slot) =>
    when (commit.wen) {
      arch_table_next(commit.addr) := commit.data
    }
    // All-ones when this port writes, all-zeros otherwise: old_pdest is forced to 0
    // for a port that is not writing.
    val wenMask = Fill(PhyRegIdxWidth, commit.wen)
    // Lower-indexed ports writing the same logical register in this cycle supply the
    // displaced mapping; the nearest such port is tested first.
    val forwarded = io.archWritePorts.take(slot).reverse.map { older =>
      (older.wen && older.addr === commit.addr) -> (older.data & wenMask)
    }
    old_pdest(slot) := MuxCase(arch_table(commit.addr) & wenMask, forwarded)
  }
  arch_table := arch_table_next

  // need_free is registered from the registered old_pdest, so it lags old_pdest by a cycle.
  // A displaced mapping is flagged only if no architectural entry currently holds it and
  // no lower-indexed slot reports the same value.
  for (slot <- 0 until CommitWidth) {
    val candidate = old_pdest(slot)
    val earlierSame = old_pdest.take(slot).map(_ === candidate)
    val blockedByDup = if (earlierSame.isEmpty) false.B else VecInit(earlierSame).asUInt.orR
    val unmapped = VecInit(arch_table.map(_ =/= candidate)).asUInt.andR
    need_free(slot) := unmapped && !blockedByDup
  }

  io.old_pdest := old_pdest
  io.need_free := need_free
  io.debug_rdata := arch_table
}
1107fa2c198SYinan Xu
/** Bundles one integer and one floating-point [[RenameTable]] and drives their write
  * ports from ROB commit/walk information and from the rename stage.
  */
class RenameTableWrapper(implicit p: Parameters) extends XSModule {
  val io = IO(new Bundle() {
    val redirect = Input(Bool())
    val robCommits = Input(new RobCommitIO)
    val intReadPorts = Vec(RenameWidth, Vec(3, new RatReadPort))
    val intRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
    val fpReadPorts = Vec(RenameWidth, Vec(4, new RatReadPort))
    val fpRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
    val int_old_pdest = Vec(CommitWidth, Output(UInt(PhyRegIdxWidth.W)))
    val fp_old_pdest = Vec(CommitWidth, Output(UInt(PhyRegIdxWidth.W)))
    val int_need_free = Vec(CommitWidth, Output(Bool()))
    // for debug printing
    val debug_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
    val debug_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
  })

  val intRat = Module(new RenameTable(float = false))
  val fpRat = Module(new RenameTable(float = true))

  // Per-commit-slot "writes a destination register of this kind" flags.
  val intDestValid = io.robCommits.info.map(_.rfWen)
  private val fpDestValid = io.robCommits.info.map(_.fpWen)

  /** Wires the inputs of one rename table.
    *
    * @param rat          table instance to drive
    * @param readPorts    flattened read ports exposed by this wrapper for `rat`
    * @param renamePorts  rename-stage write requests for `rat`
    * @param destValid    per-slot flag selecting ROB entries that write this register kind
    * @param checkZeroReg when true, emit an error if logical register 0 is written with
    *                     a non-zero physical index
    */
  private def driveRat(
    rat: RenameTable,
    readPorts: Seq[RatReadPort],
    renamePorts: Seq[RatWritePort],
    destValid: Seq[Bool],
    checkZeroReg: Boolean
  ): Unit = {
    rat.io.redirect := io.redirect
    rat.io.readPorts <> readPorts

    // Architectural updates: committing instructions.
    rat.io.archWritePorts.zipWithIndex.foreach { case (arch, i) =>
      val entry = io.robCommits.info(i)
      arch.wen  := io.robCommits.isCommit && io.robCommits.commitValid(i) && destValid(i)
      arch.addr := entry.ldest
      arch.data := entry.pdest
      if (checkZeroReg) {
        XSError(arch.wen && arch.addr === 0.U && arch.data =/= 0.U, "pdest for $0 should be 0\n")
      }
    }

    // Speculative updates, default source: walking instructions.
    rat.io.specWritePorts.zipWithIndex.foreach { case (spec, i) =>
      val entry = io.robCommits.info(i)
      spec.wen  := io.robCommits.isWalk && io.robCommits.walkValid(i) && destValid(i)
      spec.addr := entry.ldest
      spec.data := entry.pdest
      if (checkZeroReg) {
        XSError(spec.wen && spec.addr === 0.U && spec.data =/= 0.U, "pdest for $0 should be 0\n")
      }
    }

    // Speculative updates, overriding source: an active rename write replaces the walk
    // values on the same-indexed port. This must stay after the loop above, since the
    // later connection wins. `zip` pairs only as many ports as the shorter side has.
    rat.io.specWritePorts.zip(renamePorts).foreach { case (spec, rename) =>
      when (rename.wen) {
        spec.wen  := true.B
        spec.addr := rename.addr
        spec.data := rename.data
      }
    }
  }

  driveRat(intRat, io.intReadPorts.flatten, io.intRenamePorts, intDestValid, checkZeroReg = true)
  driveRat(fpRat, io.fpReadPorts.flatten, io.fpRenamePorts, fpDestValid, checkZeroReg = false)

  // Displaced mappings; only the integer table's need_free is exported.
  io.int_old_pdest := intRat.io.old_pdest
  io.fp_old_pdest := fpRat.io.old_pdest
  io.int_need_free := intRat.io.need_free

  // debug read ports for difftest
  io.debug_int_rat := intRat.io.debug_rdata
  io.debug_fp_rat := fpRat.io.debug_rdata
}
180