xref: /XiangShan/src/main/scala/xiangshan/backend/rename/RenameTable.scala (revision 7fa2c198f1e99afdc20903de4fd3323056e5642f)
1c6d43980SLemover/***************************************************************************************
2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory
4c6d43980SLemover*
5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
8c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
9c6d43980SLemover*
10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13c6d43980SLemover*
14c6d43980SLemover* See the Mulan PSL v2 for more details.
15c6d43980SLemover***************************************************************************************/
16c6d43980SLemover
17b034d3b9SLinJiaweipackage xiangshan.backend.rename
18b034d3b9SLinJiawei
192225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters
20b034d3b9SLinJiaweiimport chisel3._
21b034d3b9SLinJiaweiimport chisel3.util._
22*7fa2c198SYinan Xuimport utils.{ParallelPriorityMux, XSError}
23b034d3b9SLinJiaweiimport xiangshan._
24b034d3b9SLinJiawei
252225d46eSJiawei Linclass RatReadPort(implicit p: Parameters) extends XSBundle {
26*7fa2c198SYinan Xu  val hold = Input(Bool())
27b034d3b9SLinJiawei  val addr = Input(UInt(5.W))
28*7fa2c198SYinan Xu  val data = Output(UInt(PhyRegIdxWidth.W))
29b034d3b9SLinJiawei}
30b034d3b9SLinJiawei
312225d46eSJiawei Linclass RatWritePort(implicit p: Parameters) extends XSBundle {
32*7fa2c198SYinan Xu  val wen = Bool()
33*7fa2c198SYinan Xu  val addr = UInt(5.W)
34*7fa2c198SYinan Xu  val data = UInt(PhyRegIdxWidth.W)
35b034d3b9SLinJiawei}
36b034d3b9SLinJiawei
372225d46eSJiawei Linclass RenameTable(float: Boolean)(implicit p: Parameters) extends XSModule {
38b034d3b9SLinJiawei  val io = IO(new Bundle() {
392d7c7105SYinan Xu    val flush = Input(Bool())
40b034d3b9SLinJiawei    val readPorts = Vec({if(float) 4 else 3} * RenameWidth, new RatReadPort)
41*7fa2c198SYinan Xu    val specWritePorts = Vec(CommitWidth, Input(new RatWritePort))
42*7fa2c198SYinan Xu    val archWritePorts = Vec(CommitWidth, Input(new RatWritePort))
432225d46eSJiawei Lin    val debug_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
44b034d3b9SLinJiawei  })
45b034d3b9SLinJiawei
46b034d3b9SLinJiawei  // speculative rename table
47191cb795SLinJiawei  val spec_table = RegInit(VecInit(Seq.tabulate(32)(i => i.U(PhyRegIdxWidth.W))))
48*7fa2c198SYinan Xu  val spec_table_next = WireInit(spec_table)
49b034d3b9SLinJiawei  // arch state rename table
50191cb795SLinJiawei  val arch_table = RegInit(VecInit(Seq.tabulate(32)(i => i.U(PhyRegIdxWidth.W))))
51b034d3b9SLinJiawei
52*7fa2c198SYinan Xu  // For better timing, we optimize reading and writing to RenameTable as follows:
53*7fa2c198SYinan Xu  // (1) Writing at T0 will be actually processed at T1.
54*7fa2c198SYinan Xu  // (2) Reading is synchronous now.
55*7fa2c198SYinan Xu  // (3) RAddr at T0 will be used to access the table and get data at T0.
56*7fa2c198SYinan Xu  // (4) WData at T0 is bypassed to RData at T1.
57*7fa2c198SYinan Xu  val t1_rdata = io.readPorts.map(p => RegNext(Mux(p.hold, p.data, spec_table_next(p.addr))))
58*7fa2c198SYinan Xu  val t1_raddr = io.readPorts.map(p => RegEnable(p.addr, !p.hold))
59*7fa2c198SYinan Xu  val t1_wSpec = RegNext(io.specWritePorts)
60b034d3b9SLinJiawei
61*7fa2c198SYinan Xu  // WRITE: when instruction commits or walking
62*7fa2c198SYinan Xu  val t1_flush = RegNext(io.flush)
63*7fa2c198SYinan Xu  val t1_wSpec_addr = t1_wSpec.map(w => Mux(w.wen, UIntToOH(w.addr), 0.U))
64*7fa2c198SYinan Xu  for ((next, i) <- spec_table_next.zipWithIndex) {
65*7fa2c198SYinan Xu    val matchVec = t1_wSpec_addr.map(w => w(i))
66*7fa2c198SYinan Xu    val wMatch = ParallelPriorityMux(matchVec.reverse, t1_wSpec.map(_.data).reverse)
67*7fa2c198SYinan Xu    // When there's a flush, we use arch_table to update spec_table.
68*7fa2c198SYinan Xu    next := Mux(t1_flush, arch_table(i), Mux(VecInit(matchVec).asUInt.orR, wMatch, spec_table(i)))
69*7fa2c198SYinan Xu  }
70*7fa2c198SYinan Xu  spec_table := spec_table_next
71*7fa2c198SYinan Xu
72*7fa2c198SYinan Xu  // READ: decode-rename stage
73b034d3b9SLinJiawei  for ((r, i) <- io.readPorts.zipWithIndex) {
74*7fa2c198SYinan Xu    // We use two comparisons here because r.hold has bad timing but addrs have better timing.
75*7fa2c198SYinan Xu    val t0_bypass = io.specWritePorts.map(w => w.wen && Mux(r.hold, w.addr === t1_raddr(i), w.addr === r.addr))
76*7fa2c198SYinan Xu    val t1_bypass = RegNext(VecInit(t0_bypass))
77*7fa2c198SYinan Xu    val bypass_data = ParallelPriorityMux(t1_bypass.reverse, t1_wSpec.map(_.data).reverse)
78*7fa2c198SYinan Xu    r.data := Mux(t1_bypass.asUInt.orR, bypass_data, t1_rdata(i))
79b034d3b9SLinJiawei  }
80b034d3b9SLinJiawei
81b034d3b9SLinJiawei  for (w <- io.archWritePorts) {
82*7fa2c198SYinan Xu    when (w.wen) {
83*7fa2c198SYinan Xu      arch_table(w.addr) := w.data
84ce4949a0SYinan Xu    }
85b034d3b9SLinJiawei  }
86b034d3b9SLinJiawei
872225d46eSJiawei Lin  io.debug_rdata := arch_table
8844dead2fSZhangZifei}
89*7fa2c198SYinan Xu
90*7fa2c198SYinan Xuclass RenameTableWrapper(implicit p: Parameters) extends XSModule {
91*7fa2c198SYinan Xu  val io = IO(new Bundle() {
92*7fa2c198SYinan Xu    val flush = Input(Bool())
93*7fa2c198SYinan Xu    val robCommits = Flipped(new RobCommitIO)
94*7fa2c198SYinan Xu    val intReadPorts = Vec(RenameWidth, Vec(3, new RatReadPort))
95*7fa2c198SYinan Xu    val intRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
96*7fa2c198SYinan Xu    val fpReadPorts = Vec(RenameWidth, Vec(4, new RatReadPort))
97*7fa2c198SYinan Xu    val fpRenamePorts = Vec(RenameWidth, Input(new RatWritePort))
98*7fa2c198SYinan Xu    // for debug printing
99*7fa2c198SYinan Xu    val debug_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
100*7fa2c198SYinan Xu    val debug_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W)))
101*7fa2c198SYinan Xu  })
102*7fa2c198SYinan Xu
103*7fa2c198SYinan Xu  val intRat = Module(new RenameTable(float = false))
104*7fa2c198SYinan Xu  val fpRat = Module(new RenameTable(float = true))
105*7fa2c198SYinan Xu
106*7fa2c198SYinan Xu  intRat.io.flush := io.flush
107*7fa2c198SYinan Xu  intRat.io.debug_rdata <> io.debug_int_rat
108*7fa2c198SYinan Xu  intRat.io.readPorts <> io.intReadPorts.flatten
109*7fa2c198SYinan Xu  val intDestValid = io.robCommits.info.map(info => info.rfWen && info.ldest =/= 0.U)
110*7fa2c198SYinan Xu  for ((arch, i) <- intRat.io.archWritePorts.zipWithIndex) {
111*7fa2c198SYinan Xu    arch.wen  := !io.robCommits.isWalk && io.robCommits.valid(i) && intDestValid(i)
112*7fa2c198SYinan Xu    arch.addr := io.robCommits.info(i).ldest
113*7fa2c198SYinan Xu    arch.data := io.robCommits.info(i).pdest
114*7fa2c198SYinan Xu  }
115*7fa2c198SYinan Xu  for ((spec, i) <- intRat.io.specWritePorts.zipWithIndex) {
116*7fa2c198SYinan Xu    spec.wen  := io.robCommits.isWalk && io.robCommits.valid(i) && intDestValid(i)
117*7fa2c198SYinan Xu    spec.addr := io.robCommits.info(i).ldest
118*7fa2c198SYinan Xu    spec.data := io.robCommits.info(i).old_pdest
119*7fa2c198SYinan Xu  }
120*7fa2c198SYinan Xu  for ((spec, rename) <- intRat.io.specWritePorts.zip(io.intRenamePorts)) {
121*7fa2c198SYinan Xu    when (rename.wen) {
122*7fa2c198SYinan Xu      spec.wen  := true.B
123*7fa2c198SYinan Xu      spec.addr := rename.addr
124*7fa2c198SYinan Xu      spec.data := rename.data
125*7fa2c198SYinan Xu    }
126*7fa2c198SYinan Xu  }
127*7fa2c198SYinan Xu
128*7fa2c198SYinan Xu  fpRat.io.flush := io.flush
129*7fa2c198SYinan Xu  // debug read ports for difftest
130*7fa2c198SYinan Xu  fpRat.io.debug_rdata <> io.debug_fp_rat
131*7fa2c198SYinan Xu  fpRat.io.readPorts <> io.fpReadPorts.flatten
132*7fa2c198SYinan Xu  for ((arch, i) <- fpRat.io.archWritePorts.zipWithIndex) {
133*7fa2c198SYinan Xu    arch.wen  := !io.robCommits.isWalk && io.robCommits.valid(i) && io.robCommits.info(i).fpWen
134*7fa2c198SYinan Xu    arch.addr := io.robCommits.info(i).ldest
135*7fa2c198SYinan Xu    arch.data := io.robCommits.info(i).pdest
136*7fa2c198SYinan Xu  }
137*7fa2c198SYinan Xu  for ((spec, i) <- fpRat.io.specWritePorts.zipWithIndex) {
138*7fa2c198SYinan Xu    spec.wen  := io.robCommits.isWalk && io.robCommits.valid(i) && io.robCommits.info(i).fpWen
139*7fa2c198SYinan Xu    spec.addr := io.robCommits.info(i).ldest
140*7fa2c198SYinan Xu    spec.data := io.robCommits.info(i).old_pdest
141*7fa2c198SYinan Xu  }
142*7fa2c198SYinan Xu  for ((spec, rename) <- fpRat.io.specWritePorts.zip(io.fpRenamePorts)) {
143*7fa2c198SYinan Xu    when (rename.wen) {
144*7fa2c198SYinan Xu      spec.wen  := true.B
145*7fa2c198SYinan Xu      spec.addr := rename.addr
146*7fa2c198SYinan Xu      spec.data := rename.data
147*7fa2c198SYinan Xu    }
148*7fa2c198SYinan Xu  }
149*7fa2c198SYinan Xu
150*7fa2c198SYinan Xu}
151