1c6d43980SLemover/*************************************************************************************** 2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory 4c6d43980SLemover* 5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2. 6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at: 8c6d43980SLemover* http://license.coscl.org.cn/MulanPSL2 9c6d43980SLemover* 10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13c6d43980SLemover* 14c6d43980SLemover* See the Mulan PSL v2 for more details. 15c6d43980SLemover***************************************************************************************/ 16c6d43980SLemover 17b034d3b9SLinJiaweipackage xiangshan.backend.rename 18b034d3b9SLinJiawei 192225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters 20b034d3b9SLinJiaweiimport chisel3._ 21b034d3b9SLinJiaweiimport chisel3.util._ 227fa2c198SYinan Xuimport utils.{ParallelPriorityMux, XSError} 23b034d3b9SLinJiaweiimport xiangshan._ 24b034d3b9SLinJiawei 252225d46eSJiawei Linclass RatReadPort(implicit p: Parameters) extends XSBundle { 267fa2c198SYinan Xu val hold = Input(Bool()) 27b034d3b9SLinJiawei val addr = Input(UInt(5.W)) 287fa2c198SYinan Xu val data = Output(UInt(PhyRegIdxWidth.W)) 29b034d3b9SLinJiawei} 30b034d3b9SLinJiawei 312225d46eSJiawei Linclass RatWritePort(implicit p: Parameters) extends XSBundle { 327fa2c198SYinan Xu val wen = Bool() 337fa2c198SYinan Xu val addr = UInt(5.W) 347fa2c198SYinan Xu val data = UInt(PhyRegIdxWidth.W) 35b034d3b9SLinJiawei} 36b034d3b9SLinJiawei 372225d46eSJiawei Linclass RenameTable(float: Boolean)(implicit p: Parameters) extends XSModule { 3866b2c4a4SYinan Xu val io = IO(new Bundle { 39*ccfddc82SHaojin Tang val redirect = Input(Bool()) 40b034d3b9SLinJiawei val readPorts = Vec({if(float) 4 else 3} * RenameWidth, new RatReadPort) 417fa2c198SYinan Xu val specWritePorts = Vec(CommitWidth, Input(new RatWritePort)) 427fa2c198SYinan Xu val archWritePorts = Vec(CommitWidth, Input(new RatWritePort)) 432225d46eSJiawei Lin val debug_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 44b034d3b9SLinJiawei }) 45b034d3b9SLinJiawei 46b034d3b9SLinJiawei // speculative rename table 4766b2c4a4SYinan Xu val rename_table_init = VecInit.tabulate(32)(i => (if (float) i else 0).U(PhyRegIdxWidth.W)) 4866b2c4a4SYinan Xu val spec_table = RegInit(rename_table_init) 497fa2c198SYinan Xu val spec_table_next = WireInit(spec_table) 50b034d3b9SLinJiawei // arch state rename table 5166b2c4a4SYinan Xu val arch_table = RegInit(rename_table_init) 52*ccfddc82SHaojin Tang val arch_table_next = WireDefault(arch_table) 53b034d3b9SLinJiawei 547fa2c198SYinan Xu // For better timing, we optimize reading and writing to RenameTable as follows: 557fa2c198SYinan Xu // (1) Writing at T0 will be actually processed at T1. 567fa2c198SYinan Xu // (2) Reading is synchronous now. 577fa2c198SYinan Xu // (3) RAddr at T0 will be used to access the table and get data at T0. 587fa2c198SYinan Xu // (4) WData at T0 is bypassed to RData at T1. 59*ccfddc82SHaojin Tang val t1_redirect = RegNext(io.redirect, false.B) 607fa2c198SYinan Xu val t1_rdata = io.readPorts.map(p => RegNext(Mux(p.hold, p.data, spec_table_next(p.addr)))) 617fa2c198SYinan Xu val t1_raddr = io.readPorts.map(p => RegEnable(p.addr, !p.hold)) 62*ccfddc82SHaojin Tang val t1_wSpec = RegNext(Mux(io.redirect, 0.U.asTypeOf(io.specWritePorts), io.specWritePorts)) 63b034d3b9SLinJiawei 647fa2c198SYinan Xu // WRITE: when instruction commits or walking 657fa2c198SYinan Xu val t1_wSpec_addr = t1_wSpec.map(w => Mux(w.wen, UIntToOH(w.addr), 0.U)) 667fa2c198SYinan Xu for ((next, i) <- spec_table_next.zipWithIndex) { 677fa2c198SYinan Xu val matchVec = t1_wSpec_addr.map(w => w(i)) 687fa2c198SYinan Xu val wMatch = ParallelPriorityMux(matchVec.reverse, t1_wSpec.map(_.data).reverse) 697fa2c198SYinan Xu // When there's a flush, we use arch_table to update spec_table. 70*ccfddc82SHaojin Tang next := Mux(t1_redirect, arch_table(i), Mux(VecInit(matchVec).asUInt.orR, wMatch, spec_table(i))) 717fa2c198SYinan Xu } 727fa2c198SYinan Xu spec_table := spec_table_next 737fa2c198SYinan Xu 747fa2c198SYinan Xu // READ: decode-rename stage 75b034d3b9SLinJiawei for ((r, i) <- io.readPorts.zipWithIndex) { 767fa2c198SYinan Xu // We use two comparisons here because r.hold has bad timing but addrs have better timing. 777fa2c198SYinan Xu val t0_bypass = io.specWritePorts.map(w => w.wen && Mux(r.hold, w.addr === t1_raddr(i), w.addr === r.addr)) 78*ccfddc82SHaojin Tang val t1_bypass = RegNext(Mux(io.redirect, 0.U.asTypeOf(VecInit(t0_bypass)), VecInit(t0_bypass))) 797fa2c198SYinan Xu val bypass_data = ParallelPriorityMux(t1_bypass.reverse, t1_wSpec.map(_.data).reverse) 807fa2c198SYinan Xu r.data := Mux(t1_bypass.asUInt.orR, bypass_data, t1_rdata(i)) 81b034d3b9SLinJiawei } 82b034d3b9SLinJiawei 83b034d3b9SLinJiawei for (w <- io.archWritePorts) { 847fa2c198SYinan Xu when (w.wen) { 85*ccfddc82SHaojin Tang arch_table_next(w.addr) := w.data 86ce4949a0SYinan Xu } 87b034d3b9SLinJiawei } 88*ccfddc82SHaojin Tang arch_table := arch_table_next 89b034d3b9SLinJiawei 902225d46eSJiawei Lin io.debug_rdata := arch_table 9144dead2fSZhangZifei} 927fa2c198SYinan Xu 937fa2c198SYinan Xuclass RenameTableWrapper(implicit p: Parameters) extends XSModule { 947fa2c198SYinan Xu val io = IO(new Bundle() { 95*ccfddc82SHaojin Tang val redirect = Input(Bool()) 96*ccfddc82SHaojin Tang val robCommits = Input(new RobCommitIO) 977fa2c198SYinan Xu val intReadPorts = Vec(RenameWidth, Vec(3, new RatReadPort)) 987fa2c198SYinan Xu val intRenamePorts = Vec(RenameWidth, Input(new RatWritePort)) 997fa2c198SYinan Xu val fpReadPorts = Vec(RenameWidth, Vec(4, new RatReadPort)) 1007fa2c198SYinan Xu val fpRenamePorts = Vec(RenameWidth, Input(new RatWritePort)) 1017fa2c198SYinan Xu // for debug printing 1027fa2c198SYinan Xu val debug_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 1037fa2c198SYinan Xu val debug_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 1047fa2c198SYinan Xu }) 1057fa2c198SYinan Xu 1067fa2c198SYinan Xu val intRat = Module(new RenameTable(float = false)) 1077fa2c198SYinan Xu val fpRat = Module(new RenameTable(float = true)) 1087fa2c198SYinan Xu 1097fa2c198SYinan Xu intRat.io.debug_rdata <> io.debug_int_rat 1107fa2c198SYinan Xu intRat.io.readPorts <> io.intReadPorts.flatten 111*ccfddc82SHaojin Tang intRat.io.redirect := io.redirect 112*ccfddc82SHaojin Tang fpRat.io.redirect := io.redirect 113c3abb8b6SYinan Xu val intDestValid = io.robCommits.info.map(_.rfWen) 1147fa2c198SYinan Xu for ((arch, i) <- intRat.io.archWritePorts.zipWithIndex) { 1156474c47fSYinan Xu arch.wen := io.robCommits.isCommit && io.robCommits.commitValid(i) && intDestValid(i) 1167fa2c198SYinan Xu arch.addr := io.robCommits.info(i).ldest 1177fa2c198SYinan Xu arch.data := io.robCommits.info(i).pdest 118c3abb8b6SYinan Xu XSError(arch.wen && arch.addr === 0.U && arch.data =/= 0.U, "pdest for $0 should be 0\n") 1197fa2c198SYinan Xu } 1207fa2c198SYinan Xu for ((spec, i) <- intRat.io.specWritePorts.zipWithIndex) { 1216474c47fSYinan Xu spec.wen := io.robCommits.isWalk && io.robCommits.walkValid(i) && intDestValid(i) 1227fa2c198SYinan Xu spec.addr := io.robCommits.info(i).ldest 123*ccfddc82SHaojin Tang spec.data := io.robCommits.info(i).pdest 124c3abb8b6SYinan Xu XSError(spec.wen && spec.addr === 0.U && spec.data =/= 0.U, "pdest for $0 should be 0\n") 1257fa2c198SYinan Xu } 1267fa2c198SYinan Xu for ((spec, rename) <- intRat.io.specWritePorts.zip(io.intRenamePorts)) { 1277fa2c198SYinan Xu when (rename.wen) { 1287fa2c198SYinan Xu spec.wen := true.B 1297fa2c198SYinan Xu spec.addr := rename.addr 1307fa2c198SYinan Xu spec.data := rename.data 1317fa2c198SYinan Xu } 1327fa2c198SYinan Xu } 1337fa2c198SYinan Xu 1347fa2c198SYinan Xu // debug read ports for difftest 1357fa2c198SYinan Xu fpRat.io.debug_rdata <> io.debug_fp_rat 1367fa2c198SYinan Xu fpRat.io.readPorts <> io.fpReadPorts.flatten 1377fa2c198SYinan Xu for ((arch, i) <- fpRat.io.archWritePorts.zipWithIndex) { 1386474c47fSYinan Xu arch.wen := io.robCommits.isCommit && io.robCommits.commitValid(i) && io.robCommits.info(i).fpWen 1397fa2c198SYinan Xu arch.addr := io.robCommits.info(i).ldest 1407fa2c198SYinan Xu arch.data := io.robCommits.info(i).pdest 1417fa2c198SYinan Xu } 1427fa2c198SYinan Xu for ((spec, i) <- fpRat.io.specWritePorts.zipWithIndex) { 1436474c47fSYinan Xu spec.wen := io.robCommits.isWalk && io.robCommits.walkValid(i) && io.robCommits.info(i).fpWen 1447fa2c198SYinan Xu spec.addr := io.robCommits.info(i).ldest 145*ccfddc82SHaojin Tang spec.data := io.robCommits.info(i).pdest 1467fa2c198SYinan Xu } 1477fa2c198SYinan Xu for ((spec, rename) <- fpRat.io.specWritePorts.zip(io.fpRenamePorts)) { 1487fa2c198SYinan Xu when (rename.wen) { 1497fa2c198SYinan Xu spec.wen := true.B 1507fa2c198SYinan Xu spec.addr := rename.addr 1517fa2c198SYinan Xu spec.data := rename.data 1527fa2c198SYinan Xu } 1537fa2c198SYinan Xu } 1547fa2c198SYinan Xu 1557fa2c198SYinan Xu} 156