1c6d43980SLemover/*************************************************************************************** 2c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3f320e0f0SYinan Xu* Copyright (c) 2020-2021 Peng Cheng Laboratory 4c6d43980SLemover* 5c6d43980SLemover* XiangShan is licensed under Mulan PSL v2. 6c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 7c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at: 8c6d43980SLemover* http://license.coscl.org.cn/MulanPSL2 9c6d43980SLemover* 10c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13c6d43980SLemover* 14c6d43980SLemover* See the Mulan PSL v2 for more details. 15c6d43980SLemover***************************************************************************************/ 16c6d43980SLemover 17b034d3b9SLinJiaweipackage xiangshan.backend.rename 18b034d3b9SLinJiawei 192225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters 20b034d3b9SLinJiaweiimport chisel3._ 21b034d3b9SLinJiaweiimport chisel3.util._ 22*7fa2c198SYinan Xuimport utils.{ParallelPriorityMux, XSError} 23b034d3b9SLinJiaweiimport xiangshan._ 24b034d3b9SLinJiawei 252225d46eSJiawei Linclass RatReadPort(implicit p: Parameters) extends XSBundle { 26*7fa2c198SYinan Xu val hold = Input(Bool()) 27b034d3b9SLinJiawei val addr = Input(UInt(5.W)) 28*7fa2c198SYinan Xu val data = Output(UInt(PhyRegIdxWidth.W)) 29b034d3b9SLinJiawei} 30b034d3b9SLinJiawei 312225d46eSJiawei Linclass RatWritePort(implicit p: Parameters) extends XSBundle { 32*7fa2c198SYinan Xu val wen = Bool() 33*7fa2c198SYinan Xu val addr = UInt(5.W) 34*7fa2c198SYinan Xu val data = UInt(PhyRegIdxWidth.W) 35b034d3b9SLinJiawei} 36b034d3b9SLinJiawei 372225d46eSJiawei Linclass RenameTable(float: Boolean)(implicit p: Parameters) extends XSModule { 38b034d3b9SLinJiawei val io = IO(new Bundle() { 392d7c7105SYinan Xu val flush = Input(Bool()) 40b034d3b9SLinJiawei val readPorts = Vec({if(float) 4 else 3} * RenameWidth, new RatReadPort) 41*7fa2c198SYinan Xu val specWritePorts = Vec(CommitWidth, Input(new RatWritePort)) 42*7fa2c198SYinan Xu val archWritePorts = Vec(CommitWidth, Input(new RatWritePort)) 432225d46eSJiawei Lin val debug_rdata = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 44b034d3b9SLinJiawei }) 45b034d3b9SLinJiawei 46b034d3b9SLinJiawei // speculative rename table 47191cb795SLinJiawei val spec_table = RegInit(VecInit(Seq.tabulate(32)(i => i.U(PhyRegIdxWidth.W)))) 48*7fa2c198SYinan Xu val spec_table_next = WireInit(spec_table) 49b034d3b9SLinJiawei // arch state rename table 50191cb795SLinJiawei val arch_table = RegInit(VecInit(Seq.tabulate(32)(i => i.U(PhyRegIdxWidth.W)))) 51b034d3b9SLinJiawei 52*7fa2c198SYinan Xu // For better timing, we optimize reading and writing to RenameTable as follows: 53*7fa2c198SYinan Xu // (1) Writing at T0 will be actually processed at T1. 54*7fa2c198SYinan Xu // (2) Reading is synchronous now. 55*7fa2c198SYinan Xu // (3) RAddr at T0 will be used to access the table and get data at T0. 56*7fa2c198SYinan Xu // (4) WData at T0 is bypassed to RData at T1. 57*7fa2c198SYinan Xu val t1_rdata = io.readPorts.map(p => RegNext(Mux(p.hold, p.data, spec_table_next(p.addr)))) 58*7fa2c198SYinan Xu val t1_raddr = io.readPorts.map(p => RegEnable(p.addr, !p.hold)) 59*7fa2c198SYinan Xu val t1_wSpec = RegNext(io.specWritePorts) 60b034d3b9SLinJiawei 61*7fa2c198SYinan Xu // WRITE: when instruction commits or walking 62*7fa2c198SYinan Xu val t1_flush = RegNext(io.flush) 63*7fa2c198SYinan Xu val t1_wSpec_addr = t1_wSpec.map(w => Mux(w.wen, UIntToOH(w.addr), 0.U)) 64*7fa2c198SYinan Xu for ((next, i) <- spec_table_next.zipWithIndex) { 65*7fa2c198SYinan Xu val matchVec = t1_wSpec_addr.map(w => w(i)) 66*7fa2c198SYinan Xu val wMatch = ParallelPriorityMux(matchVec.reverse, t1_wSpec.map(_.data).reverse) 67*7fa2c198SYinan Xu // When there's a flush, we use arch_table to update spec_table. 68*7fa2c198SYinan Xu next := Mux(t1_flush, arch_table(i), Mux(VecInit(matchVec).asUInt.orR, wMatch, spec_table(i))) 69*7fa2c198SYinan Xu } 70*7fa2c198SYinan Xu spec_table := spec_table_next 71*7fa2c198SYinan Xu 72*7fa2c198SYinan Xu // READ: decode-rename stage 73b034d3b9SLinJiawei for ((r, i) <- io.readPorts.zipWithIndex) { 74*7fa2c198SYinan Xu // We use two comparisons here because r.hold has bad timing but addrs have better timing. 75*7fa2c198SYinan Xu val t0_bypass = io.specWritePorts.map(w => w.wen && Mux(r.hold, w.addr === t1_raddr(i), w.addr === r.addr)) 76*7fa2c198SYinan Xu val t1_bypass = RegNext(VecInit(t0_bypass)) 77*7fa2c198SYinan Xu val bypass_data = ParallelPriorityMux(t1_bypass.reverse, t1_wSpec.map(_.data).reverse) 78*7fa2c198SYinan Xu r.data := Mux(t1_bypass.asUInt.orR, bypass_data, t1_rdata(i)) 79b034d3b9SLinJiawei } 80b034d3b9SLinJiawei 81b034d3b9SLinJiawei for (w <- io.archWritePorts) { 82*7fa2c198SYinan Xu when (w.wen) { 83*7fa2c198SYinan Xu arch_table(w.addr) := w.data 84ce4949a0SYinan Xu } 85b034d3b9SLinJiawei } 86b034d3b9SLinJiawei 872225d46eSJiawei Lin io.debug_rdata := arch_table 8844dead2fSZhangZifei} 89*7fa2c198SYinan Xu 90*7fa2c198SYinan Xuclass RenameTableWrapper(implicit p: Parameters) extends XSModule { 91*7fa2c198SYinan Xu val io = IO(new Bundle() { 92*7fa2c198SYinan Xu val flush = Input(Bool()) 93*7fa2c198SYinan Xu val robCommits = Flipped(new RobCommitIO) 94*7fa2c198SYinan Xu val intReadPorts = Vec(RenameWidth, Vec(3, new RatReadPort)) 95*7fa2c198SYinan Xu val intRenamePorts = Vec(RenameWidth, Input(new RatWritePort)) 96*7fa2c198SYinan Xu val fpReadPorts = Vec(RenameWidth, Vec(4, new RatReadPort)) 97*7fa2c198SYinan Xu val fpRenamePorts = Vec(RenameWidth, Input(new RatWritePort)) 98*7fa2c198SYinan Xu // for debug printing 99*7fa2c198SYinan Xu val debug_int_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 100*7fa2c198SYinan Xu val debug_fp_rat = Vec(32, Output(UInt(PhyRegIdxWidth.W))) 101*7fa2c198SYinan Xu }) 102*7fa2c198SYinan Xu 103*7fa2c198SYinan Xu val intRat = Module(new RenameTable(float = false)) 104*7fa2c198SYinan Xu val fpRat = Module(new RenameTable(float = true)) 105*7fa2c198SYinan Xu 106*7fa2c198SYinan Xu intRat.io.flush := io.flush 107*7fa2c198SYinan Xu intRat.io.debug_rdata <> io.debug_int_rat 108*7fa2c198SYinan Xu intRat.io.readPorts <> io.intReadPorts.flatten 109*7fa2c198SYinan Xu val intDestValid = io.robCommits.info.map(info => info.rfWen && info.ldest =/= 0.U) 110*7fa2c198SYinan Xu for ((arch, i) <- intRat.io.archWritePorts.zipWithIndex) { 111*7fa2c198SYinan Xu arch.wen := !io.robCommits.isWalk && io.robCommits.valid(i) && intDestValid(i) 112*7fa2c198SYinan Xu arch.addr := io.robCommits.info(i).ldest 113*7fa2c198SYinan Xu arch.data := io.robCommits.info(i).pdest 114*7fa2c198SYinan Xu } 115*7fa2c198SYinan Xu for ((spec, i) <- intRat.io.specWritePorts.zipWithIndex) { 116*7fa2c198SYinan Xu spec.wen := io.robCommits.isWalk && io.robCommits.valid(i) && intDestValid(i) 117*7fa2c198SYinan Xu spec.addr := io.robCommits.info(i).ldest 118*7fa2c198SYinan Xu spec.data := io.robCommits.info(i).old_pdest 119*7fa2c198SYinan Xu } 120*7fa2c198SYinan Xu for ((spec, rename) <- intRat.io.specWritePorts.zip(io.intRenamePorts)) { 121*7fa2c198SYinan Xu when (rename.wen) { 122*7fa2c198SYinan Xu spec.wen := true.B 123*7fa2c198SYinan Xu spec.addr := rename.addr 124*7fa2c198SYinan Xu spec.data := rename.data 125*7fa2c198SYinan Xu } 126*7fa2c198SYinan Xu } 127*7fa2c198SYinan Xu 128*7fa2c198SYinan Xu fpRat.io.flush := io.flush 129*7fa2c198SYinan Xu // debug read ports for difftest 130*7fa2c198SYinan Xu fpRat.io.debug_rdata <> io.debug_fp_rat 131*7fa2c198SYinan Xu fpRat.io.readPorts <> io.fpReadPorts.flatten 132*7fa2c198SYinan Xu for ((arch, i) <- fpRat.io.archWritePorts.zipWithIndex) { 133*7fa2c198SYinan Xu arch.wen := !io.robCommits.isWalk && io.robCommits.valid(i) && io.robCommits.info(i).fpWen 134*7fa2c198SYinan Xu arch.addr := io.robCommits.info(i).ldest 135*7fa2c198SYinan Xu arch.data := io.robCommits.info(i).pdest 136*7fa2c198SYinan Xu } 137*7fa2c198SYinan Xu for ((spec, i) <- fpRat.io.specWritePorts.zipWithIndex) { 138*7fa2c198SYinan Xu spec.wen := io.robCommits.isWalk && io.robCommits.valid(i) && io.robCommits.info(i).fpWen 139*7fa2c198SYinan Xu spec.addr := io.robCommits.info(i).ldest 140*7fa2c198SYinan Xu spec.data := io.robCommits.info(i).old_pdest 141*7fa2c198SYinan Xu } 142*7fa2c198SYinan Xu for ((spec, rename) <- fpRat.io.specWritePorts.zip(io.fpRenamePorts)) { 143*7fa2c198SYinan Xu when (rename.wen) { 144*7fa2c198SYinan Xu spec.wen := true.B 145*7fa2c198SYinan Xu spec.addr := rename.addr 146*7fa2c198SYinan Xu spec.data := rename.data 147*7fa2c198SYinan Xu } 148*7fa2c198SYinan Xu } 149*7fa2c198SYinan Xu 150*7fa2c198SYinan Xu} 151