1package xiangshan.backend.rob 2 3import org.chipsalliance.cde.config.Parameters 4import chisel3._ 5import chisel3.util._ 6import xiangshan._ 7import utils._ 8import utility._ 9import xiangshan.backend.Bundles.DynInst 10import xiangshan.backend.decode.VectorConstants 11import xiangshan.backend.rename.SnapshotGenerator 12 13class RenameBufferPtr(size: Int) extends CircularQueuePtr[RenameBufferPtr](size) { 14 def this()(implicit p: Parameters) = this(p(XSCoreParamsKey).RabSize) 15} 16 17object RenameBufferPtr { 18 def apply(flag: Boolean = false, v: Int = 0)(implicit p: Parameters): RenameBufferPtr = { 19 val ptr = Wire(new RenameBufferPtr(p(XSCoreParamsKey).RabSize)) 20 ptr.flag := flag.B 21 ptr.value := v.U 22 ptr 23 } 24} 25 26class RenameBufferEntry(implicit p: Parameters) extends RobCommitInfo { 27 val robIdx = new RobPtr 28} 29 30class RenameBuffer(size: Int)(implicit p: Parameters) extends XSModule with HasCircularQueuePtrHelper { 31 val io = IO(new Bundle { 32 val redirect = Input(ValidIO(new Bundle { 33 })) 34 35 val req = Vec(RenameWidth, Flipped(ValidIO(new DynInst))) 36 val fromRob = new Bundle { 37 val walkSize = Input(UInt(log2Up(size).W)) 38 val walkEnd = Input(Bool()) 39 val commitSize = Input(UInt(log2Up(size).W)) 40 } 41 42 val snpt = Input(new SnapshotPort) 43 44 val canEnq = Output(Bool()) 45 val enqPtrVec = Output(Vec(RenameWidth, new RenameBufferPtr)) 46 val vconfigPdest = Output(UInt(PhyRegIdxWidth.W)) 47 val commits = Output(new RobCommitIO) 48 val diffCommits = Output(new DiffCommitIO) 49 50 val status = Output(new Bundle { 51 val walkEnd = Bool() 52 }) 53 }) 54 55 // alias 56 private val snptSelect = io.snpt.snptSelect 57 58 // pointer 59 private val enqPtrVec = RegInit(VecInit.tabulate(RenameWidth)(idx => RenameBufferPtr(flag = false, idx))) 60 private val enqPtr = enqPtrVec.head 61 private val enqPtrOH = RegInit(1.U(size.W)) 62 private val enqPtrOHShift = CircularShift(enqPtrOH) 63 // may shift [0, RenameWidth] steps 64 private val enqPtrOHVec = VecInit.tabulate(RenameWidth + 1)(enqPtrOHShift.left) 65 private val enqPtrVecNext = Wire(enqPtrVec.cloneType) 66 67 private val deqPtrVec = RegInit(VecInit.tabulate(CommitWidth)(idx => RenameBufferPtr(flag = false, idx))) 68 private val deqPtr = deqPtrVec.head 69 private val deqPtrOH = RegInit(1.U(size.W)) 70 private val deqPtrOHShift = CircularShift(deqPtrOH) 71 private val deqPtrOHVec = VecInit.tabulate(CommitWidth + 1)(deqPtrOHShift.left) 72 private val deqPtrVecNext = Wire(deqPtrVec.cloneType) 73 XSError(deqPtr.toOH =/= deqPtrOH, p"wrong one-hot reg between $deqPtr and $deqPtrOH") 74 75 private val walkPtr = Reg(new RenameBufferPtr) 76 private val walkPtrOH = walkPtr.toOH 77 private val walkPtrOHVec = VecInit.tabulate(CommitWidth + 1)(CircularShift(walkPtrOH).left) 78 private val walkPtrNext = Wire(new RenameBufferPtr) 79 80 private val walkPtrSnapshots = SnapshotGenerator(enqPtr, io.snpt.snptEnq, io.snpt.snptDeq, io.redirect.valid, io.snpt.flushVec) 81 82 // We should extra walk these preg pairs which compressed in rob enq entry at last cycle after restored snapshots. 83 // enq firstuop: b010100 --invert--> b101011 --keep only continuous 1s from head--> b000011 84 // enq firstuop: b111101 --invert--> b000010 --keep only continuous 1s from head--> b000000 85 private val enqCompressedLastCycleMask: UInt = VecInit(io.req.indices.map(i => io.req.slice(0, i + 1).map(!_.bits.firstUop).reduce(_ && _))).asUInt 86 private val compressedLastRobEntryMaskSnapshots = SnapshotGenerator(enqCompressedLastCycleMask, io.snpt.snptEnq, io.snpt.snptDeq, io.redirect.valid, io.snpt.flushVec) 87 private val compressedExtraWalkMask = compressedLastRobEntryMaskSnapshots(snptSelect) 88 // b111111 --Cat(x,1)--> b1111111 --Reverse--> b1111111 --PriorityEncoder--> 6.U 89 // b001111 --Cat(x,1)--> b0011111 --Reverse--> b1111100 --PriorityEncoder--> 4.U 90 // b000011 --Cat(x,1)--> b0000111 --Reverse--> b1110000 --PriorityEncoder--> 2.U 91 // b000000 --Cat(x,1)--> b0000001 --Reverse--> b1000000 --PriorityEncoder--> 0.U 92 private val compressedExtraWalkSize = PriorityMux(Reverse(Cat(compressedExtraWalkMask, 1.U(1.W))), (0 to RenameWidth).map(i => (RenameWidth - i).U)) 93 94 val vcfgPtrOH = RegInit(1.U(size.W)) 95 val vcfgPtrOHShift = CircularShift(vcfgPtrOH) 96 // may shift [0, 2) steps 97 val vcfgPtrOHVec = VecInit.tabulate(2)(vcfgPtrOHShift.left) 98 99 val diffPtrOH = RegInit(1.U(size.W)) 100 val diffPtrOHShift = CircularShift(diffPtrOH) 101 // may shift [0, CommitWidth * MaxUopSize] steps 102 val diffPtrOHVec = VecInit(Seq.tabulate(CommitWidth * MaxUopSize + 1)(_ % size).map(step => diffPtrOHShift.left(step))) 103 104 // Regs 105 val renameBuffer = Mem(size, new RenameBufferEntry) 106 val renameBufferEntries = (0 until size) map (i => renameBuffer(i)) 107 108 val s_idle :: s_special_walk :: s_walk :: Nil = Enum(3) 109 val state = RegInit(s_idle) 110 val stateNext = WireInit(state) // otherwise keep state value 111 112 private val robWalkEndReg = RegInit(false.B) 113 private val robWalkEnd = io.fromRob.walkEnd || robWalkEndReg 114 115 when(io.redirect.valid) { 116 robWalkEndReg := false.B 117 }.elsewhen(io.fromRob.walkEnd) { 118 robWalkEndReg := true.B 119 } 120 121 val realNeedAlloc = io.req.map(req => req.valid && req.bits.needWriteRf) 122 val enqCount = PopCount(realNeedAlloc) 123 val commitCount = Mux(io.commits.isCommit && !io.commits.isWalk, PopCount(io.commits.commitValid), 0.U) 124 val walkCount = Mux(io.commits.isWalk && !io.commits.isCommit, PopCount(io.commits.walkValid), 0.U) 125 val specialWalkCount = Mux(io.commits.isCommit && io.commits.isWalk, PopCount(io.commits.walkValid), 0.U) 126 127 // number of pair(ldest, pdest) ready to commit to arch_rat 128 val commitSize = RegInit(0.U(log2Up(size).W)) 129 val walkSize = RegInit(0.U(log2Up(size).W)) 130 val specialWalkSize = RegInit(0.U(log2Up(size).W)) 131 132 val newCommitSize = io.fromRob.commitSize 133 val newWalkSize = io.fromRob.walkSize 134 135 val commitSizeNxt = commitSize + newCommitSize - commitCount 136 val walkSizeNxt = walkSize + newWalkSize - walkCount 137 138 val newSpecialWalkSize = Mux(io.redirect.valid && !io.snpt.useSnpt, commitSizeNxt, 0.U) 139 val specialWalkSizeNext = specialWalkSize + newSpecialWalkSize - specialWalkCount 140 141 commitSize := Mux(io.redirect.valid && !io.snpt.useSnpt, 0.U, commitSizeNxt) 142 specialWalkSize := specialWalkSizeNext 143 walkSize := Mux(io.redirect.valid, Mux(io.snpt.useSnpt, compressedExtraWalkSize, 0.U), walkSizeNxt) 144 145 walkPtrNext := MuxCase(walkPtr, Seq( 146 (state === s_idle && stateNext === s_walk) -> walkPtrSnapshots(snptSelect), 147 (state === s_special_walk && stateNext === s_walk) -> deqPtrVecNext.head, 148 (state === s_walk && io.snpt.useSnpt && io.redirect.valid) -> walkPtrSnapshots(snptSelect), 149 (state === s_walk) -> (walkPtr + walkCount), 150 )) 151 152 walkPtr := walkPtrNext 153 154 val walkCandidates = VecInit(walkPtrOHVec.map(sel => Mux1H(sel, renameBufferEntries))) 155 val commitCandidates = VecInit(deqPtrOHVec.map(sel => Mux1H(sel, renameBufferEntries))) 156 val vcfgCandidates = VecInit(vcfgPtrOHVec.map(sel => Mux1H(sel, renameBufferEntries))) 157 val diffCandidates = VecInit(diffPtrOHVec.map(sel => Mux1H(sel, renameBufferEntries))) 158 159 // update diff pointer 160 val diffPtrOHNext = Mux(state === s_idle, diffPtrOHVec(newCommitSize), diffPtrOH) 161 diffPtrOH := diffPtrOHNext 162 163 // update vcfg pointer 164 vcfgPtrOH := diffPtrOHNext 165 166 // update enq pointer 167 val enqPtrNext = Mux( 168 state === s_walk && stateNext === s_idle, 169 walkPtrNext, 170 enqPtr + enqCount 171 ) 172 val enqPtrOHNext = Mux( 173 state === s_walk && stateNext === s_idle, 174 walkPtrNext.toOH, 175 enqPtrOHVec(enqCount) 176 ) 177 enqPtr := enqPtrNext 178 enqPtrOH := enqPtrOHNext 179 enqPtrVecNext.zipWithIndex.map{ case(ptr, i) => ptr := enqPtrNext + i.U } 180 enqPtrVec := enqPtrVecNext 181 182 val deqPtrSteps = Mux1H(Seq( 183 (state === s_idle) -> commitCount, 184 (state === s_special_walk) -> specialWalkCount, 185 )) 186 187 // update deq pointer 188 val deqPtrNext = deqPtr + deqPtrSteps 189 val deqPtrOHNext = deqPtrOHVec(deqPtrSteps) 190 deqPtr := deqPtrNext 191 deqPtrOH := deqPtrOHNext 192 deqPtrVecNext.zipWithIndex.map{ case(ptr, i) => ptr := deqPtrNext + i.U } 193 deqPtrVec := deqPtrVecNext 194 195 val allocatePtrVec = VecInit((0 until RenameWidth).map(i => enqPtrVec(PopCount(realNeedAlloc.take(i))).value)) 196 allocatePtrVec.zip(io.req).zip(realNeedAlloc).map{ case((allocatePtr, req), realNeedAlloc) => 197 when(realNeedAlloc){ 198 renameBuffer(allocatePtr).ldest := req.bits.ldest 199 renameBuffer(allocatePtr).pdest := req.bits.pdest 200 renameBuffer(allocatePtr).rfWen := req.bits.rfWen 201 renameBuffer(allocatePtr).fpWen := req.bits.fpWen 202 renameBuffer(allocatePtr).vecWen := req.bits.vecWen 203 renameBuffer(allocatePtr).isMove := req.bits.eliminatedMove 204 renameBuffer(allocatePtr).robIdx := req.bits.robIdx 205 } 206 } 207 208 io.commits.isCommit := state === s_idle || state === s_special_walk 209 io.commits.isWalk := state === s_walk || state === s_special_walk 210 211 for(i <- 0 until CommitWidth) { 212 io.commits.commitValid(i) := state === s_idle && i.U < commitSize || state === s_special_walk && i.U < specialWalkSize 213 io.commits.walkValid(i) := state === s_walk && i.U < walkSize || state === s_special_walk && i.U < specialWalkSize 214 // special walk use commitPtr 215 io.commits.info(i) := Mux(state === s_idle || state === s_special_walk, commitCandidates(i), walkCandidates(i)) 216 // Todo: remove this 217 io.commits.robIdx(i) := Mux(state === s_idle || state === s_special_walk, commitCandidates(i).robIdx, walkCandidates(i).robIdx) 218 } 219 220 private val walkEndNext = walkSizeNxt === 0.U 221 private val specialWalkEndNext = specialWalkSizeNext === 0.U 222 223 // change state 224 state := stateNext 225 when(io.redirect.valid) { 226 when(io.snpt.useSnpt) { 227 stateNext := s_walk 228 }.otherwise { 229 stateNext := s_special_walk 230 } 231 }.otherwise { 232 // change stateNext 233 switch(state) { 234 // this transaction is not used actually, just list all states 235 is(s_idle) { 236 stateNext := s_idle 237 } 238 is(s_special_walk) { 239 when(specialWalkEndNext) { 240 stateNext := s_walk 241 } 242 } 243 is(s_walk) { 244 when(robWalkEnd && walkEndNext) { 245 stateNext := s_idle 246 } 247 } 248 } 249 } 250 251 val numValidEntries = distanceBetween(enqPtr, deqPtr) 252 val allowEnqueue = RegNext(numValidEntries + enqCount <= (size - RenameWidth).U, true.B) 253 254 io.canEnq := allowEnqueue && state === s_idle 255 io.enqPtrVec := enqPtrVec 256 257 io.status.walkEnd := walkEndNext 258 259 io.vconfigPdest := Mux(vcfgCandidates(0).ldest === VCONFIG_IDX.U && vcfgCandidates(0).vecWen, vcfgCandidates(0).pdest, vcfgCandidates(1).pdest) 260 261 // for difftest 262 io.diffCommits := 0.U.asTypeOf(new DiffCommitIO) 263 io.diffCommits.isCommit := state === s_idle || state === s_special_walk 264 for(i <- 0 until CommitWidth * MaxUopSize) { 265 io.diffCommits.commitValid(i) := (state === s_idle || state === s_special_walk) && i.U < newCommitSize 266 io.diffCommits.info(i) := diffCandidates(i) 267 } 268 269 XSError(isBefore(enqPtr, deqPtr) && !isFull(enqPtr, deqPtr), "\ndeqPtr is older than enqPtr!\n") 270 271 QueuePerf(RabSize, numValidEntries, numValidEntries === size.U) 272 273 XSPerfAccumulate("s_idle_to_idle", state === s_idle && stateNext === s_idle) 274 XSPerfAccumulate("s_idle_to_swlk", state === s_idle && stateNext === s_special_walk) 275 XSPerfAccumulate("s_idle_to_walk", state === s_idle && stateNext === s_walk) 276 XSPerfAccumulate("s_swlk_to_idle", state === s_special_walk && stateNext === s_idle) 277 XSPerfAccumulate("s_swlk_to_swlk", state === s_special_walk && stateNext === s_special_walk) 278 XSPerfAccumulate("s_swlk_to_walk", state === s_special_walk && stateNext === s_walk) 279 XSPerfAccumulate("s_walk_to_idle", state === s_walk && stateNext === s_idle) 280 XSPerfAccumulate("s_walk_to_swlk", state === s_walk && stateNext === s_special_walk) 281 XSPerfAccumulate("s_walk_to_walk", state === s_walk && stateNext === s_walk) 282 283 XSPerfAccumulate("disallow_enq_cycle", !allowEnqueue) 284 XSPerfAccumulate("disallow_enq_full_cycle", numValidEntries + enqCount > (size - RenameWidth).U) 285 XSPerfAccumulate("disallow_enq_not_idle_cycle", state =/= s_idle) 286} 287