15018a303SLinJiaweipackage xiangshan.backend.fu 25018a303SLinJiawei 3*2225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters 45018a303SLinJiaweiimport chisel3._ 55018a303SLinJiaweiimport chisel3.util._ 65018a303SLinJiaweiimport xiangshan._ 75018a303SLinJiaweiimport utils._ 85018a303SLinJiawei 9*2225d46eSJiawei Linabstract class AbstractDivider(len: Int)(implicit p: Parameters) extends FunctionUnit(len){ 105018a303SLinJiawei val ctrl = IO(Input(new MulDivCtrl)) 115018a303SLinJiawei val sign = ctrl.sign 125018a303SLinJiawei} 135018a303SLinJiawei 14*2225d46eSJiawei Linclass Radix2Divider(len: Int)(implicit p: Parameters) extends AbstractDivider(len) { 155018a303SLinJiawei 165018a303SLinJiawei def abs(a: UInt, sign: Bool): (Bool, UInt) = { 175018a303SLinJiawei val s = a(len - 1) && sign 185018a303SLinJiawei (s, Mux(s, -a, a)) 195018a303SLinJiawei } 205018a303SLinJiawei 215018a303SLinJiawei val s_idle :: s_log2 :: s_shift :: s_compute :: s_finish :: Nil = Enum(5) 225018a303SLinJiawei val state = RegInit(s_idle) 235018a303SLinJiawei val newReq = (state === s_idle) && io.in.fire() 245018a303SLinJiawei 255018a303SLinJiawei val (a, b) = (io.in.bits.src(0), io.in.bits.src(1)) 265018a303SLinJiawei val divBy0 = b === 0.U(len.W) 275018a303SLinJiawei val divBy0Reg = RegEnable(divBy0, newReq) 285018a303SLinJiawei 295018a303SLinJiawei val shiftReg = Reg(UInt((1 + len * 2).W)) 305018a303SLinJiawei val hi = shiftReg(len * 2, len) 315018a303SLinJiawei val lo = shiftReg(len - 1, 0) 325018a303SLinJiawei 335018a303SLinJiawei val uop = io.in.bits.uop 345018a303SLinJiawei 355018a303SLinJiawei val (aSign, aVal) = abs(a, sign) 365018a303SLinJiawei val (bSign, bVal) = abs(b, sign) 375018a303SLinJiawei val aSignReg = RegEnable(aSign, newReq) 385018a303SLinJiawei val qSignReg = RegEnable((aSign ^ bSign) && !divBy0, newReq) 395018a303SLinJiawei val bReg = RegEnable(bVal, newReq) 405018a303SLinJiawei val aValx2Reg = RegEnable(Cat(aVal, "b0".U), newReq) 415018a303SLinJiawei val ctrlReg = RegEnable(ctrl, newReq) 425018a303SLinJiawei val uopReg = RegEnable(uop, newReq) 435018a303SLinJiawei 445018a303SLinJiawei val cnt = Counter(len) 457c8efd4aSYinan Xu when (newReq && !io.in.bits.uop.roqIdx.needFlush(io.redirectIn, io.flushIn)) { 465018a303SLinJiawei state := s_log2 475018a303SLinJiawei } .elsewhen (state === s_log2) { 485018a303SLinJiawei // `canSkipShift` is calculated as following: 495018a303SLinJiawei // bEffectiveBit = Log2(bVal, XLEN) + 1.U 505018a303SLinJiawei // aLeadingZero = 64.U - aEffectiveBit = 64.U - (Log2(aVal, XLEN) + 1.U) 515018a303SLinJiawei // canSkipShift = aLeadingZero + bEffectiveBit 525018a303SLinJiawei // = 64.U - (Log2(aVal, XLEN) + 1.U) + Log2(bVal, XLEN) + 1.U 535018a303SLinJiawei // = 64.U + Log2(bVal, XLEN) - Log2(aVal, XLEN) 545018a303SLinJiawei // = (64.U | Log2(bVal, XLEN)) - Log2(aVal, XLEN) // since Log2(bVal, XLEN) < 64.U 555018a303SLinJiawei val canSkipShift = (64.U | Log2(bReg)) - Log2(aValx2Reg) 565018a303SLinJiawei // When divide by 0, the quotient should be all 1's. 575018a303SLinJiawei // Therefore we can not shift in 0s here. 585018a303SLinJiawei // We do not skip any shift to avoid this. 595018a303SLinJiawei cnt.value := Mux(divBy0Reg, 0.U, Mux(canSkipShift >= (len-1).U, (len-1).U, canSkipShift)) 605018a303SLinJiawei state := s_shift 615018a303SLinJiawei } .elsewhen (state === s_shift) { 625018a303SLinJiawei shiftReg := aValx2Reg << cnt.value 635018a303SLinJiawei state := s_compute 645018a303SLinJiawei } .elsewhen (state === s_compute) { 655018a303SLinJiawei val enough = hi.asUInt >= bReg.asUInt 665018a303SLinJiawei shiftReg := Cat(Mux(enough, hi - bReg, hi)(len - 1, 0), lo, enough) 675018a303SLinJiawei cnt.inc() 685018a303SLinJiawei when (cnt.value === (len-1).U) { state := s_finish } 695018a303SLinJiawei } .elsewhen (state === s_finish) { 705018a303SLinJiawei when(io.out.ready){ 715018a303SLinJiawei state := s_idle 725018a303SLinJiawei } 735018a303SLinJiawei } 745018a303SLinJiawei 752d7c7105SYinan Xu val kill = state=/=s_idle && uopReg.roqIdx.needFlush(io.redirectIn, io.flushIn) 76ff8496b2SLinJiawei when(kill){ 775018a303SLinJiawei state := s_idle 785018a303SLinJiawei } 795018a303SLinJiawei 805018a303SLinJiawei val r = hi(len, 1) 815018a303SLinJiawei val resQ = Mux(qSignReg, -lo, lo) 825018a303SLinJiawei val resR = Mux(aSignReg, -r, r) 835018a303SLinJiawei 845018a303SLinJiawei val xlen = io.out.bits.data.getWidth 855018a303SLinJiawei val res = Mux(ctrlReg.isHi, resR, resQ) 865018a303SLinJiawei io.out.bits.data := Mux(ctrlReg.isW, SignExt(res(31,0),xlen), res) 875018a303SLinJiawei io.out.bits.uop := uopReg 885018a303SLinJiawei 89d0d8f03aSYinan Xu io.out.valid := state === s_finish 905018a303SLinJiawei io.in.ready := state === s_idle 915018a303SLinJiawei} 92