15018a303SLinJiaweipackage xiangshan.backend.fu 25018a303SLinJiawei 35018a303SLinJiaweiimport chisel3._ 45018a303SLinJiaweiimport chisel3.util._ 55018a303SLinJiaweiimport xiangshan._ 65018a303SLinJiaweiimport utils._ 75018a303SLinJiawei 85018a303SLinJiaweiabstract class AbstractDivider(len: Int) extends FunctionUnit( 95018a303SLinJiawei FuConfig(FuType.div, 2, 0, writeIntRf = true, writeFpRf = false, hasRedirect = false, UncertainLatency()), 105018a303SLinJiawei len 115018a303SLinJiawei){ 125018a303SLinJiawei val ctrl = IO(Input(new MulDivCtrl)) 135018a303SLinJiawei val sign = ctrl.sign 145018a303SLinJiawei} 155018a303SLinJiawei 165018a303SLinJiaweiclass Radix2Divider(len: Int) extends AbstractDivider(len) { 175018a303SLinJiawei 185018a303SLinJiawei def abs(a: UInt, sign: Bool): (Bool, UInt) = { 195018a303SLinJiawei val s = a(len - 1) && sign 205018a303SLinJiawei (s, Mux(s, -a, a)) 215018a303SLinJiawei } 225018a303SLinJiawei 235018a303SLinJiawei val s_idle :: s_log2 :: s_shift :: s_compute :: s_finish :: Nil = Enum(5) 245018a303SLinJiawei val state = RegInit(s_idle) 255018a303SLinJiawei val newReq = (state === s_idle) && io.in.fire() 265018a303SLinJiawei 275018a303SLinJiawei val (a, b) = (io.in.bits.src(0), io.in.bits.src(1)) 285018a303SLinJiawei val divBy0 = b === 0.U(len.W) 295018a303SLinJiawei val divBy0Reg = RegEnable(divBy0, newReq) 305018a303SLinJiawei 315018a303SLinJiawei val shiftReg = Reg(UInt((1 + len * 2).W)) 325018a303SLinJiawei val hi = shiftReg(len * 2, len) 335018a303SLinJiawei val lo = shiftReg(len - 1, 0) 345018a303SLinJiawei 355018a303SLinJiawei val uop = io.in.bits.uop 365018a303SLinJiawei 375018a303SLinJiawei val (aSign, aVal) = abs(a, sign) 385018a303SLinJiawei val (bSign, bVal) = abs(b, sign) 395018a303SLinJiawei val aSignReg = RegEnable(aSign, newReq) 405018a303SLinJiawei val qSignReg = RegEnable((aSign ^ bSign) && !divBy0, newReq) 415018a303SLinJiawei val bReg = RegEnable(bVal, newReq) 425018a303SLinJiawei val aValx2Reg = RegEnable(Cat(aVal, "b0".U), newReq) 435018a303SLinJiawei val ctrlReg = RegEnable(ctrl, newReq) 445018a303SLinJiawei val uopReg = RegEnable(uop, newReq) 455018a303SLinJiawei 465018a303SLinJiawei val cnt = Counter(len) 475018a303SLinJiawei when (newReq) { 485018a303SLinJiawei state := s_log2 495018a303SLinJiawei } .elsewhen (state === s_log2) { 505018a303SLinJiawei // `canSkipShift` is calculated as following: 515018a303SLinJiawei // bEffectiveBit = Log2(bVal, XLEN) + 1.U 525018a303SLinJiawei // aLeadingZero = 64.U - aEffectiveBit = 64.U - (Log2(aVal, XLEN) + 1.U) 535018a303SLinJiawei // canSkipShift = aLeadingZero + bEffectiveBit 545018a303SLinJiawei // = 64.U - (Log2(aVal, XLEN) + 1.U) + Log2(bVal, XLEN) + 1.U 555018a303SLinJiawei // = 64.U + Log2(bVal, XLEN) - Log2(aVal, XLEN) 565018a303SLinJiawei // = (64.U | Log2(bVal, XLEN)) - Log2(aVal, XLEN) // since Log2(bVal, XLEN) < 64.U 575018a303SLinJiawei val canSkipShift = (64.U | Log2(bReg)) - Log2(aValx2Reg) 585018a303SLinJiawei // When divide by 0, the quotient should be all 1's. 595018a303SLinJiawei // Therefore we can not shift in 0s here. 605018a303SLinJiawei // We do not skip any shift to avoid this. 615018a303SLinJiawei cnt.value := Mux(divBy0Reg, 0.U, Mux(canSkipShift >= (len-1).U, (len-1).U, canSkipShift)) 625018a303SLinJiawei state := s_shift 635018a303SLinJiawei } .elsewhen (state === s_shift) { 645018a303SLinJiawei shiftReg := aValx2Reg << cnt.value 655018a303SLinJiawei state := s_compute 665018a303SLinJiawei } .elsewhen (state === s_compute) { 675018a303SLinJiawei val enough = hi.asUInt >= bReg.asUInt 685018a303SLinJiawei shiftReg := Cat(Mux(enough, hi - bReg, hi)(len - 1, 0), lo, enough) 695018a303SLinJiawei cnt.inc() 705018a303SLinJiawei when (cnt.value === (len-1).U) { state := s_finish } 715018a303SLinJiawei } .elsewhen (state === s_finish) { 725018a303SLinJiawei when(io.out.ready){ 735018a303SLinJiawei state := s_idle 745018a303SLinJiawei } 755018a303SLinJiawei } 765018a303SLinJiawei 77*ff8496b2SLinJiawei val kill = state=/=s_idle && uopReg.roqIdx.needFlush(io.redirectIn) 78*ff8496b2SLinJiawei when(kill){ 795018a303SLinJiawei state := s_idle 805018a303SLinJiawei } 815018a303SLinJiawei 825018a303SLinJiawei val r = hi(len, 1) 835018a303SLinJiawei val resQ = Mux(qSignReg, -lo, lo) 845018a303SLinJiawei val resR = Mux(aSignReg, -r, r) 855018a303SLinJiawei 865018a303SLinJiawei val xlen = io.out.bits.data.getWidth 875018a303SLinJiawei val res = Mux(ctrlReg.isHi, resR, resQ) 885018a303SLinJiawei io.out.bits.data := Mux(ctrlReg.isW, SignExt(res(31,0),xlen), res) 895018a303SLinJiawei io.out.bits.uop := uopReg 905018a303SLinJiawei 91*ff8496b2SLinJiawei io.out.valid := state === s_finish && !kill 925018a303SLinJiawei io.in.ready := state === s_idle 935018a303SLinJiawei}