1*c6d43980SLemover/*************************************************************************************** 2*c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3*c6d43980SLemover* 4*c6d43980SLemover* XiangShan is licensed under Mulan PSL v2. 5*c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2. 6*c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at: 7*c6d43980SLemover* http://license.coscl.org.cn/MulanPSL2 8*c6d43980SLemover* 9*c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 10*c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 11*c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 12*c6d43980SLemover* 13*c6d43980SLemover* See the Mulan PSL v2 for more details. 14*c6d43980SLemover***************************************************************************************/ 15*c6d43980SLemover 165018a303SLinJiaweipackage xiangshan.backend.fu 175018a303SLinJiawei 182225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters 195018a303SLinJiaweiimport chisel3._ 205018a303SLinJiaweiimport chisel3.util._ 215018a303SLinJiaweiimport xiangshan._ 225018a303SLinJiaweiimport utils._ 235018a303SLinJiawei 242225d46eSJiawei Linabstract class AbstractDivider(len: Int)(implicit p: Parameters) extends FunctionUnit(len){ 255018a303SLinJiawei val ctrl = IO(Input(new MulDivCtrl)) 265018a303SLinJiawei val sign = ctrl.sign 275018a303SLinJiawei} 285018a303SLinJiawei 292225d46eSJiawei Linclass Radix2Divider(len: Int)(implicit p: Parameters) extends AbstractDivider(len) { 305018a303SLinJiawei 315018a303SLinJiawei def abs(a: UInt, sign: Bool): (Bool, UInt) = { 325018a303SLinJiawei val s = a(len - 1) && sign 335018a303SLinJiawei (s, Mux(s, -a, a)) 345018a303SLinJiawei } 355018a303SLinJiawei 365018a303SLinJiawei val s_idle :: s_log2 :: s_shift :: s_compute :: s_finish :: Nil = Enum(5) 375018a303SLinJiawei val state = RegInit(s_idle) 385018a303SLinJiawei val newReq = (state === s_idle) && io.in.fire() 395018a303SLinJiawei 405018a303SLinJiawei val (a, b) = (io.in.bits.src(0), io.in.bits.src(1)) 415018a303SLinJiawei val divBy0 = b === 0.U(len.W) 425018a303SLinJiawei val divBy0Reg = RegEnable(divBy0, newReq) 435018a303SLinJiawei 445018a303SLinJiawei val shiftReg = Reg(UInt((1 + len * 2).W)) 455018a303SLinJiawei val hi = shiftReg(len * 2, len) 465018a303SLinJiawei val lo = shiftReg(len - 1, 0) 475018a303SLinJiawei 485018a303SLinJiawei val uop = io.in.bits.uop 495018a303SLinJiawei 505018a303SLinJiawei val (aSign, aVal) = abs(a, sign) 515018a303SLinJiawei val (bSign, bVal) = abs(b, sign) 525018a303SLinJiawei val aSignReg = RegEnable(aSign, newReq) 535018a303SLinJiawei val qSignReg = RegEnable((aSign ^ bSign) && !divBy0, newReq) 545018a303SLinJiawei val bReg = RegEnable(bVal, newReq) 555018a303SLinJiawei val aValx2Reg = RegEnable(Cat(aVal, "b0".U), newReq) 565018a303SLinJiawei val ctrlReg = RegEnable(ctrl, newReq) 575018a303SLinJiawei val uopReg = RegEnable(uop, newReq) 585018a303SLinJiawei 595018a303SLinJiawei val cnt = Counter(len) 607c8efd4aSYinan Xu when (newReq && !io.in.bits.uop.roqIdx.needFlush(io.redirectIn, io.flushIn)) { 615018a303SLinJiawei state := s_log2 625018a303SLinJiawei } .elsewhen (state === s_log2) { 635018a303SLinJiawei // `canSkipShift` is calculated as following: 645018a303SLinJiawei // bEffectiveBit = Log2(bVal, XLEN) + 1.U 655018a303SLinJiawei // aLeadingZero = 64.U - aEffectiveBit = 64.U - (Log2(aVal, XLEN) + 1.U) 665018a303SLinJiawei // canSkipShift = aLeadingZero + bEffectiveBit 675018a303SLinJiawei // = 64.U - (Log2(aVal, XLEN) + 1.U) + Log2(bVal, XLEN) + 1.U 685018a303SLinJiawei // = 64.U + Log2(bVal, XLEN) - Log2(aVal, XLEN) 695018a303SLinJiawei // = (64.U | Log2(bVal, XLEN)) - Log2(aVal, XLEN) // since Log2(bVal, XLEN) < 64.U 705018a303SLinJiawei val canSkipShift = (64.U | Log2(bReg)) - Log2(aValx2Reg) 715018a303SLinJiawei // When divide by 0, the quotient should be all 1's. 725018a303SLinJiawei // Therefore we can not shift in 0s here. 735018a303SLinJiawei // We do not skip any shift to avoid this. 745018a303SLinJiawei cnt.value := Mux(divBy0Reg, 0.U, Mux(canSkipShift >= (len-1).U, (len-1).U, canSkipShift)) 755018a303SLinJiawei state := s_shift 765018a303SLinJiawei } .elsewhen (state === s_shift) { 775018a303SLinJiawei shiftReg := aValx2Reg << cnt.value 785018a303SLinJiawei state := s_compute 795018a303SLinJiawei } .elsewhen (state === s_compute) { 805018a303SLinJiawei val enough = hi.asUInt >= bReg.asUInt 815018a303SLinJiawei shiftReg := Cat(Mux(enough, hi - bReg, hi)(len - 1, 0), lo, enough) 825018a303SLinJiawei cnt.inc() 835018a303SLinJiawei when (cnt.value === (len-1).U) { state := s_finish } 845018a303SLinJiawei } .elsewhen (state === s_finish) { 855018a303SLinJiawei when(io.out.ready){ 865018a303SLinJiawei state := s_idle 875018a303SLinJiawei } 885018a303SLinJiawei } 895018a303SLinJiawei 902d7c7105SYinan Xu val kill = state=/=s_idle && uopReg.roqIdx.needFlush(io.redirectIn, io.flushIn) 91ff8496b2SLinJiawei when(kill){ 925018a303SLinJiawei state := s_idle 935018a303SLinJiawei } 945018a303SLinJiawei 955018a303SLinJiawei val r = hi(len, 1) 965018a303SLinJiawei val resQ = Mux(qSignReg, -lo, lo) 975018a303SLinJiawei val resR = Mux(aSignReg, -r, r) 985018a303SLinJiawei 995018a303SLinJiawei val xlen = io.out.bits.data.getWidth 1005018a303SLinJiawei val res = Mux(ctrlReg.isHi, resR, resQ) 1015018a303SLinJiawei io.out.bits.data := Mux(ctrlReg.isW, SignExt(res(31,0),xlen), res) 1025018a303SLinJiawei io.out.bits.uop := uopReg 1035018a303SLinJiawei 104d0d8f03aSYinan Xu io.out.valid := state === s_finish 1055018a303SLinJiawei io.in.ready := state === s_idle 1065018a303SLinJiawei} 107