xref: /XiangShan/src/main/scala/xiangshan/backend/fu/Radix2Divider.scala (revision c6d439803a044ea209139672b25e35fe8d7f4aa0)
1*c6d43980SLemover/***************************************************************************************
2*c6d43980SLemover* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3*c6d43980SLemover*
4*c6d43980SLemover* XiangShan is licensed under Mulan PSL v2.
5*c6d43980SLemover* You can use this software according to the terms and conditions of the Mulan PSL v2.
6*c6d43980SLemover* You may obtain a copy of Mulan PSL v2 at:
7*c6d43980SLemover*          http://license.coscl.org.cn/MulanPSL2
8*c6d43980SLemover*
9*c6d43980SLemover* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
10*c6d43980SLemover* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
11*c6d43980SLemover* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
12*c6d43980SLemover*
13*c6d43980SLemover* See the Mulan PSL v2 for more details.
14*c6d43980SLemover***************************************************************************************/
15*c6d43980SLemover
165018a303SLinJiaweipackage xiangshan.backend.fu
175018a303SLinJiawei
182225d46eSJiawei Linimport chipsalliance.rocketchip.config.Parameters
195018a303SLinJiaweiimport chisel3._
205018a303SLinJiaweiimport chisel3.util._
215018a303SLinJiaweiimport xiangshan._
225018a303SLinJiaweiimport utils._
235018a303SLinJiawei
242225d46eSJiawei Linabstract class AbstractDivider(len: Int)(implicit p: Parameters) extends FunctionUnit(len){
255018a303SLinJiawei  val ctrl = IO(Input(new MulDivCtrl))
265018a303SLinJiawei  val sign = ctrl.sign
275018a303SLinJiawei}
285018a303SLinJiawei
292225d46eSJiawei Linclass Radix2Divider(len: Int)(implicit p: Parameters) extends AbstractDivider(len) {
305018a303SLinJiawei
315018a303SLinJiawei  def abs(a: UInt, sign: Bool): (Bool, UInt) = {
325018a303SLinJiawei    val s = a(len - 1) && sign
335018a303SLinJiawei    (s, Mux(s, -a, a))
345018a303SLinJiawei  }
355018a303SLinJiawei
365018a303SLinJiawei  val s_idle :: s_log2 :: s_shift :: s_compute :: s_finish :: Nil = Enum(5)
375018a303SLinJiawei  val state = RegInit(s_idle)
385018a303SLinJiawei  val newReq = (state === s_idle) && io.in.fire()
395018a303SLinJiawei
405018a303SLinJiawei  val (a, b) = (io.in.bits.src(0), io.in.bits.src(1))
415018a303SLinJiawei  val divBy0 = b === 0.U(len.W)
425018a303SLinJiawei  val divBy0Reg = RegEnable(divBy0, newReq)
435018a303SLinJiawei
445018a303SLinJiawei  val shiftReg = Reg(UInt((1 + len * 2).W))
455018a303SLinJiawei  val hi = shiftReg(len * 2, len)
465018a303SLinJiawei  val lo = shiftReg(len - 1, 0)
475018a303SLinJiawei
485018a303SLinJiawei  val uop = io.in.bits.uop
495018a303SLinJiawei
505018a303SLinJiawei  val (aSign, aVal) = abs(a, sign)
515018a303SLinJiawei  val (bSign, bVal) = abs(b, sign)
525018a303SLinJiawei  val aSignReg = RegEnable(aSign, newReq)
535018a303SLinJiawei  val qSignReg = RegEnable((aSign ^ bSign) && !divBy0, newReq)
545018a303SLinJiawei  val bReg = RegEnable(bVal, newReq)
555018a303SLinJiawei  val aValx2Reg = RegEnable(Cat(aVal, "b0".U), newReq)
565018a303SLinJiawei  val ctrlReg = RegEnable(ctrl, newReq)
575018a303SLinJiawei  val uopReg = RegEnable(uop, newReq)
585018a303SLinJiawei
595018a303SLinJiawei  val cnt = Counter(len)
607c8efd4aSYinan Xu  when (newReq && !io.in.bits.uop.roqIdx.needFlush(io.redirectIn, io.flushIn)) {
615018a303SLinJiawei    state := s_log2
625018a303SLinJiawei  } .elsewhen (state === s_log2) {
635018a303SLinJiawei    // `canSkipShift` is calculated as following:
645018a303SLinJiawei    //   bEffectiveBit = Log2(bVal, XLEN) + 1.U
655018a303SLinJiawei    //   aLeadingZero = 64.U - aEffectiveBit = 64.U - (Log2(aVal, XLEN) + 1.U)
665018a303SLinJiawei    //   canSkipShift = aLeadingZero + bEffectiveBit
675018a303SLinJiawei    //     = 64.U - (Log2(aVal, XLEN) + 1.U) + Log2(bVal, XLEN) + 1.U
685018a303SLinJiawei    //     = 64.U + Log2(bVal, XLEN) - Log2(aVal, XLEN)
695018a303SLinJiawei    //     = (64.U | Log2(bVal, XLEN)) - Log2(aVal, XLEN)  // since Log2(bVal, XLEN) < 64.U
705018a303SLinJiawei    val canSkipShift = (64.U | Log2(bReg)) - Log2(aValx2Reg)
715018a303SLinJiawei    // When divide by 0, the quotient should be all 1's.
725018a303SLinJiawei    // Therefore we can not shift in 0s here.
735018a303SLinJiawei    // We do not skip any shift to avoid this.
745018a303SLinJiawei    cnt.value := Mux(divBy0Reg, 0.U, Mux(canSkipShift >= (len-1).U, (len-1).U, canSkipShift))
755018a303SLinJiawei    state := s_shift
765018a303SLinJiawei  } .elsewhen (state === s_shift) {
775018a303SLinJiawei    shiftReg := aValx2Reg << cnt.value
785018a303SLinJiawei    state := s_compute
795018a303SLinJiawei  } .elsewhen (state === s_compute) {
805018a303SLinJiawei    val enough = hi.asUInt >= bReg.asUInt
815018a303SLinJiawei    shiftReg := Cat(Mux(enough, hi - bReg, hi)(len - 1, 0), lo, enough)
825018a303SLinJiawei    cnt.inc()
835018a303SLinJiawei    when (cnt.value === (len-1).U) { state := s_finish }
845018a303SLinJiawei  } .elsewhen (state === s_finish) {
855018a303SLinJiawei    when(io.out.ready){
865018a303SLinJiawei      state := s_idle
875018a303SLinJiawei    }
885018a303SLinJiawei  }
895018a303SLinJiawei
902d7c7105SYinan Xu  val kill = state=/=s_idle && uopReg.roqIdx.needFlush(io.redirectIn, io.flushIn)
91ff8496b2SLinJiawei  when(kill){
925018a303SLinJiawei    state := s_idle
935018a303SLinJiawei  }
945018a303SLinJiawei
955018a303SLinJiawei  val r = hi(len, 1)
965018a303SLinJiawei  val resQ = Mux(qSignReg, -lo, lo)
975018a303SLinJiawei  val resR = Mux(aSignReg, -r, r)
985018a303SLinJiawei
995018a303SLinJiawei  val xlen = io.out.bits.data.getWidth
1005018a303SLinJiawei  val res = Mux(ctrlReg.isHi, resR, resQ)
1015018a303SLinJiawei  io.out.bits.data := Mux(ctrlReg.isW, SignExt(res(31,0),xlen), res)
1025018a303SLinJiawei  io.out.bits.uop := uopReg
1035018a303SLinJiawei
104d0d8f03aSYinan Xu  io.out.valid := state === s_finish
1055018a303SLinJiawei  io.in.ready := state === s_idle
1065018a303SLinJiawei}
107