xref: /XiangShan/src/main/scala/xiangshan/mem/vector/VSplit.scala (revision 81b02df568e6e33c649394c6a76f24c2ead22990)
1/***************************************************************************************
2  * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3  * Copyright (c) 2020-2021 Peng Cheng Laboratory
4  *
5  * XiangShan is licensed under Mulan PSL v2.
6  * You can use this software according to the terms and conditions of the Mulan PSL v2.
7  * You may obtain a copy of Mulan PSL v2 at:
8  *          http://license.coscl.org.cn/MulanPSL2
9  *
10  * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11  * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12  * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13  *
14  * See the Mulan PSL v2 for more details.
15  ***************************************************************************************/
16
17package xiangshan.mem
18
19import org.chipsalliance.cde.config.Parameters
20import chisel3._
21import chisel3.util._
22import utils._
23import utility._
24import xiangshan._
25import xiangshan.backend.rob.RobPtr
26import xiangshan.backend.Bundles._
27import xiangshan.mem._
28import xiangshan.backend.fu.vector.Bundles._
29
30
31class VSplitPipeline(isVStore: Boolean = false)(implicit p: Parameters) extends VLSUModule{
32  val io = IO(new VSplitPipelineIO(isVStore))
33  // will be override later
34  def us_whole_reg(fuOpType: UInt): Bool = false.B
35  def us_mask(fuOpType: UInt): Bool = false.B
36  def us_fof(fuOpType: UInt): Bool = false.B
37  //TODO vdIdxReg should no longer be useful, don't delete it for now
38  val vdIdxReg = RegInit(0.U(3.W))
39
40  val s1_ready = WireInit(false.B)
41  io.in.ready := s1_ready
42
43  /**-----------------------------------------------------------
44    * s0 stage
45    * decode and generate AlignedType, uop mask, preIsSplit
46    * ----------------------------------------------------------
47    */
48  val s0_uop = io.in.bits.uop
49  val s0_vtype = s0_uop.vpu.vtype
50  val s0_sew = s0_vtype.vsew
51  val s0_eew = s0_uop.vpu.veew
52  val s0_lmul = s0_vtype.vlmul
53  // when load whole register or unit-stride masked , emul should be 1
54  val s0_fuOpType = s0_uop.fuOpType
55  val s0_mop = s0_fuOpType(6, 5)
56  val s0_nf = Mux(us_whole_reg(s0_fuOpType), 0.U, s0_uop.vpu.nf)
57  val s0_vm = s0_uop.vpu.vm
58  val s0_emul = Mux(us_whole_reg(s0_fuOpType) ,GenUSWholeEmul(s0_uop.vpu.nf), Mux(us_mask(s0_fuOpType), 0.U(mulBits.W), EewLog2(s0_eew) - s0_sew + s0_lmul))
59  val s0_preIsSplit = !(isUnitStride(s0_mop) && !us_fof(s0_fuOpType))
60  val s0_nfield        = s0_nf +& 1.U
61
62  val s0_valid         = Wire(Bool())
63  val s0_kill          = io.in.bits.uop.robIdx.needFlush(io.redirect)
64  val s0_can_go        = s1_ready
65  val s0_fire          = s0_valid && s0_can_go
66  val s0_out           = Wire(new VLSBundle(isVStore))
67
68  val isUsWholeReg = isUnitStride(s0_mop) && us_whole_reg(s0_fuOpType)
69  val isMaskReg = isUnitStride(s0_mop) && us_mask(s0_fuOpType)
70  val isSegment = s0_nf =/= 0.U && !us_whole_reg(s0_fuOpType)
71  val instType = Cat(isSegment, s0_mop)
72  val uopIdx = io.in.bits.uop.vpu.vuopIdx
73  val uopIdxInField = GenUopIdxInField(instType, s0_emul, s0_lmul, uopIdx)
74  val vdIdxInField = GenVdIdxInField(instType, s0_emul, s0_lmul, uopIdxInField)
75  val lmulLog2 = Mux(s0_lmul.asSInt >= 0.S, 0.U, s0_lmul)
76  val emulLog2 = Mux(s0_emul.asSInt >= 0.S, 0.U, s0_emul)
77  val numEewLog2 = emulLog2 - EewLog2(s0_eew)
78  val numSewLog2 = lmulLog2 - s0_sew
79  val numFlowsSameVdLog2 = Mux(
80    isIndexed(instType),
81    log2Up(VLENB).U - s0_sew(1,0),
82    log2Up(VLENB).U - s0_eew(1,0)
83  )
84  // numUops = nf * max(lmul, emul)
85  val lmulLog2Pos = Mux(s0_lmul.asSInt < 0.S, 0.U, s0_lmul)
86  val emulLog2Pos = Mux(s0_emul.asSInt < 0.S, 0.U, s0_emul)
87  val numUops = Mux(
88    isIndexed(s0_mop) && s0_lmul.asSInt > s0_emul.asSInt,
89    (s0_nf +& 1.U) << lmulLog2Pos,
90    (s0_nf +& 1.U) << emulLog2Pos
91  )
92
93  val vvl = io.in.bits.src_vl.asTypeOf(VConfig()).vl
94  val evl = Mux(isUsWholeReg,
95                GenUSWholeRegVL(io.in.bits.uop.vpu.nf +& 1.U, s0_eew),
96                Mux(isMaskReg,
97                    GenUSMaskRegVL(vvl),
98                    vvl))
99  val vvstart = io.in.bits.uop.vpu.vstart
100  val alignedType = Mux(isIndexed(instType), s0_sew(1, 0), s0_eew(1, 0))
101  val broadenAligendType = Mux(s0_preIsSplit, Cat("b0".U, alignedType), "b100".U) // if is unit-stride, use 128-bits memory access
102  val flowsLog2 = GenRealFlowLog2(instType, s0_emul, s0_lmul, s0_eew, s0_sew)
103  val flowsPrevThisUop = (uopIdxInField << flowsLog2).asUInt // # of flows before this uop in a field
104  val flowsPrevThisVd = (vdIdxInField << numFlowsSameVdLog2).asUInt // # of flows before this vd in a field
105  val flowsIncludeThisUop = ((uopIdxInField +& 1.U) << flowsLog2).asUInt // # of flows before this uop besides this uop
106  val flowNum = io.in.bits.flowNum.get
107  // max index in vd, only use in index instructions for calculate index
108  val maxIdxInVdIndex = GenVLMAX(Mux(s0_emul.asSInt > 0.S, 0.U, s0_emul), s0_eew(1, 0))
109  val indexVlMaxInVd = GenVlMaxMask(maxIdxInVdIndex, elemIdxBits)
110
111  // For vectore indexed  instructions:
112  //  When emul is greater than lmul, multiple uop correspond to a Vd, e.g:
113  //    vsetvli	t1,t0,e8,m1,ta,ma    lmul = 1
114  //    vluxei16.v	v2,(a0),v8       emul = 2
115  //    In this case, we need to ensure the flownumis right shift by flowsPrevThisUop, However, the mask passed to mergebuff is right shift by flowsPrevThisVd e.g:
116  //      vl = 9
117  //      srcMask = 0x1FF
118  //      uopIdxInField = 0 and vdIdxInField = 0, flowMask = 0x00FF, toMergeBuffMask = 0x01FF
119  //      uopIdxInField = 1 and vdIdxInField = 0, flowMask = 0x0001, toMergeBuffMask = 0x01FF
120  //      uopIdxInField = 0 and vdIdxInField = 0, flowMask = 0x0000, toMergeBuffMask = 0x0000
121  //      uopIdxInField = 0 and vdIdxInField = 0, flowMask = 0x0000, toMergeBuffMask = 0x0000
122  val isSpecialIndexed = isIndexed(instType) && s0_emul.asSInt > s0_lmul.asSInt
123
124  val srcMask = GenFlowMask(Mux(s0_vm, Fill(VLEN, 1.U(1.W)), io.in.bits.src_mask), vvstart, evl, true)
125  val srcMaskShiftBits = Mux(isSpecialIndexed, flowsPrevThisUop, flowsPrevThisVd)
126
127  val flowMask = ((srcMask &
128    UIntToMask(flowsIncludeThisUop.asUInt, VLEN + 1) &
129    (~UIntToMask(flowsPrevThisUop.asUInt, VLEN)).asUInt
130  ) >> srcMaskShiftBits)(VLENB - 1, 0)
131  val indexedSrcMask = (srcMask >> flowsPrevThisVd).asUInt //only for index instructions
132
133  // Used to calculate the element index.
134  // See 'splitbuffer' for 'io.out.splitIdxOffset' and 'mergebuffer' for 'merge data'
135  val indexedSplitOffset = Mux(isSpecialIndexed, flowsPrevThisUop - flowsPrevThisVd, 0.U) // only for index instructions of emul > lmul
136  val vlmax = GenVLMAX(s0_lmul, s0_sew)
137
138  // connect
139  s0_out := DontCare
140  s0_out match {case x =>
141    x.uop := io.in.bits.uop
142    x.uop.vpu.vl := evl
143    x.uop.uopIdx := uopIdx
144    x.uop.numUops := numUops
145    x.uop.lastUop := (uopIdx +& 1.U) === numUops
146    x.uop.vpu.nf  := s0_nf
147    x.flowMask := flowMask
148    x.indexedSrcMask := indexedSrcMask // Only vector indexed instructions uses it
149    x.indexedSplitOffset := indexedSplitOffset
150    x.byteMask := GenUopByteMask(flowMask, Cat("b0".U, alignedType))(VLENB - 1, 0)
151    x.fof := isUnitStride(s0_mop) && us_fof(s0_fuOpType)
152    x.baseAddr := io.in.bits.src_rs1
153    x.stride := io.in.bits.src_stride
154    x.flowNum := flowNum
155    x.nfields := s0_nfield
156    x.vm := s0_vm
157    x.usWholeReg := isUsWholeReg
158    x.usMaskReg := isMaskReg
159    x.eew := s0_eew
160    x.sew := s0_sew
161    x.emul := s0_emul
162    x.lmul := s0_lmul
163    x.vlmax := Mux(isUsWholeReg, evl, vlmax)
164    x.instType := instType
165    x.data := io.in.bits.src_vs3
166    x.vdIdxInField := vdIdxInField
167    x.preIsSplit  := s0_preIsSplit
168    x.alignedType := broadenAligendType
169    x.indexVlMaxInVd := indexVlMaxInVd
170  }
171  s0_valid := io.in.valid && !s0_kill
172  /**-------------------------------------
173    * s1 stage
174    * ------------------------------------
175    * generate UopOffset
176    */
177  val s1_valid         = RegInit(false.B)
178  val s1_kill          = Wire(Bool())
179  val s1_in            = Wire(new VLSBundle(isVStore))
180  val s1_can_go        = io.out.ready && io.toMergeBuffer.resp.valid
181  val s1_fire          = s1_valid && !s1_kill && s1_can_go
182
183  s1_ready         := s1_kill || !s1_valid || io.out.ready && io.toMergeBuffer.resp.valid
184
185  when(s0_fire){
186    s1_valid := true.B
187  }.elsewhen(s1_fire){
188    s1_valid := false.B
189  }.elsewhen(s1_kill){
190    s1_valid := false.B
191  }
192  s1_in := RegEnable(s0_out, s0_fire)
193
194  val s1_flowNum          = s1_in.flowNum
195  val s1_uop              = s1_in.uop
196  val s1_uopidx           = s1_uop.vpu.vuopIdx
197  val s1_nf               = s1_uop.vpu.nf
198  val s1_nfields          = s1_in.nfields
199  val s1_eew              = s1_in.eew
200  val s1_emul             = s1_in.emul
201  val s1_lmul             = s1_in.lmul
202  val s1_instType         = s1_in.instType
203  val s1_stride           = s1_in.stride
204  val s1_vmask            = FillInterleaved(8, s1_in.byteMask)(VLEN-1, 0)
205  val s1_alignedType      = s1_in.alignedType
206  val s1_isSpecialIndexed = isIndexed(s1_instType) && s1_emul.asSInt > s1_lmul.asSInt
207  val s1_mask             = Mux(s1_isSpecialIndexed, s1_in.indexedSrcMask, s1_in.flowMask)
208  val s1_vdIdx            = s1_in.vdIdxInField
209  val s1_fof              = s1_in.fof
210  val s1_notIndexedStride = Mux( // stride for strided/unit-stride instruction
211    isStrided(s1_instType),
212    s1_stride(XLEN - 1, 0), // for strided load, stride = x[rs2]
213    s1_nfields << s1_eew(1, 0) // for unit-stride load, stride = eew * NFIELDS
214  )
215
216  val stride     = Mux(isIndexed(s1_instType), s1_stride, s1_notIndexedStride).asUInt // if is index instructions, get index when split
217  val uopOffset  = genVUopOffset(s1_instType, s1_fof, s1_uopidx, s1_nf, s1_eew(1, 0), stride, s1_alignedType)
218  val activeNum  = Mux(s1_in.preIsSplit, PopCount(s1_in.flowMask), s1_flowNum)
219
220  s1_kill               := s1_in.uop.robIdx.needFlush(io.redirect)
221
222  // query mergeBuffer
223  io.toMergeBuffer.req.valid             := s1_fire // only can_go will get MergeBuffer entry
224  io.toMergeBuffer.req.bits.flowNum      := activeNum
225  io.toMergeBuffer.req.bits.data         := s1_in.data
226  io.toMergeBuffer.req.bits.uop          := s1_in.uop
227  io.toMergeBuffer.req.bits.mask         := s1_mask
228  io.toMergeBuffer.req.bits.vaddr        := DontCare
229  io.toMergeBuffer.req.bits.vdIdx        := s1_vdIdx  //TODO vdIdxReg should no longer be useful, don't delete it for now
230  io.toMergeBuffer.req.bits.fof          := s1_in.fof
231  io.toMergeBuffer.req.bits.vlmax        := s1_in.vlmax
232//   io.toMergeBuffer.req.bits.vdOffset :=
233
234  //TODO vdIdxReg should no longer be useful, don't delete it for now
235//  when (s1_in.uop.lastUop && s1_fire || s1_kill) {
236//    vdIdxReg := 0.U
237//  }.elsewhen(s1_fire) {
238//    vdIdxReg := vdIdxReg + 1.U
239//    XSError(vdIdxReg + 1.U === 0.U, s"Overflow! The number of vd should be less than 8\n")
240//  }
241  // out connect
242  io.out.valid          := s1_valid && io.toMergeBuffer.resp.valid && (activeNum =/= 0.U) // if activeNum == 0, this uop do nothing, can be killed.
243  io.out.bits           := s1_in
244  io.out.bits.uopOffset := uopOffset
245  io.out.bits.stride    := stride
246  io.out.bits.mBIndex   := io.toMergeBuffer.resp.bits.mBIndex
247
248  XSPerfAccumulate("split_out",     io.out.fire)
249  XSPerfAccumulate("pipe_block",    io.out.valid && !io.out.ready)
250  XSPerfAccumulate("mbuffer_block", s1_valid && io.out.ready && !io.toMergeBuffer.resp.valid)
251}
252
253abstract class VSplitBuffer(isVStore: Boolean = false)(implicit p: Parameters) extends VLSUModule{
254  val io = IO(new VSplitBufferIO(isVStore))
255
256  val uopq          = Reg(new VLSBundle(isVStore))
257  val allocated     = RegInit(false.B)
258  val needCancel    = WireInit(false.B)
259  val activeIssue   = Wire(Bool())
260  val inActiveIssue = Wire(Bool())
261  val splitFinish   = WireInit(false.B)
262
263  // for split
264  val splitIdx = RegInit(0.U(flowIdxBits.W))
265  val strideOffsetReg = RegInit(0.U(VLEN.W))
266
267  /**
268    * Redirect
269    */
270  val cancelEnq    = io.in.bits.uop.robIdx.needFlush(io.redirect)
271  val canEnqueue   = io.in.valid
272  val needEnqueue  = canEnqueue && !cancelEnq
273
274  // enqueue
275  val offset    = PopCount(needEnqueue)
276  val canAccept = !allocated || allocated && splitFinish && (activeIssue || inActiveIssue) // if is valid entry, need split finish and send last uop
277  io.in.ready  := canAccept
278  val doEnqueue = canAccept && needEnqueue
279
280  when(doEnqueue){
281    uopq := io.in.bits
282  }
283
284  //split uops
285  val issueValid       = allocated && !needCancel
286  val issueEntry       = uopq
287  val issueMbIndex     = issueEntry.mBIndex
288  val issueFlowNum     = issueEntry.flowNum
289  val issueBaseAddr    = issueEntry.baseAddr
290  val issueUop         = issueEntry.uop
291  val issueUopIdx      = issueUop.vpu.vuopIdx
292  val issueInstType    = issueEntry.instType
293  val issueUopOffset   = issueEntry.uopOffset
294  val issueEew         = issueEntry.eew
295  val issueSew         = issueEntry.sew
296  val issueLmul        = issueEntry.lmul
297  val issueEmul        = issueEntry.emul
298  val issueAlignedType = issueEntry.alignedType
299  val issuePreIsSplit  = issueEntry.preIsSplit
300  val issueByteMask    = issueEntry.byteMask
301  val issueVLMAXMask   = issueEntry.vlmax - 1.U
302  val issueIsWholeReg  = issueEntry.usWholeReg
303  val issueVLMAXLog2   = GenVLMAXLog2(issueEntry.lmul, issueSew)
304  val issueVlMaxInVd   = issueEntry.indexVlMaxInVd
305  val elemIdx = GenElemIdx(
306    instType = issueInstType,
307    emul = issueEmul,
308    lmul = issueLmul,
309    eew = issueEew,
310    sew = issueSew,
311    uopIdx = issueUopIdx,
312    flowIdx = splitIdx
313  ) // elemIdx inside an inst, for exception
314
315  val splitIdxOffset = issueEntry.indexedSplitOffset + splitIdx
316
317  val indexFlowInnerIdx = elemIdx & issueVlMaxInVd
318  val nfIdx = Mux(issueIsWholeReg, 0.U, elemIdx >> issueVLMAXLog2)
319  val fieldOffset = nfIdx << issueAlignedType // field offset inside a segment
320
321  val indexedStride    = IndexAddr( // index for indexed instruction
322    index = issueEntry.stride,
323    flow_inner_idx = indexFlowInnerIdx,
324    eew = issueEew
325  )
326  val issueStride = Mux(isIndexed(issueInstType), indexedStride, strideOffsetReg)
327  val vaddr = issueBaseAddr + issueUopOffset + issueStride
328  val mask = genVWmask128(vaddr ,issueAlignedType) // scala maske for flow
329  val flowMask = issueEntry.flowMask
330  val vecActive = (flowMask & UIntToOH(splitIdx)).orR
331  /*
332   * Unit-Stride split to one flow or two flow.
333   * for Unit-Stride, if uop's addr is aligned with 128-bits, split it to one flow, otherwise split two
334   */
335  val usLowBitsAddr    = getCheckAddrLowBits(issueBaseAddr, maxMemByteNum) + getCheckAddrLowBits(issueUopOffset, maxMemByteNum)
336  val usAligned128     = (getCheckAddrLowBits(usLowBitsAddr, maxMemByteNum) === 0.U)// addr 128-bit aligned
337  val usSplitMask      = genUSSplitMask(issueByteMask, splitIdx, getCheckAddrLowBits(usLowBitsAddr, maxMemByteNum))
338  val usNoSplit        = (usAligned128 || !getOverflowBit(getCheckAddrLowBits(usLowBitsAddr, maxMemByteNum) +& PopCount(usSplitMask), maxMemByteNum)) &&
339                          !issuePreIsSplit &&
340                          (splitIdx === 0.U)// unit-stride uop don't need to split into two flow
341  val usSplitVaddr     = genUSSplitAddr(vaddr, splitIdx)
342  val regOffset        = getCheckAddrLowBits(usLowBitsAddr, maxMemByteNum) // offset in 256-bits vd
343  XSError((splitIdx > 1.U && usNoSplit) || (splitIdx > 1.U && !issuePreIsSplit) , "Unit-Stride addr split error!\n")
344
345  // data
346  io.out.bits match { case x =>
347    x.uop                   := issueUop
348    x.vaddr                 := Mux(!issuePreIsSplit, usSplitVaddr, vaddr)
349    x.alignedType           := issueAlignedType
350    x.isvec                 := true.B
351    x.mask                  := Mux(!issuePreIsSplit, usSplitMask, mask)
352    x.reg_offset            := regOffset //for merge unit-stride data
353    x.vecActive             := Mux(!issuePreIsSplit, true.B, vecActive) // currently, unit-stride's flow always send to pipeline
354    x.is_first_ele          := DontCare
355    x.usSecondInv           := usNoSplit
356    x.elemIdx               := elemIdx
357    x.elemIdxInsideVd       := splitIdxOffset // if is Unit-Stride, elemIdx is the index of 2 splited mem request (for merge data)
358    x.uop_unit_stride_fof   := DontCare
359    x.isFirstIssue          := DontCare
360    x.mBIndex               := issueMbIndex
361  }
362
363  // redirect
364  needCancel := uopq.uop.robIdx.needFlush(io.redirect) && allocated
365
366 /* Execute logic */
367  /** Issue to scala pipeline**/
368  val allowIssue = io.out.ready
369  val issueCount = Mux(usNoSplit, 2.U, (PopCount(inActiveIssue) + PopCount(activeIssue))) // for dont need split unit-stride, issue two flow
370  splitFinish := splitIdx >= (issueFlowNum - issueCount)
371
372  // handshake
373  activeIssue := issueValid && allowIssue && (vecActive || !issuePreIsSplit) // active issue, current use in no unit-stride
374  inActiveIssue := issueValid && !vecActive && issuePreIsSplit
375  when (!issueEntry.uop.robIdx.needFlush(io.redirect)) {
376    when (!splitFinish) {
377      when (activeIssue || inActiveIssue) {
378        // The uop has not been entirly splited yet
379        splitIdx := splitIdx + issueCount
380        strideOffsetReg := Mux(!issuePreIsSplit, strideOffsetReg, strideOffsetReg + issueEntry.stride) // when normal unit-stride, don't use strideOffsetReg
381      }
382    }.otherwise {
383      when (activeIssue || inActiveIssue) {
384        // The uop is done spliting
385        splitIdx := 0.U(flowIdxBits.W) // initialize flowIdx
386        strideOffsetReg := 0.U
387      }
388    }
389  }.otherwise {
390    splitIdx := 0.U(flowIdxBits.W) // initialize flowIdx
391    strideOffsetReg := 0.U
392  }
393  // allocated
394  when(doEnqueue){ // if enqueue need to been cancelled, it will be false, so this have high priority
395    allocated := true.B
396  }.elsewhen(needCancel) { // redirect
397    allocated := false.B
398  }.elsewhen(splitFinish && (activeIssue || inActiveIssue)){ //dequeue
399    allocated := false.B
400  }
401
402  // out connect
403  io.out.valid := issueValid && (vecActive || !issuePreIsSplit) // TODO: inactive unit-stride uop do not send to pipeline
404
405  XSPerfAccumulate("out_valid",             io.out.valid)
406  XSPerfAccumulate("out_fire",              io.out.fire)
407  XSPerfAccumulate("out_fire_unitstride",   io.out.fire && !issuePreIsSplit)
408  XSPerfAccumulate("unitstride_vlenAlign",  io.out.fire && !issuePreIsSplit && getCheckAddrLowBits(io.out.bits.vaddr, maxMemByteNum) === 0.U)
409  XSPerfAccumulate("unitstride_invalid",    io.out.ready && issueValid && !issuePreIsSplit && PopCount(io.out.bits.mask).orR)
410}
411
412class VSSplitBufferImp(implicit p: Parameters) extends VSplitBuffer(isVStore = true){
413  // split data
414  val splitData = genVSData(
415        data = issueEntry.data.asUInt,
416        elemIdx = splitIdxOffset,
417        alignedType = issueAlignedType
418      )
419  val flowData = genVWdata(splitData, issueAlignedType)
420  val usSplitData      = genUSSplitData(issueEntry.data.asUInt, splitIdx, vaddr(3,0))
421
422  val sqIdx = issueUop.sqIdx + splitIdx
423  io.out.bits.uop.sqIdx := sqIdx
424
425  // send data to sq
426  val vstd = io.vstd.get
427  vstd.valid := issueValid && (vecActive || !issuePreIsSplit)
428  vstd.bits.uop := issueUop
429  vstd.bits.uop.sqIdx := sqIdx
430  vstd.bits.data := Mux(!issuePreIsSplit, usSplitData, flowData)
431  vstd.bits.debug := DontCare
432  vstd.bits.vdIdx.get := DontCare
433  vstd.bits.vdIdxInField.get := DontCare
434  vstd.bits.mask.get := Mux(!issuePreIsSplit, usSplitMask, mask)
435
436}
437
438class VLSplitBufferImp(implicit p: Parameters) extends VSplitBuffer(isVStore = false){
439  io.out.bits.uop.lqIdx := issueUop.lqIdx + splitIdx
440}
441
442class VSSplitPipelineImp(implicit p: Parameters) extends VSplitPipeline(isVStore = true){
443  override def us_whole_reg(fuOpType: UInt): Bool = fuOpType === VstuType.vsr
444  override def us_mask(fuOpType: UInt): Bool      = fuOpType === VstuType.vsm
445  override def us_fof(fuOpType: UInt): Bool       = false.B // dont have vector fof store
446}
447
448class VLSplitPipelineImp(implicit p: Parameters) extends VSplitPipeline(isVStore = false){
449
450  override def us_whole_reg(fuOpType: UInt): Bool = fuOpType === VlduType.vlr
451  override def us_mask(fuOpType: UInt): Bool      = fuOpType === VlduType.vlm
452  override def us_fof(fuOpType: UInt): Bool       = fuOpType === VlduType.vleff
453}
454
455class VLSplitImp(implicit p: Parameters) extends VLSUModule{
456  val io = IO(new VSplitIO(isVStore=false))
457  val splitPipeline = Module(new VLSplitPipelineImp())
458  val splitBuffer = Module(new VLSplitBufferImp())
459  // Split Pipeline
460  splitPipeline.io.in <> io.in
461  splitPipeline.io.redirect <> io.redirect
462  io.toMergeBuffer <> splitPipeline.io.toMergeBuffer
463
464  // Split Buffer
465  splitBuffer.io.in <> splitPipeline.io.out
466  splitBuffer.io.redirect <> io.redirect
467  io.out <> splitBuffer.io.out
468}
469
470class VSSplitImp(implicit p: Parameters) extends VLSUModule{
471  val io = IO(new VSplitIO(isVStore=true))
472  val splitPipeline = Module(new VSSplitPipelineImp())
473  val splitBuffer = Module(new VSSplitBufferImp())
474  // Split Pipeline
475  splitPipeline.io.in <> io.in
476  splitPipeline.io.redirect <> io.redirect
477  io.toMergeBuffer <> splitPipeline.io.toMergeBuffer
478
479  // Split Buffer
480  splitBuffer.io.in <> splitPipeline.io.out
481  splitBuffer.io.redirect <> io.redirect
482  io.out <> splitBuffer.io.out
483  io.vstd.get <> splitBuffer.io.vstd.get
484}
485
486