xref: /XiangShan/src/main/scala/xiangshan/backend/decode/DecodeUnitComp.scala (revision a63155a6a44b3c7714e55906b55ebf92e0efc125)
1/***************************************************************************************
2  * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
3  * Copyright (c) 2020-2021 Peng Cheng Laboratory
4  *
5  * XiangShan is licensed under Mulan PSL v2.
6  * You can use this software according to the terms and conditions of the Mulan PSL v2.
7  * You may obtain a copy of Mulan PSL v2 at:
8  *          http://license.coscl.org.cn/MulanPSL2
9  *
10  * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
11  * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
12  * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
13  *
14  * See the Mulan PSL v2 for more details.
15  ***************************************************************************************/
16
17package xiangshan.backend.decode
18
19import chipsalliance.rocketchip.config.Parameters
20import chisel3._
21import chisel3.util._
22import freechips.rocketchip.rocket.Instructions
23import freechips.rocketchip.util.uintToBitPat
24import utils._
25import utility._
26import xiangshan.ExceptionNO.illegalInstr
27import xiangshan._
28import xiangshan.backend.fu.fpu.FPU
29import xiangshan.backend.fu.FuType
30import freechips.rocketchip.rocket.Instructions._
31import xiangshan.backend.Bundles.{DecodedInst, StaticInst}
32import xiangshan.backend.decode.isa.bitfield.XSInstBitFields
33import xiangshan.backend.fu.vector.Bundles.{VSew, VType, VLmul}
34import yunsuan.VpermType
35
36import scala.collection.Seq
37
/**
  * Compile-time constants shared by the vector uop-splitting logic.
  */
trait VectorConstants {
  /** Upper bound on the number of per-register uops unrolled for one vector instruction. */
  val MAX_VLMUL: Int = 8

  /** Logical register index of the FP temporary that receives a scalar moved from the integer side. */
  val FP_TMP_REG_MV: Int = 32

  /** First logical register index of the vector temporaries (33~47, i.e. 15 registers). */
  val VECTOR_TMP_REG_LMUL: Int = 33
}
43
/**
  * Port bundle of [[DecodeUnitComp]].
  *
  * Field order is part of the hardware interface and must not be rearranged.
  */
class DecodeUnitCompIO(implicit p: Parameters) extends XSBundle {
  // Instruction handed to the decoder.
  val enq = new Bundle {
    val staticInst = Input(new StaticInst)
  }
  // Vector type forwarded to the simple decoder together with the instruction.
  val vtype = Input(new VType)
  // One flag per decode slot except one (DecodeWidth - 1 entries).
  // NOTE(review): presumably marks which of the other slots hold complex instructions — confirm against the driver.
  val isComplex = Input(Vec(DecodeWidth - 1, Bool()))
  // Per-slot valid bits on the instruction-buffer side.
  val validFromIBuf = Input(Vec(DecodeWidth, Bool()))
  // Per-slot ready bits on the rename side.
  val readyFromRename = Input(Vec(RenameWidth, Bool()))
  val deq = new Bundle {
    // Up to RenameWidth decoded uops produced in one cycle.
    val decodedInsts = Output(Vec(RenameWidth, new DecodedInst))
    val isVset = Output(Bool())
    val readyToIBuf = Output(Vec(DecodeWidth, Bool()))
    val validToRename = Output(Vec(RenameWidth, Bool()))
    // 3-bit count.
    // NOTE(review): presumably the number of uops emitted for the complex instruction this cycle — confirm.
    val complexNum = Output(UInt(3.W))
  }
  // Custom CSR control, passed through to the simple decoder.
  val csrCtrl = Input(new CustomCSRCtrlIO)
}
59
60/**
61  * @author zly
62  */
63class DecodeUnitComp()(implicit p : Parameters) extends XSModule with DecodeUnitConstants with VectorConstants {
64  val io = IO(new DecodeUnitCompIO)
65
66  val maxUopSize = MaxUopSize
67  //input bits
68  val staticInst = Wire(new StaticInst)
69
70
71  staticInst := io.enq.staticInst
72  private val inst: XSInstBitFields = staticInst.instr.asTypeOf(new XSInstBitFields)
73
74  val src1 = Cat(0.U(1.W), inst.RS1)
75  val src2 = Cat(0.U(1.W), inst.RS2)
76  val dest = Cat(0.U(1.W), inst.RD)
77
78
79  //output bits
80  val decodedInsts = Wire(Vec(RenameWidth, new DecodedInst))
81  val validToRename = Wire(Vec(RenameWidth, Bool()))
82  val readyToIBuf = Wire(Vec(DecodeWidth, Bool()))
83  val complexNum = Wire(UInt(3.W))
84
85  //output of DecodeUnit
86  val decodedInstsSimple = Wire(new DecodedInst)
87  val numOfUop = Wire(UInt(log2Up(maxUopSize+1).W))
88  val lmul = Wire(UInt(4.W))
89  val isVsetSimple = Wire(Bool())
90
91  //pre decode
92  val simple = Module(new DecodeUnit)
93  simple.io.enq.ctrlFlow := staticInst
94  simple.io.enq.vtype := io.vtype
95  simple.io.csrCtrl := io.csrCtrl
96  decodedInstsSimple := simple.io.deq.decodedInst
97  lmul := simple.io.deq.uopInfo.lmul
98  isVsetSimple := simple.io.deq.decodedInst.isVset
99  when(isVsetSimple) {
100    when(dest === 0.U && src1 === 0.U) {
101      decodedInstsSimple.fuOpType := VSETOpType.keepVl(simple.io.deq.decodedInst.fuOpType)
102    }.elsewhen(src1 === 0.U) {
103      decodedInstsSimple.fuOpType := VSETOpType.setVlmax(simple.io.deq.decodedInst.fuOpType)
104    }
105    when(io.vtype.illegal){
106      decodedInstsSimple.flushPipe := true.B
107    }
108  }
109  //Type of uop Div
110  val typeOfSplit = decodedInstsSimple.uopSplitType
111
112  when(typeOfSplit === UopSplitType.DIR) {
113    numOfUop := Mux(dest =/= 0.U, 2.U,
114      Mux(src1 =/= 0.U, 1.U,
115        Mux(VSETOpType.isVsetvl(decodedInstsSimple.fuOpType), 2.U, 1.U)))
116  } .otherwise {
117    numOfUop := simple.io.deq.uopInfo.numOfUop
118  }
119
120
121  //uop div up to maxUopSize
122  val csBundle = Wire(Vec(maxUopSize, new DecodedInst))
123  csBundle.map { case dst =>
124    dst := decodedInstsSimple
125    dst.firstUop := false.B
126    dst.lastUop := false.B
127  }
128
129  csBundle(0).numUops := numOfUop
130  csBundle(0).firstUop := true.B
131  csBundle(numOfUop - 1.U).lastUop := true.B
132
133  switch(typeOfSplit) {
134    is(UopSplitType.DIR) {
135      when(isVsetSimple) {
136        when(dest =/= 0.U) {
137          csBundle(0).fuType := FuType.vsetiwi.U
138          csBundle(0).fuOpType := VSETOpType.switchDest(decodedInstsSimple.fuOpType)
139          csBundle(0).flushPipe := false.B
140          csBundle(0).rfWen := true.B
141          csBundle(0).vecWen := false.B
142          csBundle(1).ldest := VCONFIG_IDX.U
143          csBundle(1).rfWen := false.B
144          csBundle(1).vecWen := true.B
145        }.elsewhen(src1 =/= 0.U) {
146          csBundle(0).ldest := VCONFIG_IDX.U
147        }.elsewhen(VSETOpType.isVsetvli(decodedInstsSimple.fuOpType)) {
148          csBundle(0).fuType := FuType.vsetfwf.U
149          csBundle(0).srcType(0) := SrcType.vp
150          csBundle(0).lsrc(0) := VCONFIG_IDX.U
151        }.elsewhen(VSETOpType.isVsetvl(decodedInstsSimple.fuOpType)) {
152          csBundle(0).srcType(0) := SrcType.reg
153          csBundle(0).srcType(1) := SrcType.imm
154          csBundle(0).lsrc(1) := 0.U
155          csBundle(0).ldest := FP_TMP_REG_MV.U
156          csBundle(0).fuType := FuType.i2f.U
157          csBundle(0).rfWen := false.B
158          csBundle(0).fpWen := true.B
159          csBundle(0).vecWen := false.B
160          csBundle(0).fpu.isAddSub := false.B
161          csBundle(0).fpu.typeTagIn := FPU.D
162          csBundle(0).fpu.typeTagOut := FPU.D
163          csBundle(0).fpu.fromInt := true.B
164          csBundle(0).fpu.wflags := false.B
165          csBundle(0).fpu.fpWen := true.B
166          csBundle(0).fpu.div := false.B
167          csBundle(0).fpu.sqrt := false.B
168          csBundle(0).fpu.fcvt := false.B
169          csBundle(0).flushPipe := false.B
170          csBundle(1).fuType := FuType.vsetfwf.U
171          csBundle(1).srcType(0) := SrcType.vp
172          csBundle(1).lsrc(0) := VCONFIG_IDX.U
173          csBundle(1).srcType(1) := SrcType.fp
174          csBundle(1).lsrc(1) := FP_TMP_REG_MV.U
175          csBundle(1).ldest := VCONFIG_IDX.U
176        }
177      }
178    }
179    is(UopSplitType.VEC_VVV) {
180      for (i <- 0 until MAX_VLMUL) {
181        csBundle(i).lsrc(0) := src1 + i.U
182        csBundle(i).lsrc(1) := src2 + i.U
183        csBundle(i).lsrc(2) := dest + i.U
184        csBundle(i).ldest := dest + i.U
185        csBundle(i).uopIdx := i.U
186      }
187    }
188    is(UopSplitType.VEC_VFV) {
189      for (i <- 0 until MAX_VLMUL) {
190        csBundle(i).lsrc(1) := src2 + i.U
191        csBundle(i).lsrc(2) := dest + i.U
192        csBundle(i).ldest := dest + i.U
193        csBundle(i).uopIdx := i.U
194      }
195    }
196    is(UopSplitType.VEC_EXT2) {
197      for (i <- 0 until MAX_VLMUL / 2) {
198        csBundle(2 * i).lsrc(1) := src2 + i.U
199        csBundle(2 * i).lsrc(2) := dest + (2 * i).U
200        csBundle(2 * i).ldest := dest + (2 * i).U
201        csBundle(2 * i).uopIdx := (2 * i).U
202        csBundle(2 * i + 1).lsrc(1) := src2 + i.U
203        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U
204        csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U
205        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
206      }
207    }
208    is(UopSplitType.VEC_EXT4) {
209      for (i <- 0 until MAX_VLMUL / 4) {
210        csBundle(4 * i).lsrc(1) := src2 + i.U
211        csBundle(4 * i).lsrc(2) := dest + (4 * i).U
212        csBundle(4 * i).ldest := dest + (4 * i).U
213        csBundle(4 * i).uopIdx := (4 * i).U
214        csBundle(4 * i + 1).lsrc(1) := src2 + i.U
215        csBundle(4 * i + 1).lsrc(2) := dest + (4 * i + 1).U
216        csBundle(4 * i + 1).ldest := dest + (4 * i + 1).U
217        csBundle(4 * i + 1).uopIdx := (4 * i + 1).U
218        csBundle(4 * i + 2).lsrc(1) := src2 + i.U
219        csBundle(4 * i + 2).lsrc(2) := dest + (4 * i + 2).U
220        csBundle(4 * i + 2).ldest := dest + (4 * i + 2).U
221        csBundle(4 * i + 2).uopIdx := (4 * i + 2).U
222        csBundle(4 * i + 3).lsrc(1) := src2 + i.U
223        csBundle(4 * i + 3).lsrc(2) := dest + (4 * i + 3).U
224        csBundle(4 * i + 3).ldest := dest + (4 * i + 3).U
225        csBundle(4 * i + 3).uopIdx := (4 * i + 3).U
226      }
227    }
228    is(UopSplitType.VEC_EXT8) {
229      for (i <- 0 until MAX_VLMUL) {
230        csBundle(i).lsrc(1) := src2
231        csBundle(i).lsrc(2) := dest + i.U
232        csBundle(i).ldest := dest + i.U
233        csBundle(i).uopIdx := i.U
234      }
235    }
236    is(UopSplitType.VEC_0XV) {
237      /*
238      FMV.D.X
239       */
240      csBundle(0).srcType(0) := SrcType.reg
241      csBundle(0).srcType(1) := SrcType.imm
242      csBundle(0).lsrc(1) := 0.U
243      csBundle(0).ldest := FP_TMP_REG_MV.U
244      csBundle(0).fuType := FuType.i2f.U
245      csBundle(0).rfWen := false.B
246      csBundle(0).fpWen := true.B
247      csBundle(0).vecWen := false.B
248      csBundle(0).fpu.isAddSub := false.B
249      csBundle(0).fpu.typeTagIn := FPU.D
250      csBundle(0).fpu.typeTagOut := FPU.D
251      csBundle(0).fpu.fromInt := true.B
252      csBundle(0).fpu.wflags := false.B
253      csBundle(0).fpu.fpWen := true.B
254      csBundle(0).fpu.div := false.B
255      csBundle(0).fpu.sqrt := false.B
256      csBundle(0).fpu.fcvt := false.B
257      /*
258      vfmv.s.f
259       */
260      csBundle(1).srcType(0) := SrcType.fp
261      csBundle(1).srcType(1) := SrcType.vp
262      csBundle(1).srcType(2) := SrcType.vp
263      csBundle(1).lsrc(0) := FP_TMP_REG_MV.U
264      csBundle(1).lsrc(1) := 0.U
265      csBundle(1).lsrc(2) := dest
266      csBundle(1).ldest := dest
267      csBundle(1).fuType := FuType.vppu.U
268      csBundle(1).fuOpType := VpermType.dummy
269      csBundle(1).rfWen := false.B
270      csBundle(1).fpWen := false.B
271      csBundle(1).vecWen := true.B
272    }
273    is(UopSplitType.VEC_VXV) {
274      /*
275      FMV.D.X
276       */
277      csBundle(0).srcType(0) := SrcType.reg
278      csBundle(0).srcType(1) := SrcType.imm
279      csBundle(0).lsrc(1) := 0.U
280      csBundle(0).ldest := FP_TMP_REG_MV.U
281      csBundle(0).fuType := FuType.i2f.U
282      csBundle(0).rfWen := false.B
283      csBundle(0).fpWen := true.B
284      csBundle(0).vecWen := false.B
285      csBundle(0).fpu.isAddSub := false.B
286      csBundle(0).fpu.typeTagIn := FPU.D
287      csBundle(0).fpu.typeTagOut := FPU.D
288      csBundle(0).fpu.fromInt := true.B
289      csBundle(0).fpu.wflags := false.B
290      csBundle(0).fpu.fpWen := true.B
291      csBundle(0).fpu.div := false.B
292      csBundle(0).fpu.sqrt := false.B
293      csBundle(0).fpu.fcvt := false.B
294      /*
295      LMUL
296       */
297      for (i <- 0 until MAX_VLMUL) {
298        csBundle(i + 1).srcType(0) := SrcType.fp
299        csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U
300        csBundle(i + 1).lsrc(1) := src2 + i.U
301        csBundle(i + 1).lsrc(2) := dest + i.U
302        csBundle(i + 1).ldest := dest + i.U
303        csBundle(i + 1).uopIdx := i.U
304      }
305    }
306    is(UopSplitType.VEC_VVW) {
307      for (i <- 0 until MAX_VLMUL / 2) {
308        csBundle(2 * i).lsrc(0) := src1 + i.U
309        csBundle(2 * i).lsrc(1) := src2 + i.U
310        csBundle(2 * i).lsrc(2) := dest + (2 * i).U
311        csBundle(2 * i).ldest := dest + (2 * i).U
312        csBundle(2 * i).uopIdx := (2 * i).U
313        csBundle(2 * i + 1).lsrc(0) := src1 + i.U
314        csBundle(2 * i + 1).lsrc(1) := src2 + i.U
315        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U
316        csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U
317        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
318      }
319    }
320    is(UopSplitType.VEC_VFW) {
321      for (i <- 0 until MAX_VLMUL / 2) {
322        csBundle(2 * i).lsrc(0) := src1
323        csBundle(2 * i).lsrc(1) := src2 + i.U
324        csBundle(2 * i).lsrc(2) := dest + (2 * i).U
325        csBundle(2 * i).ldest := dest + (2 * i).U
326        csBundle(2 * i).uopIdx := (2 * i).U
327        csBundle(2 * i + 1).lsrc(0) := src1
328        csBundle(2 * i + 1).lsrc(1) := src2 + i.U
329        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U
330        csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U
331        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
332      }
333    }
334    is(UopSplitType.VEC_WVW) {
335      for (i <- 0 until MAX_VLMUL / 2) {
336        csBundle(2 * i).lsrc(0) := src1 + i.U
337        csBundle(2 * i).lsrc(1) := src2 + (2 * i).U
338        csBundle(2 * i).lsrc(2) := dest + (2 * i).U
339        csBundle(2 * i).ldest := dest + (2 * i).U
340        csBundle(2 * i).uopIdx := (2 * i).U
341        csBundle(2 * i + 1).lsrc(0) := src1 + i.U
342        csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i + 1).U
343        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U
344        csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U
345        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
346      }
347    }
348    is(UopSplitType.VEC_VXW) {
349      /*
350      FMV.D.X
351       */
352      csBundle(0).srcType(0) := SrcType.reg
353      csBundle(0).srcType(1) := SrcType.imm
354      csBundle(0).lsrc(1) := 0.U
355      csBundle(0).ldest := FP_TMP_REG_MV.U
356      csBundle(0).fuType := FuType.i2f.U
357      csBundle(0).rfWen := false.B
358      csBundle(0).fpWen := true.B
359      csBundle(0).vecWen := false.B
360      csBundle(0).fpu.isAddSub := false.B
361      csBundle(0).fpu.typeTagIn := FPU.D
362      csBundle(0).fpu.typeTagOut := FPU.D
363      csBundle(0).fpu.fromInt := true.B
364      csBundle(0).fpu.wflags := false.B
365      csBundle(0).fpu.fpWen := true.B
366      csBundle(0).fpu.div := false.B
367      csBundle(0).fpu.sqrt := false.B
368      csBundle(0).fpu.fcvt := false.B
369
370      for (i <- 0 until MAX_VLMUL / 2) {
371        csBundle(2 * i + 1).srcType(0) := SrcType.fp
372        csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U
373        csBundle(2 * i + 1).lsrc(1) := src2 + i.U
374        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i).U
375        csBundle(2 * i + 1).ldest := dest + (2 * i).U
376        csBundle(2 * i + 1).uopIdx := (2 * i).U
377        csBundle(2 * i + 2).srcType(0) := SrcType.fp
378        csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U
379        csBundle(2 * i + 2).lsrc(1) := src2 + i.U
380        csBundle(2 * i + 2).lsrc(2) := dest + (2 * i + 1).U
381        csBundle(2 * i + 2).ldest := dest + (2 * i + 1).U
382        csBundle(2 * i + 2).uopIdx := (2 * i + 1).U
383      }
384    }
385    is(UopSplitType.VEC_WXW) {
386      /*
387      FMV.D.X
388       */
389      csBundle(0).srcType(0) := SrcType.reg
390      csBundle(0).srcType(1) := SrcType.imm
391      csBundle(0).lsrc(1) := 0.U
392      csBundle(0).ldest := FP_TMP_REG_MV.U
393      csBundle(0).fuType := FuType.i2f.U
394      csBundle(0).rfWen := false.B
395      csBundle(0).fpWen := true.B
396      csBundle(0).vecWen := false.B
397      csBundle(0).fpu.isAddSub := false.B
398      csBundle(0).fpu.typeTagIn := FPU.D
399      csBundle(0).fpu.typeTagOut := FPU.D
400      csBundle(0).fpu.fromInt := true.B
401      csBundle(0).fpu.wflags := false.B
402      csBundle(0).fpu.fpWen := true.B
403      csBundle(0).fpu.div := false.B
404      csBundle(0).fpu.sqrt := false.B
405      csBundle(0).fpu.fcvt := false.B
406
407      for (i <- 0 until MAX_VLMUL / 2) {
408        csBundle(2 * i + 1).srcType(0) := SrcType.fp
409        csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U
410        csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i).U
411        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i).U
412        csBundle(2 * i + 1).ldest := dest + (2 * i).U
413        csBundle(2 * i + 1).uopIdx := (2 * i).U
414        csBundle(2 * i + 2).srcType(0) := SrcType.fp
415        csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U
416        csBundle(2 * i + 2).lsrc(1) := src2 + (2 * i + 1).U
417        csBundle(2 * i + 2).lsrc(2) := dest + (2 * i + 1).U
418        csBundle(2 * i + 2).ldest := dest + (2 * i + 1).U
419        csBundle(2 * i + 2).uopIdx := (2 * i + 1).U
420      }
421    }
422    is(UopSplitType.VEC_WVV) {
423      for (i <- 0 until MAX_VLMUL / 2) {
424
425        csBundle(2 * i).lsrc(0) := src1 + i.U
426        csBundle(2 * i).lsrc(1) := src2 + (2 * i).U
427        csBundle(2 * i).lsrc(2) := dest + i.U
428        csBundle(2 * i).ldest := dest + i.U
429        csBundle(2 * i).uopIdx := (2 * i).U
430        csBundle(2 * i + 1).lsrc(0) := src1 + i.U
431        csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i + 1).U
432        csBundle(2 * i + 1).lsrc(2) := dest + i.U
433        csBundle(2 * i + 1).ldest := dest + i.U
434        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
435      }
436    }
437    is(UopSplitType.VEC_WFW) {
438      for (i <- 0 until MAX_VLMUL / 2) {
439        csBundle(2 * i).lsrc(0) := src1
440        csBundle(2 * i).lsrc(1) := src2 + (2 * i).U
441        csBundle(2 * i).lsrc(2) := dest + (2 * i).U
442        csBundle(2 * i).ldest := dest + (2 * i).U
443        csBundle(2 * i).uopIdx := (2 * i).U
444        csBundle(2 * i + 1).lsrc(0) := src1
445        csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i + 1).U
446        csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U
447        csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U
448        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
449      }
450    }
451    is(UopSplitType.VEC_WXV) {
452      /*
453      FMV.D.X
454       */
455      csBundle(0).srcType(0) := SrcType.reg
456      csBundle(0).srcType(1) := SrcType.imm
457      csBundle(0).lsrc(1) := 0.U
458      csBundle(0).ldest := FP_TMP_REG_MV.U
459      csBundle(0).fuType := FuType.i2f.U
460      csBundle(0).rfWen := false.B
461      csBundle(0).fpWen := true.B
462      csBundle(0).vecWen := false.B
463      csBundle(0).fpu.isAddSub := false.B
464      csBundle(0).fpu.typeTagIn := FPU.D
465      csBundle(0).fpu.typeTagOut := FPU.D
466      csBundle(0).fpu.fromInt := true.B
467      csBundle(0).fpu.wflags := false.B
468      csBundle(0).fpu.fpWen := true.B
469      csBundle(0).fpu.div := false.B
470      csBundle(0).fpu.sqrt := false.B
471      csBundle(0).fpu.fcvt := false.B
472
473      for (i <- 0 until MAX_VLMUL / 2) {
474        csBundle(2 * i + 1).srcType(0) := SrcType.fp
475        csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U
476        csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i).U
477        csBundle(2 * i + 1).lsrc(2) := dest + i.U
478        csBundle(2 * i + 1).ldest := dest + i.U
479        csBundle(2 * i + 1).uopIdx := (2 * i).U
480        csBundle(2 * i + 2).srcType(0) := SrcType.fp
481        csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U
482        csBundle(2 * i + 2).lsrc(1) := src2 + (2 * i + 1).U
483        csBundle(2 * i + 2).lsrc(2) := dest + i.U
484        csBundle(2 * i + 2).ldest := dest + i.U
485        csBundle(2 * i + 2).uopIdx := (2 * i + 1).U
486      }
487    }
488    is(UopSplitType.VEC_VVM) {
489      csBundle(0).lsrc(2) := dest
490      csBundle(0).ldest := dest
491      csBundle(0).uopIdx := 0.U
492      for (i <- 1 until MAX_VLMUL) {
493        csBundle(i).lsrc(0) := src1 + i.U
494        csBundle(i).lsrc(1) := src2 + i.U
495        csBundle(i).lsrc(2) := dest
496        csBundle(i).ldest := dest
497        csBundle(i).uopIdx := i.U
498      }
499      csBundle(numOfUop - 1.U).ldest := dest
500    }
501    is(UopSplitType.VEC_VFM) {
502      csBundle(0).lsrc(2) := dest
503      csBundle(0).ldest := dest
504      csBundle(0).uopIdx := 0.U
505      for (i <- 1 until MAX_VLMUL) {
506        csBundle(i).lsrc(0) := src1
507        csBundle(i).lsrc(1) := src2 + i.U
508        csBundle(i).lsrc(2) := dest
509        csBundle(i).ldest := dest
510        csBundle(i).uopIdx := i.U
511      }
512      csBundle(numOfUop - 1.U).ldest := dest
513    }
514    is(UopSplitType.VEC_VXM) {
515      /*
516      FMV.D.X
517       */
518      csBundle(0).srcType(0) := SrcType.reg
519      csBundle(0).srcType(1) := SrcType.imm
520      csBundle(0).lsrc(1) := 0.U
521      csBundle(0).ldest := FP_TMP_REG_MV.U
522      csBundle(0).fuType := FuType.i2f.U
523      csBundle(0).rfWen := false.B
524      csBundle(0).fpWen := true.B
525      csBundle(0).vecWen := false.B
526      csBundle(0).fpu.isAddSub := false.B
527      csBundle(0).fpu.typeTagIn := FPU.D
528      csBundle(0).fpu.typeTagOut := FPU.D
529      csBundle(0).fpu.fromInt := true.B
530      csBundle(0).fpu.wflags := false.B
531      csBundle(0).fpu.fpWen := true.B
532      csBundle(0).fpu.div := false.B
533      csBundle(0).fpu.sqrt := false.B
534      csBundle(0).fpu.fcvt := false.B
535      //LMUL
536      csBundle(1).srcType(0) := SrcType.fp
537      csBundle(1).lsrc(0) := FP_TMP_REG_MV.U
538      csBundle(1).lsrc(2) := dest
539      csBundle(1).ldest := dest
540      csBundle(1).uopIdx := 0.U
541      for (i <- 1 until MAX_VLMUL) {
542        csBundle(i + 1).srcType(0) := SrcType.fp
543        csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U
544        csBundle(i + 1).lsrc(1) := src2 + i.U
545        csBundle(i + 1).lsrc(2) := dest
546        csBundle(i + 1).ldest := dest
547        csBundle(i + 1).uopIdx := i.U
548      }
549      csBundle(numOfUop - 1.U).ldest := dest
550    }
551    is(UopSplitType.VEC_SLIDE1UP) {
552      /*
553      FMV.D.X
554       */
555      csBundle(0).srcType(0) := SrcType.reg
556      csBundle(0).srcType(1) := SrcType.imm
557      csBundle(0).lsrc(1) := 0.U
558      csBundle(0).ldest := FP_TMP_REG_MV.U
559      csBundle(0).fuType := FuType.i2f.U
560      csBundle(0).rfWen := false.B
561      csBundle(0).fpWen := true.B
562      csBundle(0).vecWen := false.B
563      csBundle(0).fpu.isAddSub := false.B
564      csBundle(0).fpu.typeTagIn := FPU.D
565      csBundle(0).fpu.typeTagOut := FPU.D
566      csBundle(0).fpu.fromInt := true.B
567      csBundle(0).fpu.wflags := false.B
568      csBundle(0).fpu.fpWen := true.B
569      csBundle(0).fpu.div := false.B
570      csBundle(0).fpu.sqrt := false.B
571      csBundle(0).fpu.fcvt := false.B
572      //LMUL
573      csBundle(1).srcType(0) := SrcType.fp
574      csBundle(1).lsrc(0) := FP_TMP_REG_MV.U
575      csBundle(1).lsrc(2) := dest
576      csBundle(1).ldest := dest
577      csBundle(1).uopIdx := 0.U
578      for (i <- 1 until MAX_VLMUL) {
579        csBundle(i + 1).srcType(0) := SrcType.vp
580        csBundle(i + 1).lsrc(0) := src2 + (i - 1).U
581        csBundle(i + 1).lsrc(1) := src2 + i.U
582        csBundle(i + 1).lsrc(2) := dest + i.U
583        csBundle(i + 1).ldest := dest + i.U
584        csBundle(i + 1).uopIdx := i.U
585      }
586    }
587    is(UopSplitType.VEC_FSLIDE1UP) {
588      //LMUL
589      csBundle(0).srcType(0) := SrcType.fp
590      csBundle(0).lsrc(0) := src1
591      csBundle(0).lsrc(1) := src2
592      csBundle(0).lsrc(2) := dest
593      csBundle(0).ldest := dest
594      csBundle(0).uopIdx := 0.U
595      for (i <- 1 until MAX_VLMUL) {
596        csBundle(i).srcType(0) := SrcType.vp
597        csBundle(i).lsrc(0) := src2 + (i - 1).U
598        csBundle(i).lsrc(1) := src2 + i.U
599        csBundle(i).lsrc(2) := dest + i.U
600        csBundle(i).ldest := dest + i.U
601        csBundle(i).uopIdx := i.U
602      }
603    }
604    is(UopSplitType.VEC_SLIDE1DOWN) { // lmul+lmul = 16
605      /*
606      FMV.D.X
607       */
608      csBundle(0).srcType(0) := SrcType.reg
609      csBundle(0).srcType(1) := SrcType.imm
610      csBundle(0).lsrc(1) := 0.U
611      csBundle(0).ldest := FP_TMP_REG_MV.U
612      csBundle(0).fuType := FuType.i2f.U
613      csBundle(0).rfWen := false.B
614      csBundle(0).fpWen := true.B
615      csBundle(0).vecWen := false.B
616      csBundle(0).fpu.isAddSub := false.B
617      csBundle(0).fpu.typeTagIn := FPU.D
618      csBundle(0).fpu.typeTagOut := FPU.D
619      csBundle(0).fpu.fromInt := true.B
620      csBundle(0).fpu.wflags := false.B
621      csBundle(0).fpu.fpWen := true.B
622      csBundle(0).fpu.div := false.B
623      csBundle(0).fpu.sqrt := false.B
624      csBundle(0).fpu.fcvt := false.B
625      //LMUL
626      for (i <- 0 until MAX_VLMUL) {
627        csBundle(2 * i + 1).srcType(0) := SrcType.vp
628        csBundle(2 * i + 1).srcType(1) := SrcType.vp
629        csBundle(2 * i + 1).lsrc(0) := src2 + (i + 1).U
630        csBundle(2 * i + 1).lsrc(1) := src2 + i.U
631        csBundle(2 * i + 1).lsrc(2) := dest + i.U
632        csBundle(2 * i + 1).ldest := VECTOR_TMP_REG_LMUL.U
633        csBundle(2 * i + 1).uopIdx := (2 * i).U
634        if (2 * i + 2 < MAX_VLMUL * 2) {
635          csBundle(2 * i + 2).srcType(0) := SrcType.fp
636          csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U
637          // csBundle(2 * i + 2).lsrc(1) := src2 + i.U         // DontCare
638          csBundle(2 * i + 2).lsrc(2) := VECTOR_TMP_REG_LMUL.U
639          csBundle(2 * i + 2).ldest := dest + i.U
640          csBundle(2 * i + 2).uopIdx := (2 * i + 1).U
641        }
642      }
643      csBundle(numOfUop - 1.U).srcType(0) := SrcType.fp
644      csBundle(numOfUop - 1.U).lsrc(0) := FP_TMP_REG_MV.U
645      csBundle(numOfUop - 1.U).ldest := dest + lmul - 1.U
646    }
647    is(UopSplitType.VEC_FSLIDE1DOWN) {
648      //LMUL
649      for (i <- 0 until MAX_VLMUL) {
650        csBundle(2 * i).srcType(0) := SrcType.vp
651        csBundle(2 * i).srcType(1) := SrcType.vp
652        csBundle(2 * i).lsrc(0) := src2 + (i + 1).U
653        csBundle(2 * i).lsrc(1) := src2 + i.U
654        csBundle(2 * i).lsrc(2) := dest + i.U
655        csBundle(2 * i).ldest := VECTOR_TMP_REG_LMUL.U
656        csBundle(2 * i).uopIdx := (2 * i).U
657        csBundle(2 * i + 1).srcType(0) := SrcType.fp
658        csBundle(2 * i + 1).lsrc(0) := src1
659        csBundle(2 * i + 1).lsrc(2) := VECTOR_TMP_REG_LMUL.U
660        csBundle(2 * i + 1).ldest := dest + i.U
661        csBundle(2 * i + 1).uopIdx := (2 * i + 1).U
662      }
663      csBundle(numOfUop - 1.U).srcType(0) := SrcType.fp
664      csBundle(numOfUop - 1.U).lsrc(0) := src1
665      csBundle(numOfUop - 1.U).ldest := dest + lmul - 1.U
666    }
667    is(UopSplitType.VEC_VRED) {
668      when(simple.io.enq.vtype.vlmul === "b001".U) {
669        csBundle(0).srcType(2) := SrcType.DC
670        csBundle(0).lsrc(0) := src2 + 1.U
671        csBundle(0).lsrc(1) := src2
672        csBundle(0).ldest := VECTOR_TMP_REG_LMUL.U
673        csBundle(0).uopIdx := 0.U
674      }
675      when(simple.io.enq.vtype.vlmul === "b010".U) {
676        csBundle(0).srcType(2) := SrcType.DC
677        csBundle(0).lsrc(0) := src2 + 1.U
678        csBundle(0).lsrc(1) := src2
679        csBundle(0).ldest := VECTOR_TMP_REG_LMUL.U
680        csBundle(0).uopIdx := 0.U
681
682        csBundle(1).srcType(2) := SrcType.DC
683        csBundle(1).lsrc(0) := src2 + 3.U
684        csBundle(1).lsrc(1) := src2 + 2.U
685        csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
686        csBundle(1).uopIdx := 1.U
687
688        csBundle(2).srcType(2) := SrcType.DC
689        csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U
690        csBundle(2).lsrc(1) := VECTOR_TMP_REG_LMUL.U
691        csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U
692        csBundle(2).uopIdx := 2.U
693      }
694      when(simple.io.enq.vtype.vlmul === "b011".U) {
695        for (i <- 0 until MAX_VLMUL) {
696          if (i < MAX_VLMUL - MAX_VLMUL / 2) {
697            csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U
698            csBundle(i).lsrc(1) := src2 + (i * 2).U
699            csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
700          } else if (i < MAX_VLMUL - MAX_VLMUL / 4) {
701            csBundle(i).lsrc(0) := (VECTOR_TMP_REG_LMUL + (i - MAX_VLMUL / 2) * 2 + 1).U
702            csBundle(i).lsrc(1) := (VECTOR_TMP_REG_LMUL + (i - MAX_VLMUL / 2) * 2).U
703            csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
704          } else if (i < MAX_VLMUL - MAX_VLMUL / 8) {
705            csBundle(6).lsrc(0) := (VECTOR_TMP_REG_LMUL + 5).U
706            csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U
707            csBundle(6).ldest := (VECTOR_TMP_REG_LMUL + 6).U
708          }
709          csBundle(i).srcType(2) := SrcType.DC
710          csBundle(i).uopIdx := i.U
711        }
712      }
713      when(simple.io.enq.vtype.vlmul.orR()) {
714        csBundle(numOfUop - 1.U).srcType(2) := SrcType.vp
715        csBundle(numOfUop - 1.U).lsrc(0) := src1
716        csBundle(numOfUop - 1.U).lsrc(1) := VECTOR_TMP_REG_LMUL.U + numOfUop - 2.U
717        csBundle(numOfUop - 1.U).lsrc(2) := dest
718        csBundle(numOfUop - 1.U).ldest := dest
719        csBundle(numOfUop - 1.U).uopIdx := numOfUop - 1.U
720      }
721    }
722    is(UopSplitType.VEC_VFRED) {
723      val vlmul = simple.io.enq.vtype.vlmul
724      val vsew = simple.io.enq.vtype.vsew
725      when(vlmul === VLmul.m8){
726        for (i <- 0 until 4) {
727          csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U
728          csBundle(i).lsrc(1) := src2 + (i * 2).U
729          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
730          csBundle(i).uopIdx := i.U
731        }
732        for (i <- 4 until 6) {
733          csBundle(i).lsrc(0) := (VECTOR_TMP_REG_LMUL + (i - 4) * 2 + 1).U
734          csBundle(i).lsrc(1) := (VECTOR_TMP_REG_LMUL + (i - 4) * 2).U
735          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
736          csBundle(i).uopIdx := i.U
737        }
738        csBundle(6).lsrc(0) := (VECTOR_TMP_REG_LMUL + 5).U
739        csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U
740        csBundle(6).ldest := (VECTOR_TMP_REG_LMUL + 6).U
741        csBundle(6).uopIdx := 6.U
742        when(vsew === VSew.e64) {
743          csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U
744          csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U
745          csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U
746          csBundle(7).vpu.fpu.isFoldTo1_2 := true.B
747          csBundle(7).uopIdx := 7.U
748          csBundle(8).lsrc(0) := src1
749          csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U
750          csBundle(8).ldest := dest
751          csBundle(8).uopIdx := 8.U
752        }
753        when(vsew === VSew.e32) {
754          csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U
755          csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U
756          csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U
757          csBundle(7).vpu.fpu.isFoldTo1_2 := true.B
758          csBundle(7).uopIdx := 7.U
759          csBundle(8).lsrc(0) := (VECTOR_TMP_REG_LMUL + 7).U
760          csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U
761          csBundle(8).ldest := (VECTOR_TMP_REG_LMUL + 8).U
762          csBundle(8).vpu.fpu.isFoldTo1_4 := true.B
763          csBundle(8).uopIdx := 8.U
764          csBundle(9).lsrc(0) := src1
765          csBundle(9).lsrc(1) := (VECTOR_TMP_REG_LMUL + 8).U
766          csBundle(9).ldest := dest
767          csBundle(9).uopIdx := 9.U
768        }
769        when(vsew === VSew.e16) {
770          csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U
771          csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U
772          csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U
773          csBundle(7).vpu.fpu.isFoldTo1_2 := true.B
774          csBundle(7).uopIdx := 7.U
775          csBundle(8).lsrc(0) := (VECTOR_TMP_REG_LMUL + 7).U
776          csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U
777          csBundle(8).ldest := (VECTOR_TMP_REG_LMUL + 8).U
778          csBundle(8).vpu.fpu.isFoldTo1_4 := true.B
779          csBundle(8).uopIdx := 8.U
780          csBundle(9).lsrc(0) := (VECTOR_TMP_REG_LMUL + 8).U
781          csBundle(9).lsrc(1) := (VECTOR_TMP_REG_LMUL + 8).U
782          csBundle(9).ldest := (VECTOR_TMP_REG_LMUL + 9).U
783          csBundle(9).vpu.fpu.isFoldTo1_8 := true.B
784          csBundle(9).uopIdx := 9.U
785          csBundle(10).lsrc(0) := src1
786          csBundle(10).lsrc(1) := (VECTOR_TMP_REG_LMUL + 9).U
787          csBundle(10).ldest := dest
788          csBundle(10).uopIdx := 10.U
789        }
790      }
791      when(vlmul === VLmul.m4) {
792        for (i <- 0 until 2) {
793          csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U
794          csBundle(i).lsrc(1) := src2 + (i * 2).U
795          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
796          csBundle(i).uopIdx := i.U
797        }
798        csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U
799        csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
800        csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U
801        csBundle(2).uopIdx := 2.U
802        when(vsew === VSew.e64) {
803          csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U
804          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
805          csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U
806          csBundle(3).vpu.fpu.isFoldTo1_2 := true.B
807          csBundle(3).uopIdx := 3.U
808          csBundle(4).lsrc(0) := src1
809          csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U
810          csBundle(4).ldest := dest
811          csBundle(4).uopIdx := 4.U
812        }
813        when(vsew === VSew.e32) {
814          csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U
815          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
816          csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U
817          csBundle(3).vpu.fpu.isFoldTo1_2 := true.B
818          csBundle(3).uopIdx := 3.U
819          csBundle(4).lsrc(0) := (VECTOR_TMP_REG_LMUL + 3).U
820          csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U
821          csBundle(4).ldest := (VECTOR_TMP_REG_LMUL + 4).U
822          csBundle(4).vpu.fpu.isFoldTo1_4 := true.B
823          csBundle(4).uopIdx := 4.U
824          csBundle(5).lsrc(0) := src1
825          csBundle(5).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U
826          csBundle(5).ldest := dest
827          csBundle(5).uopIdx := 5.U
828        }
829        when(vsew === VSew.e16) {
830          csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U
831          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
832          csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U
833          csBundle(3).vpu.fpu.isFoldTo1_2 := true.B
834          csBundle(3).uopIdx := 3.U
835          csBundle(4).lsrc(0) := (VECTOR_TMP_REG_LMUL + 3).U
836          csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U
837          csBundle(4).ldest := (VECTOR_TMP_REG_LMUL + 4).U
838          csBundle(4).vpu.fpu.isFoldTo1_4 := true.B
839          csBundle(4).uopIdx := 4.U
840          csBundle(5).lsrc(0) := (VECTOR_TMP_REG_LMUL + 4).U
841          csBundle(5).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U
842          csBundle(5).ldest := (VECTOR_TMP_REG_LMUL + 5).U
843          csBundle(5).vpu.fpu.isFoldTo1_8 := true.B
844          csBundle(5).uopIdx := 5.U
845          csBundle(6).lsrc(0) := src1
846          csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 5).U
847          csBundle(6).ldest := dest
848          csBundle(6).uopIdx := 6.U
849        }
850      }
851      when(vlmul === VLmul.m2) {
852        csBundle(0).lsrc(0) := src2 + 1.U
853        csBundle(0).lsrc(1) := src2 + 0.U
854        csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
855        csBundle(0).uopIdx := 0.U
856        when(vsew === VSew.e64) {
857          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
858          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
859          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
860          csBundle(1).vpu.fpu.isFoldTo1_2 := true.B
861          csBundle(1).uopIdx := 1.U
862          csBundle(2).lsrc(0) := src1
863          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
864          csBundle(2).ldest := dest
865          csBundle(2).uopIdx := 2.U
866        }
867        when(vsew === VSew.e32) {
868          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
869          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
870          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
871          csBundle(1).vpu.fpu.isFoldTo1_2 := true.B
872          csBundle(1).uopIdx := 1.U
873          csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U
874          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
875          csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U
876          csBundle(2).vpu.fpu.isFoldTo1_4 := true.B
877          csBundle(2).uopIdx := 2.U
878          csBundle(3).lsrc(0) := src1
879          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
880          csBundle(3).ldest := dest
881          csBundle(3).uopIdx := 3.U
882        }
883        when(vsew === VSew.e16) {
884          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
885          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
886          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
887          csBundle(1).vpu.fpu.isFoldTo1_2 := true.B
888          csBundle(1).uopIdx := 1.U
889          csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U
890          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
891          csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U
892          csBundle(2).vpu.fpu.isFoldTo1_4 := true.B
893          csBundle(2).uopIdx := 2.U
894          csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U
895          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
896          csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U
897          csBundle(3).vpu.fpu.isFoldTo1_8 := true.B
898          csBundle(3).uopIdx := 3.U
899          csBundle(4).lsrc(0) := src1
900          csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U
901          csBundle(4).ldest := dest
902          csBundle(4).uopIdx := 4.U
903        }
904      }
905      when(vlmul === VLmul.m1) {
906        when(vsew === VSew.e64) {
907          csBundle(0).lsrc(0) := src2
908          csBundle(0).lsrc(1) := src2
909          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
910          csBundle(0).vpu.fpu.isFoldTo1_2 := true.B
911          csBundle(0).uopIdx := 0.U
912          csBundle(1).lsrc(0) := src1
913          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
914          csBundle(1).ldest := dest
915          csBundle(1).uopIdx := 1.U
916        }
917        when(vsew === VSew.e32) {
918          csBundle(0).lsrc(0) := src2
919          csBundle(0).lsrc(1) := src2
920          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
921          csBundle(0).vpu.fpu.isFoldTo1_2 := true.B
922          csBundle(0).uopIdx := 0.U
923          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
924          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
925          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
926          csBundle(1).vpu.fpu.isFoldTo1_4 := true.B
927          csBundle(1).uopIdx := 1.U
928          csBundle(2).lsrc(0) := src1
929          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
930          csBundle(2).ldest := dest
931          csBundle(2).uopIdx := 2.U
932        }
933        when(vsew === VSew.e16) {
934          csBundle(0).lsrc(0) := src2
935          csBundle(0).lsrc(1) := src2
936          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
937          csBundle(0).vpu.fpu.isFoldTo1_2 := true.B
938          csBundle(0).uopIdx := 0.U
939          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
940          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
941          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
942          csBundle(1).vpu.fpu.isFoldTo1_4 := true.B
943          csBundle(1).uopIdx := 1.U
944          csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U
945          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
946          csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U
947          csBundle(2).vpu.fpu.isFoldTo1_8 := true.B
948          csBundle(2).uopIdx := 2.U
949          csBundle(3).lsrc(0) := src1
950          csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U
951          csBundle(3).ldest := dest
952          csBundle(3).uopIdx := 3.U
953        }
954      }
955      when(vlmul === VLmul.mf2) {
956        when(vsew === VSew.e32) {
957          csBundle(0).lsrc(0) := src2
958          csBundle(0).lsrc(1) := src2
959          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
960          csBundle(0).vpu.fpu.isFoldTo1_4 := true.B
961          csBundle(0).uopIdx := 0.U
962          csBundle(1).lsrc(0) := src1
963          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
964          csBundle(1).ldest := dest
965          csBundle(1).uopIdx := 1.U
966        }
967        when(vsew === VSew.e16) {
968          csBundle(0).lsrc(0) := src2
969          csBundle(0).lsrc(1) := src2
970          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
971          csBundle(0).vpu.fpu.isFoldTo1_4 := true.B
972          csBundle(0).uopIdx := 0.U
973          csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U
974          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
975          csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U
976          csBundle(1).vpu.fpu.isFoldTo1_8 := true.B
977          csBundle(1).uopIdx := 1.U
978          csBundle(2).lsrc(0) := src1
979          csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U
980          csBundle(2).ldest := dest
981          csBundle(2).uopIdx := 2.U
982        }
983      }
984      when(vlmul === VLmul.mf4) {
985        when(vsew === VSew.e16) {
986          csBundle(0).lsrc(0) := src2
987          csBundle(0).lsrc(1) := src2
988          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
989          csBundle(0).vpu.fpu.isFoldTo1_8 := true.B
990          csBundle(0).uopIdx := 0.U
991          csBundle(1).lsrc(0) := src1
992          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
993          csBundle(1).ldest := dest
994          csBundle(1).uopIdx := 1.U
995        }
996      }
997    }
998
999    is(UopSplitType.VEC_SLIDEUP) {
1000      // FMV.D.X
1001      csBundle(0).srcType(0) := SrcType.reg
1002      csBundle(0).srcType(1) := SrcType.imm
1003      csBundle(0).lsrc(1) := 0.U
1004      csBundle(0).ldest := FP_TMP_REG_MV.U
1005      csBundle(0).fuType := FuType.i2f.U
1006      csBundle(0).rfWen := false.B
1007      csBundle(0).fpWen := true.B
1008      csBundle(0).vecWen := false.B
1009      csBundle(0).fpu.isAddSub := false.B
1010      csBundle(0).fpu.typeTagIn := FPU.D
1011      csBundle(0).fpu.typeTagOut := FPU.D
1012      csBundle(0).fpu.fromInt := true.B
1013      csBundle(0).fpu.wflags := false.B
1014      csBundle(0).fpu.fpWen := true.B
1015      csBundle(0).fpu.div := false.B
1016      csBundle(0).fpu.sqrt := false.B
1017      csBundle(0).fpu.fcvt := false.B
1018      // LMUL
1019      for (i <- 0 until MAX_VLMUL)
1020        for (j <- 0 to i) {
1021          val old_vd = if (j == 0) {
1022            dest + i.U
1023          } else (VECTOR_TMP_REG_LMUL + j - 1).U
1024          val vd = if (j == i) {
1025            dest + i.U
1026          } else (VECTOR_TMP_REG_LMUL + j).U
1027          csBundle(i * (i + 1) / 2 + j + 1).srcType(0) := SrcType.fp
1028          csBundle(i * (i + 1) / 2 + j + 1).lsrc(0) := FP_TMP_REG_MV.U
1029          csBundle(i * (i + 1) / 2 + j + 1).lsrc(1) := src2 + j.U
1030          csBundle(i * (i + 1) / 2 + j + 1).lsrc(2) := old_vd
1031          csBundle(i * (i + 1) / 2 + j + 1).ldest := vd
1032          csBundle(i * (i + 1) / 2 + j + 1).uopIdx := (i * (i + 1) / 2 + j).U
1033        }
1034    }
1035
1036    is(UopSplitType.VEC_ISLIDEUP) {
1037      // LMUL
1038      for (i <- 0 until MAX_VLMUL)
1039        for (j <- 0 to i) {
1040          val old_vd = if (j == 0) {
1041            dest + i.U
1042          } else (VECTOR_TMP_REG_LMUL + j - 1).U
1043          val vd = if (j == i) {
1044            dest + i.U
1045          } else (VECTOR_TMP_REG_LMUL + j).U
1046          csBundle(i * (i + 1) / 2 + j).lsrc(1) := src2 + j.U
1047          csBundle(i * (i + 1) / 2 + j).lsrc(2) := old_vd
1048          csBundle(i * (i + 1) / 2 + j).ldest := vd
1049          csBundle(i * (i + 1) / 2 + j).uopIdx := (i * (i + 1) / 2 + j).U
1050        }
1051    }
1052
1053    is(UopSplitType.VEC_SLIDEDOWN) {
1054      // FMV.D.X
1055      csBundle(0).srcType(0) := SrcType.reg
1056      csBundle(0).srcType(1) := SrcType.imm
1057      csBundle(0).lsrc(1) := 0.U
1058      csBundle(0).ldest := FP_TMP_REG_MV.U
1059      csBundle(0).fuType := FuType.i2f.U
1060      csBundle(0).rfWen := false.B
1061      csBundle(0).fpWen := true.B
1062      csBundle(0).vecWen := false.B
1063      csBundle(0).fpu.isAddSub := false.B
1064      csBundle(0).fpu.typeTagIn := FPU.D
1065      csBundle(0).fpu.typeTagOut := FPU.D
1066      csBundle(0).fpu.fromInt := true.B
1067      csBundle(0).fpu.wflags := false.B
1068      csBundle(0).fpu.fpWen := true.B
1069      csBundle(0).fpu.div := false.B
1070      csBundle(0).fpu.sqrt := false.B
1071      csBundle(0).fpu.fcvt := false.B
1072      // LMUL
1073      for (i <- 0 until MAX_VLMUL)
1074        for (j <- (0 to i).reverse) {
1075          when(i.U < lmul) {
1076            val old_vd = if (j == 0) {
1077              dest + lmul - 1.U - i.U
1078            } else (VECTOR_TMP_REG_LMUL + j - 1).U
1079            val vd = if (j == i) {
1080              dest + lmul - 1.U - i.U
1081            } else (VECTOR_TMP_REG_LMUL + j).U
1082            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).srcType(0) := SrcType.fp
1083            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).lsrc(0) := FP_TMP_REG_MV.U
1084            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).lsrc(1) := src2 + lmul - 1.U - j.U
1085            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).lsrc(2) := old_vd
1086            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).ldest := vd
1087            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).uopIdx := numOfUop - (i * (i + 1) / 2 + i - j + 2).U
1088          }
1089        }
1090    }
1091
1092    is(UopSplitType.VEC_ISLIDEDOWN) {
1093      // LMUL
1094      for (i <- 0 until MAX_VLMUL)
1095        for (j <- (0 to i).reverse) {
1096          when(i.U < lmul) {
1097            val old_vd = if (j == 0) {
1098              dest + lmul - 1.U - i.U
1099            } else (VECTOR_TMP_REG_LMUL + j - 1).U
1100            val vd = if (j == i) {
1101              dest + lmul - 1.U - i.U
1102            } else (VECTOR_TMP_REG_LMUL + j).U
1103            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).lsrc(1) := src2 + lmul - 1.U - j.U
1104            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).lsrc(2) := old_vd
1105            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).ldest := vd
1106            csBundle(numOfUop - (i * (i + 1) / 2 + i - j + 1).U).uopIdx := numOfUop - (i * (i + 1) / 2 + i - j + 1).U
1107          }
1108        }
1109    }
1110
1111    is(UopSplitType.VEC_M0X) {
1112      // LMUL
1113      for (i <- 0 until MAX_VLMUL) {
1114        val srcType0 = if (i == 0) SrcType.DC else SrcType.vp
1115        val ldest = (VECTOR_TMP_REG_LMUL + i).U
1116        csBundle(i).srcType(0) := srcType0
1117        csBundle(i).srcType(1) := SrcType.vp
1118        csBundle(i).rfWen := false.B
1119        csBundle(i).vecWen := true.B
1120        csBundle(i).lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
1121        csBundle(i).lsrc(1) := src2
1122        // csBundle(i).lsrc(2) := dest + i.U  DontCare
1123        csBundle(i).ldest := ldest
1124        csBundle(i).uopIdx := i.U
1125      }
1126      csBundle(lmul - 1.U).vecWen := false.B
1127      csBundle(lmul - 1.U).fpWen := true.B
1128      csBundle(lmul - 1.U).ldest := FP_TMP_REG_MV.U
1129      // FMV_X_D
1130      csBundle(lmul).srcType(0) := SrcType.fp
1131      csBundle(lmul).srcType(1) := SrcType.imm
1132      csBundle(lmul).lsrc(0) := FP_TMP_REG_MV.U
1133      csBundle(lmul).lsrc(1) := 0.U
1134      csBundle(lmul).ldest := dest
1135      csBundle(lmul).fuType := FuType.fmisc.U
1136      csBundle(lmul).rfWen := true.B
1137      csBundle(lmul).fpWen := false.B
1138      csBundle(lmul).vecWen := false.B
1139      csBundle(lmul).fpu.isAddSub := false.B
1140      csBundle(lmul).fpu.typeTagIn := FPU.D
1141      csBundle(lmul).fpu.typeTagOut := FPU.D
1142      csBundle(lmul).fpu.fromInt := false.B
1143      csBundle(lmul).fpu.wflags := false.B
1144      csBundle(lmul).fpu.fpWen := false.B
1145      csBundle(lmul).fpu.div := false.B
1146      csBundle(lmul).fpu.sqrt := false.B
1147      csBundle(lmul).fpu.fcvt := false.B
1148    }
1149
1150    is(UopSplitType.VEC_MVV) {
1151      // LMUL
1152      for (i <- 0 until MAX_VLMUL) {
1153        val srcType0 = if (i == 0) SrcType.DC else SrcType.vp
1154        csBundle(i * 2 + 0).srcType(0) := srcType0
1155        csBundle(i * 2 + 0).srcType(1) := SrcType.vp
1156        csBundle(i * 2 + 0).lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
1157        csBundle(i * 2 + 0).lsrc(1) := src2
1158        csBundle(i * 2 + 0).lsrc(2) := dest + i.U
1159        csBundle(i * 2 + 0).ldest := dest + i.U
1160        csBundle(i * 2 + 0).uopIdx := (i * 2 + 0).U
1161
1162        csBundle(i * 2 + 1).srcType(0) := srcType0
1163        csBundle(i * 2 + 1).srcType(1) := SrcType.vp
1164        csBundle(i * 2 + 1).lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
1165        csBundle(i * 2 + 1).lsrc(1) := src2
1166        // csBundle(i).lsrc(2) := dest + i.U  DontCare
1167        csBundle(i * 2 + 1).ldest := (VECTOR_TMP_REG_LMUL + i).U
1168        csBundle(i * 2 + 1).uopIdx := (i * 2 + 1).U
1169      }
1170    }
1171
1172    is(UopSplitType.VEC_M0X_VFIRST) {
1173      // LMUL
1174      csBundle(0).rfWen := false.B
1175      csBundle(0).fpWen := true.B
1176      csBundle(0).ldest := FP_TMP_REG_MV.U
1177      // FMV_X_D
1178      csBundle(1).srcType(0) := SrcType.fp
1179      csBundle(1).srcType(1) := SrcType.imm
1180      csBundle(1).lsrc(0) := FP_TMP_REG_MV.U
1181      csBundle(1).lsrc(1) := 0.U
1182      csBundle(1).ldest := dest
1183      csBundle(1).fuType := FuType.fmisc.U
1184      csBundle(1).rfWen := true.B
1185      csBundle(1).fpWen := false.B
1186      csBundle(1).vecWen := false.B
1187      csBundle(1).fpu.isAddSub := false.B
1188      csBundle(1).fpu.typeTagIn := FPU.D
1189      csBundle(1).fpu.typeTagOut := FPU.D
1190      csBundle(1).fpu.fromInt := false.B
1191      csBundle(1).fpu.wflags := false.B
1192      csBundle(1).fpu.fpWen := false.B
1193      csBundle(1).fpu.div := false.B
1194      csBundle(1).fpu.sqrt := false.B
1195      csBundle(1).fpu.fcvt := false.B
1196    }
1197    is(UopSplitType.VEC_VWW) {
1198      for (i <- 0 until MAX_VLMUL*2) {
1199        when(i.U < lmul){
1200          csBundle(i).srcType(2) := SrcType.DC
1201          csBundle(i).lsrc(0) := src2 + i.U
1202          csBundle(i).lsrc(1) := src2 + i.U
1203          // csBundle(i).lsrc(2) := dest + (2 * i).U
1204          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
1205          csBundle(i).uopIdx :=  i.U
1206        } otherwise {
1207          csBundle(i).srcType(2) := SrcType.DC
1208          csBundle(i).lsrc(0) := VECTOR_TMP_REG_LMUL.U + Cat((i.U-lmul),0.U(1.W)) + 1.U
1209          csBundle(i).lsrc(1) := VECTOR_TMP_REG_LMUL.U + Cat((i.U-lmul),0.U(1.W))
1210          // csBundle(i).lsrc(2) := dest + (2 * i).U
1211          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
1212          csBundle(i).uopIdx := i.U
1213        }
1214        csBundle(numOfUop-1.U).srcType(2) := SrcType.vp
1215        csBundle(numOfUop-1.U).lsrc(0) := src1
1216        csBundle(numOfUop-1.U).lsrc(2) := dest
1217        csBundle(numOfUop-1.U).ldest := dest
1218      }
1219    }
1220    is(UopSplitType.VEC_RGATHER) {
1221      def genCsBundle_VEC_RGATHER(len:Int): Unit ={
1222        for (i <- 0 until len)
1223          for (j <- 0 until len) {
1224            // csBundle(i * len + j).srcType(0) := SrcType.vp // SrcType.imm
1225            // csBundle(i * len + j).srcType(1) := SrcType.vp
1226            // csBundle(i * len + j).srcType(2) := SrcType.vp
1227            csBundle(i * len + j).lsrc(0) := src1 + i.U
1228            csBundle(i * len + j).lsrc(1) := src2 + j.U
1229            val vd_old = if(j==0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j - 1).U
1230            csBundle(i * len + j).lsrc(2) := vd_old
1231            val vd = if(j==len-1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
1232            csBundle(i * len + j).ldest := vd
1233            csBundle(i * len + j).uopIdx := (i * len + j).U
1234          }
1235      }
1236      switch(simple.io.enq.vtype.vlmul) {
1237        is("b001".U ){
1238          genCsBundle_VEC_RGATHER(2)
1239        }
1240        is("b010".U ){
1241          genCsBundle_VEC_RGATHER(4)
1242        }
1243        is("b011".U ){
1244          genCsBundle_VEC_RGATHER(8)
1245        }
1246      }
1247    }
1248    is(UopSplitType.VEC_RGATHER_VX) {
1249      def genCsBundle_RGATHER_VX(len:Int): Unit ={
1250        for (i <- 0 until len)
1251          for (j <- 0 until len) {
1252            csBundle(i * len + j + 1).srcType(0) := SrcType.fp
1253            // csBundle(i * len + j + 1).srcType(1) := SrcType.vp
1254            // csBundle(i * len + j + 1).srcType(2) := SrcType.vp
1255            csBundle(i * len + j + 1).lsrc(0) := FP_TMP_REG_MV.U
1256            csBundle(i * len + j + 1).lsrc(1) := src2 + j.U
1257            val vd_old = if(j==0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j - 1).U
1258            csBundle(i * len + j + 1).lsrc(2) := vd_old
1259            val vd = if(j==len-1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
1260            csBundle(i * len + j + 1).ldest := vd
1261            csBundle(i * len + j + 1).uopIdx := (i * len + j).U
1262          }
1263      }
1264      // FMV.D.X
1265      csBundle(0).srcType(0) := SrcType.reg
1266      csBundle(0).srcType(1) := SrcType.imm
1267      csBundle(0).lsrc(1) := 0.U
1268      csBundle(0).ldest := FP_TMP_REG_MV.U
1269      csBundle(0).fuType := FuType.i2f.U
1270      csBundle(0).rfWen := false.B
1271      csBundle(0).fpWen := true.B
1272      csBundle(0).vecWen := false.B
1273      csBundle(0).fpu.isAddSub := false.B
1274      csBundle(0).fpu.typeTagIn := FPU.D
1275      csBundle(0).fpu.typeTagOut := FPU.D
1276      csBundle(0).fpu.fromInt := true.B
1277      csBundle(0).fpu.wflags := false.B
1278      csBundle(0).fpu.fpWen := true.B
1279      csBundle(0).fpu.div := false.B
1280      csBundle(0).fpu.sqrt := false.B
1281      csBundle(0).fpu.fcvt := false.B
1282      switch(simple.io.enq.vtype.vlmul) {
1283        is("b000".U ){
1284          genCsBundle_RGATHER_VX(1)
1285        }
1286        is("b001".U ){
1287          genCsBundle_RGATHER_VX(2)
1288        }
1289        is("b010".U ){
1290          genCsBundle_RGATHER_VX(4)
1291        }
1292        is("b011".U ){
1293          genCsBundle_RGATHER_VX(8)
1294        }
1295      }
1296    }
1297    is(UopSplitType.VEC_RGATHEREI16) {
1298      def genCsBundle_VEC_RGATHEREI16_SEW8(len:Int): Unit ={
1299        for (i <- 0 until len)
1300          for (j <- 0 until len) {
1301            val vd_old0 = if(j==0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j*2-1).U
1302            val vd0 = (VECTOR_TMP_REG_LMUL + j*2 ).U
1303            // csBundle(i * len + j).srcType(0) := SrcType.vp // SrcType.imm
1304            // csBundle(i * len + j).srcType(1) := SrcType.vp
1305            // csBundle(i * len + j).srcType(2) := SrcType.vp
1306            csBundle((i * len + j)*2+0).lsrc(0) := src1 + (i*2+0).U
1307            csBundle((i * len + j)*2+0).lsrc(1) := src2 + j.U
1308            csBundle((i * len + j)*2+0).lsrc(2) := vd_old0
1309            csBundle((i * len + j)*2+0).ldest := vd0
1310            csBundle((i * len + j)*2+0).uopIdx := ((i * len + j)*2+0).U
1311            val vd_old1 = (VECTOR_TMP_REG_LMUL + j*2).U
1312            val vd1 = if(j==len-1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j*2+1 ).U
1313            csBundle((i * len + j)*2+1).lsrc(0) := src1 + (i*2+1).U
1314            csBundle((i * len + j)*2+1).lsrc(1) := src2 + j.U
1315            csBundle((i * len + j)*2+1).lsrc(2) := vd_old1
1316            csBundle((i * len + j)*2+1).ldest := vd1
1317            csBundle((i * len + j)*2+1).uopIdx := ((i * len + j)*2+1).U
1318          }
1319      }
1320      def genCsBundle_VEC_RGATHEREI16(len:Int): Unit ={
1321        for (i <- 0 until len)
1322          for (j <- 0 until len) {
1323            val vd_old = if(j==0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j-1).U
1324            val vd = if(j==len-1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
1325            // csBundle(i * len + j).srcType(0) := SrcType.vp // SrcType.imm
1326            // csBundle(i * len + j).srcType(1) := SrcType.vp
1327            // csBundle(i * len + j).srcType(2) := SrcType.vp
1328            csBundle(i * len + j).lsrc(0) := src1 + i.U
1329            csBundle(i * len + j).lsrc(1) := src2 + j.U
1330            csBundle(i * len + j).lsrc(2) := vd_old
1331            csBundle(i * len + j).ldest := vd
1332            csBundle(i * len + j).uopIdx := (i * len + j).U
1333          }
1334      }
1335      switch(simple.io.enq.vtype.vlmul) {
1336        is("b000".U ){
1337          when(!simple.io.enq.vtype.vsew.orR){
1338            genCsBundle_VEC_RGATHEREI16_SEW8(1)
1339          } .otherwise{
1340            genCsBundle_VEC_RGATHEREI16(1)
1341          }
1342        }
1343        is("b001".U) {
1344          when(!simple.io.enq.vtype.vsew.orR) {
1345            genCsBundle_VEC_RGATHEREI16_SEW8(2)
1346          }.otherwise {
1347            genCsBundle_VEC_RGATHEREI16(2)
1348          }
1349        }
1350        is("b010".U) {
1351          when(!simple.io.enq.vtype.vsew.orR) {
1352            genCsBundle_VEC_RGATHEREI16_SEW8(4)
1353          }.otherwise {
1354            genCsBundle_VEC_RGATHEREI16(4)
1355          }
1356        }
1357        is("b011".U) {
1358          genCsBundle_VEC_RGATHEREI16(8)
1359        }
1360      }
1361    }
1362    is(UopSplitType.VEC_COMPRESS) {
1363      def genCsBundle_VEC_COMPRESS(len:Int): Unit ={
1364        for (i <- 0 until len){
1365          val jlen = if (i == len-1) i+1 else i+2
1366          for (j <- 0 until jlen) {
1367            val vd_old = if(i==j) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j + 1).U
1368            val vd = if(i==len-1) (dest + j.U) else{
1369              if (j == i+1) VECTOR_TMP_REG_LMUL.U else (VECTOR_TMP_REG_LMUL + j + 1).U
1370            }
1371            val src23Type = if (j == i+1) DontCare else SrcType.vp
1372            csBundle(i*(i+3)/2 + j).srcType(0) := SrcType.vp
1373            csBundle(i*(i+3)/2 + j).srcType(1) := src23Type
1374            csBundle(i*(i+3)/2 + j).srcType(2) := src23Type
1375            csBundle(i*(i+3)/2 + j).lsrc(0) := src1
1376            csBundle(i*(i+3)/2 + j).lsrc(1) := src2 + i.U
1377            csBundle(i*(i+3)/2 + j).lsrc(2) := vd_old
1378            // csBundle(i*(i+3)/2 + j).lsrc(3) := VECTOR_TMP_REG_LMUL.U
1379            csBundle(i*(i+3)/2 + j).ldest := vd
1380            csBundle(i*(i+3)/2 + j).uopIdx := (i*(i+3)/2 + j).U
1381          }
1382        }
1383      }
1384      switch(simple.io.enq.vtype.vlmul) {
1385        is("b001".U ){
1386          genCsBundle_VEC_COMPRESS(2)
1387        }
1388        is("b010".U ){
1389          genCsBundle_VEC_COMPRESS(4)
1390        }
1391        is("b011".U ){
1392          genCsBundle_VEC_COMPRESS(8)
1393        }
1394      }
1395    }
1396    is(UopSplitType.VEC_US_LD) {
1397      /*
1398      FMV.D.X
1399       */
1400      csBundle(0).srcType(0) := SrcType.reg
1401      csBundle(0).srcType(1) := SrcType.imm
1402      csBundle(0).lsrc(1) := 0.U
1403      csBundle(0).ldest := FP_TMP_REG_MV.U
1404      csBundle(0).fuType := FuType.i2f.U
1405      csBundle(0).rfWen := false.B
1406      csBundle(0).fpWen := true.B
1407      csBundle(0).vecWen := false.B
1408      csBundle(0).fpu.isAddSub := false.B
1409      csBundle(0).fpu.typeTagIn := FPU.D
1410      csBundle(0).fpu.typeTagOut := FPU.D
1411      csBundle(0).fpu.fromInt := true.B
1412      csBundle(0).fpu.wflags := false.B
1413      csBundle(0).fpu.fpWen := true.B
1414      csBundle(0).fpu.div := false.B
1415      csBundle(0).fpu.sqrt := false.B
1416      csBundle(0).fpu.fcvt := false.B
1417      //LMUL
1418      for (i <- 0 until MAX_VLMUL) {
1419        csBundle(i + 1).srcType(0) := SrcType.fp
1420        csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U
1421        csBundle(i + 1).ldest := dest + i.U
1422        csBundle(i + 1).uopIdx := i.U
1423      }
1424    }
1425  }
1426
1427  //uops dispatch
1428  val s_normal :: s_ext :: Nil = Enum(2)
1429  val state = RegInit(s_normal)
1430  val state_next = WireDefault(state)
1431  val uopRes = RegInit(0.U)
1432
1433  //readyFromRename Counter
1434  val readyCounter = PriorityMuxDefault(io.readyFromRename.map(x => !x).zip((0 to (RenameWidth - 1)).map(_.U)), RenameWidth.U)
1435
1436  switch(state) {
1437    is(s_normal) {
1438      state_next := Mux(io.validFromIBuf(0) && (numOfUop > readyCounter) && (readyCounter =/= 0.U), s_ext, s_normal)
1439    }
1440    is(s_ext) {
1441      state_next := Mux(io.validFromIBuf(0) && (uopRes > readyCounter), s_ext, s_normal)
1442    }
1443  }
1444
1445  state := state_next
1446
1447  val uopRes0 = Mux(state === s_normal, numOfUop, uopRes)
1448  val uopResJudge = Mux(state === s_normal,
1449    io.validFromIBuf(0) && (readyCounter =/= 0.U) && (uopRes0 > readyCounter),
1450    io.validFromIBuf(0) && (uopRes0 > readyCounter))
1451  uopRes := Mux(uopResJudge, uopRes0 - readyCounter, 0.U)
1452
1453  for(i <- 0 until RenameWidth) {
1454    decodedInsts(i) := MuxCase(csBundle(i), Seq(
1455      (state === s_normal) -> csBundle(i),
1456      (state === s_ext) -> Mux((i.U + numOfUop -uopRes) < maxUopSize.U, csBundle(i.U + numOfUop - uopRes), csBundle(maxUopSize - 1))
1457    ))
1458  }
1459
1460
1461  val validSimple = Wire(Vec(DecodeWidth - 1, Bool()))
1462  validSimple.zip(io.validFromIBuf.drop(1).zip(io.isComplex)).map{ case (dst, (src1, src2)) => dst := src1 && !src2 }
1463  val notInf = Wire(Vec(DecodeWidth - 1, Bool()))
1464  notInf.zip(io.validFromIBuf.drop(1).zip(validSimple)).map{ case (dst, (src1, src2)) => dst := !src1 || src2 }
1465  val notInfVec = Wire(Vec(DecodeWidth, Bool()))
1466  notInfVec.drop(1).zip(0 until DecodeWidth - 1).map{ case (dst, i) => dst := Cat(notInf.take(i + 1)).andR}
1467  notInfVec(0) := true.B
1468
1469  complexNum := Mux(io.validFromIBuf(0) && readyCounter.orR ,
1470    Mux(uopRes0 > readyCounter, readyCounter, uopRes0),
1471    1.U)
1472  validToRename.zipWithIndex.foreach{
1473    case(dst, i) =>
1474      dst := MuxCase(false.B, Seq(
1475        (io.validFromIBuf(0) && uopRes0 > readyCounter   ) -> Mux(readyCounter > i.U, true.B, false.B),
1476        (io.validFromIBuf(0) && !(uopRes0 > readyCounter)) -> Mux(complexNum > i.U, true.B, validSimple(i.U - complexNum) && notInfVec(i.U - complexNum) && io.readyFromRename(i)),
1477      ))
1478  }
1479
1480  readyToIBuf.zipWithIndex.foreach {
1481    case (dst, i) =>
1482      dst := MuxCase(true.B, Seq(
1483        (io.validFromIBuf(0) && uopRes0 > readyCounter) -> false.B,
1484        (io.validFromIBuf(0) && !(uopRes0 > readyCounter)) -> (if (i==0) true.B else Mux(RenameWidth.U - complexNum >= i.U, notInfVec(i - 1) && validSimple(i - 1) && io.readyFromRename(i), false.B)),
1485      ))
1486  }
1487
1488  io.deq.decodedInsts := decodedInsts
1489  io.deq.isVset := isVsetSimple
1490  io.deq.complexNum := complexNum
1491  io.deq.validToRename := validToRename
1492  io.deq.readyToIBuf := readyToIBuf
1493
1494}
1495