/***************************************************************************************
 * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
 * Copyright (c) 2020-2021 Peng Cheng Laboratory
 *
 * XiangShan is licensed under Mulan PSL v2.
 * You can use this software according to the terms and conditions of the Mulan PSL v2.
 * You may obtain a copy of Mulan PSL v2 at:
 *          http://license.coscl.org.cn/MulanPSL2
 *
 * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
 * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
 * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
 *
 * See the Mulan PSL v2 for more details.
 ***************************************************************************************/

package xiangshan.backend.decode

import chipsalliance.rocketchip.config.Parameters
import chisel3._
import chisel3.util._
import freechips.rocketchip.rocket.Instructions
import freechips.rocketchip.util.uintToBitPat
import utils._
import utility._
import xiangshan.ExceptionNO.illegalInstr
import xiangshan._
import xiangshan.backend.fu.fpu.FPU
import xiangshan.backend.fu.FuType
import freechips.rocketchip.rocket.Instructions._
import xiangshan.backend.Bundles.{DecodedInst, StaticInst}
import xiangshan.backend.decode.isa.bitfield.XSInstBitFields
import xiangshan.backend.fu.vector.Bundles.{VSew, VType, VLmul}
import yunsuan.VpermType

import scala.collection.Seq

/**
  * Elaboration-time constants shared by the complex (multi-uop) decoder.
  *
  *  - `MAX_VLMUL` bounds the per-register loops that expand one vector
  *    instruction into several uops.
  *  - `FP_TMP_REG_MV` is the logical register index written by the leading
  *    int-to-fp move uop and read back by the uops that follow it.
  *  - `VECTOR_TMP_REG_LMUL` is the first logical index of the temporary vector
  *    registers used to hold intermediate results between uops.
  */
trait VectorConstants {
  val MAX_VLMUL = 8
  val FP_TMP_REG_MV = 32
  val VECTOR_TMP_REG_LMUL = 33 // 33~47 -> 15
}

/**
  * IO bundle of [[DecodeUnitComp]].
  *
  * Inputs:
  *  - `enq.staticInst`: the instruction to be decoded and split.
  *  - `vtype`: vector type state, forwarded to the inner `DecodeUnit`.
  *  - `csrCtrl`: custom CSR controls, forwarded to the inner `DecodeUnit`.
  *  - `isComplex`, `validFromIBuf`, `readyFromRename`: handshake/status vectors
  *    NOTE(review): their consumers are outside the portion of the file reviewed
  *    here; presumably they drive the uop dispatch state machine — confirm.
  *
  * Outputs (`deq`):
  *  - `decodedInsts` / `validToRename`: one slot per rename port.
  *  - `readyToIBuf`: one ready bit per decode port.
  *  - `isVset`, `complexNum`: status outputs (3-bit count for `complexNum`).
  *
  * The declaration order of the fields is part of the hardware interface and
  * must not be changed.
  */
class DecodeUnitCompIO(implicit p: Parameters) extends XSBundle {
  val enq = new Bundle { val staticInst = Input(new StaticInst) }
  val vtype = Input(new VType)
  val isComplex = Input(Vec(DecodeWidth - 1, Bool()))
  val validFromIBuf = Input(Vec(DecodeWidth, Bool()))
  val readyFromRename = Input(Vec(RenameWidth, Bool()))
  val deq = new Bundle {
    val decodedInsts = Output(Vec(RenameWidth, new DecodedInst))
    val isVset = Output(Bool())
    val readyToIBuf = Output(Vec(DecodeWidth, Bool()))
    val validToRename = Output(Vec(RenameWidth, Bool()))
    val complexNum = Output(UInt(3.W))
  }
  val csrCtrl = Input(new CustomCSRCtrlIO)
}

/**
  * @author zly
  */
class DecodeUnitComp()(implicit p : Parameters) extends XSModule with DecodeUnitConstants with VectorConstants {
  val io = IO(new DecodeUnitCompIO)

  val maxUopSize = MaxUopSize
  //input bits
  val staticInst = Wire(new StaticInst)


  staticInst := io.enq.staticInst
  private val inst: XSInstBitFields = staticInst.instr.asTypeOf(new XSInstBitFields)

  // Register fields of the instruction, each prefixed with a single zero bit.
  val src1 = Cat(0.U(1.W), inst.RS1)
  val src2 = Cat(0.U(1.W), inst.RS2)
  val dest = Cat(0.U(1.W), inst.RD)


  //output bits
  val decodedInsts = Wire(Vec(RenameWidth, new DecodedInst))
  val validToRename = Wire(Vec(RenameWidth, Bool()))
  val readyToIBuf = Wire(Vec(DecodeWidth, Bool()))
  val complexNum = Wire(UInt(3.W))

  //output of DecodeUnit
  val decodedInstsSimple = Wire(new DecodedInst)
  val numOfUop = Wire(UInt(log2Up(maxUopSize+1).W))
  val lmul = Wire(UInt(4.W))
  val isVsetSimple = Wire(Bool())

  //pre decode
  val simple = Module(new DecodeUnit)
  simple.io.enq.ctrlFlow := staticInst
  simple.io.enq.vtype := io.vtype
  simple.io.csrCtrl := io.csrCtrl
  decodedInstsSimple := simple.io.deq.decodedInst
  lmul := simple.io.deq.uopInfo.lmul
  isVsetSimple := simple.io.deq.decodedInst.isVset
  // For vset* instructions the fuOpType is rewritten according to which of
  // rd / rs1 are register 0, and an illegal vtype forces a pipeline flush.
  when(isVsetSimple) {
    when(dest === 0.U && src1 === 0.U) {
      decodedInstsSimple.fuOpType := VSETOpType.keepVl(simple.io.deq.decodedInst.fuOpType)
    }.elsewhen(src1 === 0.U) {
      decodedInstsSimple.fuOpType := VSETOpType.setVlmax(simple.io.deq.decodedInst.fuOpType)
    }
    when(io.vtype.illegal){
      decodedInstsSimple.flushPipe := true.B
    }
  }
  //Type of uop Div
  val typeOfSplit =
decodedInstsSimple.uopSplitType 111 112 when(typeOfSplit === UopSplitType.DIR) { 113 numOfUop := Mux(dest =/= 0.U, 2.U, 114 Mux(src1 =/= 0.U, 1.U, 115 Mux(VSETOpType.isVsetvl(decodedInstsSimple.fuOpType), 2.U, 1.U))) 116 } .otherwise { 117 numOfUop := simple.io.deq.uopInfo.numOfUop 118 } 119 120 121 //uop div up to maxUopSize 122 val csBundle = Wire(Vec(maxUopSize, new DecodedInst)) 123 csBundle.map { case dst => 124 dst := decodedInstsSimple 125 dst.firstUop := false.B 126 dst.lastUop := false.B 127 } 128 129 csBundle(0).numUops := numOfUop 130 csBundle(0).firstUop := true.B 131 csBundle(numOfUop - 1.U).lastUop := true.B 132 133 switch(typeOfSplit) { 134 is(UopSplitType.DIR) { 135 when(isVsetSimple) { 136 when(dest =/= 0.U) { 137 csBundle(0).fuType := FuType.vsetiwi.U 138 csBundle(0).fuOpType := VSETOpType.switchDest(decodedInstsSimple.fuOpType) 139 csBundle(0).flushPipe := false.B 140 csBundle(0).rfWen := true.B 141 csBundle(0).vecWen := false.B 142 csBundle(1).ldest := VCONFIG_IDX.U 143 csBundle(1).rfWen := false.B 144 csBundle(1).vecWen := true.B 145 }.elsewhen(src1 =/= 0.U) { 146 csBundle(0).ldest := VCONFIG_IDX.U 147 }.elsewhen(VSETOpType.isVsetvli(decodedInstsSimple.fuOpType)) { 148 csBundle(0).fuType := FuType.vsetfwf.U 149 csBundle(0).srcType(0) := SrcType.vp 150 csBundle(0).lsrc(0) := VCONFIG_IDX.U 151 }.elsewhen(VSETOpType.isVsetvl(decodedInstsSimple.fuOpType)) { 152 csBundle(0).srcType(0) := SrcType.reg 153 csBundle(0).srcType(1) := SrcType.imm 154 csBundle(0).lsrc(1) := 0.U 155 csBundle(0).ldest := FP_TMP_REG_MV.U 156 csBundle(0).fuType := FuType.i2f.U 157 csBundle(0).rfWen := false.B 158 csBundle(0).fpWen := true.B 159 csBundle(0).vecWen := false.B 160 csBundle(0).fpu.isAddSub := false.B 161 csBundle(0).fpu.typeTagIn := FPU.D 162 csBundle(0).fpu.typeTagOut := FPU.D 163 csBundle(0).fpu.fromInt := true.B 164 csBundle(0).fpu.wflags := false.B 165 csBundle(0).fpu.fpWen := true.B 166 csBundle(0).fpu.div := false.B 167 csBundle(0).fpu.sqrt := false.B 168 
csBundle(0).fpu.fcvt := false.B 169 csBundle(0).flushPipe := false.B 170 csBundle(1).fuType := FuType.vsetfwf.U 171 csBundle(1).srcType(0) := SrcType.vp 172 csBundle(1).lsrc(0) := VCONFIG_IDX.U 173 csBundle(1).srcType(1) := SrcType.fp 174 csBundle(1).lsrc(1) := FP_TMP_REG_MV.U 175 csBundle(1).ldest := VCONFIG_IDX.U 176 } 177 } 178 } 179 is(UopSplitType.VEC_VVV) { 180 for (i <- 0 until MAX_VLMUL) { 181 csBundle(i).lsrc(0) := src1 + i.U 182 csBundle(i).lsrc(1) := src2 + i.U 183 csBundle(i).lsrc(2) := dest + i.U 184 csBundle(i).ldest := dest + i.U 185 csBundle(i).uopIdx := i.U 186 } 187 } 188 is(UopSplitType.VEC_VFV) { 189 for (i <- 0 until MAX_VLMUL) { 190 csBundle(i).lsrc(1) := src2 + i.U 191 csBundle(i).lsrc(2) := dest + i.U 192 csBundle(i).ldest := dest + i.U 193 csBundle(i).uopIdx := i.U 194 } 195 } 196 is(UopSplitType.VEC_EXT2) { 197 for (i <- 0 until MAX_VLMUL / 2) { 198 csBundle(2 * i).lsrc(1) := src2 + i.U 199 csBundle(2 * i).lsrc(2) := dest + (2 * i).U 200 csBundle(2 * i).ldest := dest + (2 * i).U 201 csBundle(2 * i).uopIdx := (2 * i).U 202 csBundle(2 * i + 1).lsrc(1) := src2 + i.U 203 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U 204 csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U 205 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 206 } 207 } 208 is(UopSplitType.VEC_EXT4) { 209 for (i <- 0 until MAX_VLMUL / 4) { 210 csBundle(4 * i).lsrc(1) := src2 + i.U 211 csBundle(4 * i).lsrc(2) := dest + (4 * i).U 212 csBundle(4 * i).ldest := dest + (4 * i).U 213 csBundle(4 * i).uopIdx := (4 * i).U 214 csBundle(4 * i + 1).lsrc(1) := src2 + i.U 215 csBundle(4 * i + 1).lsrc(2) := dest + (4 * i + 1).U 216 csBundle(4 * i + 1).ldest := dest + (4 * i + 1).U 217 csBundle(4 * i + 1).uopIdx := (4 * i + 1).U 218 csBundle(4 * i + 2).lsrc(1) := src2 + i.U 219 csBundle(4 * i + 2).lsrc(2) := dest + (4 * i + 2).U 220 csBundle(4 * i + 2).ldest := dest + (4 * i + 2).U 221 csBundle(4 * i + 2).uopIdx := (4 * i + 2).U 222 csBundle(4 * i + 3).lsrc(1) := src2 + i.U 223 csBundle(4 * i + 
3).lsrc(2) := dest + (4 * i + 3).U 224 csBundle(4 * i + 3).ldest := dest + (4 * i + 3).U 225 csBundle(4 * i + 3).uopIdx := (4 * i + 3).U 226 } 227 } 228 is(UopSplitType.VEC_EXT8) { 229 for (i <- 0 until MAX_VLMUL) { 230 csBundle(i).lsrc(1) := src2 231 csBundle(i).lsrc(2) := dest + i.U 232 csBundle(i).ldest := dest + i.U 233 csBundle(i).uopIdx := i.U 234 } 235 } 236 is(UopSplitType.VEC_0XV) { 237 /* 238 FMV.D.X 239 */ 240 csBundle(0).srcType(0) := SrcType.reg 241 csBundle(0).srcType(1) := SrcType.imm 242 csBundle(0).lsrc(1) := 0.U 243 csBundle(0).ldest := FP_TMP_REG_MV.U 244 csBundle(0).fuType := FuType.i2f.U 245 csBundle(0).rfWen := false.B 246 csBundle(0).fpWen := true.B 247 csBundle(0).vecWen := false.B 248 csBundle(0).fpu.isAddSub := false.B 249 csBundle(0).fpu.typeTagIn := FPU.D 250 csBundle(0).fpu.typeTagOut := FPU.D 251 csBundle(0).fpu.fromInt := true.B 252 csBundle(0).fpu.wflags := false.B 253 csBundle(0).fpu.fpWen := true.B 254 csBundle(0).fpu.div := false.B 255 csBundle(0).fpu.sqrt := false.B 256 csBundle(0).fpu.fcvt := false.B 257 /* 258 vfmv.s.f 259 */ 260 csBundle(1).srcType(0) := SrcType.fp 261 csBundle(1).srcType(1) := SrcType.vp 262 csBundle(1).srcType(2) := SrcType.vp 263 csBundle(1).lsrc(0) := FP_TMP_REG_MV.U 264 csBundle(1).lsrc(1) := 0.U 265 csBundle(1).lsrc(2) := dest 266 csBundle(1).ldest := dest 267 csBundle(1).fuType := FuType.vppu.U 268 csBundle(1).fuOpType := VpermType.dummy 269 csBundle(1).rfWen := false.B 270 csBundle(1).fpWen := false.B 271 csBundle(1).vecWen := true.B 272 } 273 is(UopSplitType.VEC_VXV) { 274 /* 275 FMV.D.X 276 */ 277 csBundle(0).srcType(0) := SrcType.reg 278 csBundle(0).srcType(1) := SrcType.imm 279 csBundle(0).lsrc(1) := 0.U 280 csBundle(0).ldest := FP_TMP_REG_MV.U 281 csBundle(0).fuType := FuType.i2f.U 282 csBundle(0).rfWen := false.B 283 csBundle(0).fpWen := true.B 284 csBundle(0).vecWen := false.B 285 csBundle(0).fpu.isAddSub := false.B 286 csBundle(0).fpu.typeTagIn := FPU.D 287 csBundle(0).fpu.typeTagOut := FPU.D 
288 csBundle(0).fpu.fromInt := true.B 289 csBundle(0).fpu.wflags := false.B 290 csBundle(0).fpu.fpWen := true.B 291 csBundle(0).fpu.div := false.B 292 csBundle(0).fpu.sqrt := false.B 293 csBundle(0).fpu.fcvt := false.B 294 /* 295 LMUL 296 */ 297 for (i <- 0 until MAX_VLMUL) { 298 csBundle(i + 1).srcType(0) := SrcType.fp 299 csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U 300 csBundle(i + 1).lsrc(1) := src2 + i.U 301 csBundle(i + 1).lsrc(2) := dest + i.U 302 csBundle(i + 1).ldest := dest + i.U 303 csBundle(i + 1).uopIdx := i.U 304 } 305 } 306 is(UopSplitType.VEC_VVW) { 307 for (i <- 0 until MAX_VLMUL / 2) { 308 csBundle(2 * i).lsrc(0) := src1 + i.U 309 csBundle(2 * i).lsrc(1) := src2 + i.U 310 csBundle(2 * i).lsrc(2) := dest + (2 * i).U 311 csBundle(2 * i).ldest := dest + (2 * i).U 312 csBundle(2 * i).uopIdx := (2 * i).U 313 csBundle(2 * i + 1).lsrc(0) := src1 + i.U 314 csBundle(2 * i + 1).lsrc(1) := src2 + i.U 315 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U 316 csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U 317 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 318 } 319 } 320 is(UopSplitType.VEC_VFW) { 321 for (i <- 0 until MAX_VLMUL / 2) { 322 csBundle(2 * i).lsrc(0) := src1 323 csBundle(2 * i).lsrc(1) := src2 + i.U 324 csBundle(2 * i).lsrc(2) := dest + (2 * i).U 325 csBundle(2 * i).ldest := dest + (2 * i).U 326 csBundle(2 * i).uopIdx := (2 * i).U 327 csBundle(2 * i + 1).lsrc(0) := src1 328 csBundle(2 * i + 1).lsrc(1) := src2 + i.U 329 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U 330 csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U 331 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 332 } 333 } 334 is(UopSplitType.VEC_WVW) { 335 for (i <- 0 until MAX_VLMUL / 2) { 336 csBundle(2 * i).lsrc(0) := src1 + i.U 337 csBundle(2 * i).lsrc(1) := src2 + (2 * i).U 338 csBundle(2 * i).lsrc(2) := dest + (2 * i).U 339 csBundle(2 * i).ldest := dest + (2 * i).U 340 csBundle(2 * i).uopIdx := (2 * i).U 341 csBundle(2 * i + 1).lsrc(0) := src1 + i.U 342 csBundle(2 * i + 1).lsrc(1) 
:= src2 + (2 * i + 1).U 343 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U 344 csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U 345 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 346 } 347 } 348 is(UopSplitType.VEC_VXW) { 349 /* 350 FMV.D.X 351 */ 352 csBundle(0).srcType(0) := SrcType.reg 353 csBundle(0).srcType(1) := SrcType.imm 354 csBundle(0).lsrc(1) := 0.U 355 csBundle(0).ldest := FP_TMP_REG_MV.U 356 csBundle(0).fuType := FuType.i2f.U 357 csBundle(0).rfWen := false.B 358 csBundle(0).fpWen := true.B 359 csBundle(0).vecWen := false.B 360 csBundle(0).fpu.isAddSub := false.B 361 csBundle(0).fpu.typeTagIn := FPU.D 362 csBundle(0).fpu.typeTagOut := FPU.D 363 csBundle(0).fpu.fromInt := true.B 364 csBundle(0).fpu.wflags := false.B 365 csBundle(0).fpu.fpWen := true.B 366 csBundle(0).fpu.div := false.B 367 csBundle(0).fpu.sqrt := false.B 368 csBundle(0).fpu.fcvt := false.B 369 370 for (i <- 0 until MAX_VLMUL / 2) { 371 csBundle(2 * i + 1).srcType(0) := SrcType.fp 372 csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U 373 csBundle(2 * i + 1).lsrc(1) := src2 + i.U 374 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i).U 375 csBundle(2 * i + 1).ldest := dest + (2 * i).U 376 csBundle(2 * i + 1).uopIdx := (2 * i).U 377 csBundle(2 * i + 2).srcType(0) := SrcType.fp 378 csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U 379 csBundle(2 * i + 2).lsrc(1) := src2 + i.U 380 csBundle(2 * i + 2).lsrc(2) := dest + (2 * i + 1).U 381 csBundle(2 * i + 2).ldest := dest + (2 * i + 1).U 382 csBundle(2 * i + 2).uopIdx := (2 * i + 1).U 383 } 384 } 385 is(UopSplitType.VEC_WXW) { 386 /* 387 FMV.D.X 388 */ 389 csBundle(0).srcType(0) := SrcType.reg 390 csBundle(0).srcType(1) := SrcType.imm 391 csBundle(0).lsrc(1) := 0.U 392 csBundle(0).ldest := FP_TMP_REG_MV.U 393 csBundle(0).fuType := FuType.i2f.U 394 csBundle(0).rfWen := false.B 395 csBundle(0).fpWen := true.B 396 csBundle(0).vecWen := false.B 397 csBundle(0).fpu.isAddSub := false.B 398 csBundle(0).fpu.typeTagIn := FPU.D 399 csBundle(0).fpu.typeTagOut := 
FPU.D 400 csBundle(0).fpu.fromInt := true.B 401 csBundle(0).fpu.wflags := false.B 402 csBundle(0).fpu.fpWen := true.B 403 csBundle(0).fpu.div := false.B 404 csBundle(0).fpu.sqrt := false.B 405 csBundle(0).fpu.fcvt := false.B 406 407 for (i <- 0 until MAX_VLMUL / 2) { 408 csBundle(2 * i + 1).srcType(0) := SrcType.fp 409 csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U 410 csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i).U 411 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i).U 412 csBundle(2 * i + 1).ldest := dest + (2 * i).U 413 csBundle(2 * i + 1).uopIdx := (2 * i).U 414 csBundle(2 * i + 2).srcType(0) := SrcType.fp 415 csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U 416 csBundle(2 * i + 2).lsrc(1) := src2 + (2 * i + 1).U 417 csBundle(2 * i + 2).lsrc(2) := dest + (2 * i + 1).U 418 csBundle(2 * i + 2).ldest := dest + (2 * i + 1).U 419 csBundle(2 * i + 2).uopIdx := (2 * i + 1).U 420 } 421 } 422 is(UopSplitType.VEC_WVV) { 423 for (i <- 0 until MAX_VLMUL / 2) { 424 425 csBundle(2 * i).lsrc(0) := src1 + i.U 426 csBundle(2 * i).lsrc(1) := src2 + (2 * i).U 427 csBundle(2 * i).lsrc(2) := dest + i.U 428 csBundle(2 * i).ldest := dest + i.U 429 csBundle(2 * i).uopIdx := (2 * i).U 430 csBundle(2 * i + 1).lsrc(0) := src1 + i.U 431 csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i + 1).U 432 csBundle(2 * i + 1).lsrc(2) := dest + i.U 433 csBundle(2 * i + 1).ldest := dest + i.U 434 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 435 } 436 } 437 is(UopSplitType.VEC_WFW) { 438 for (i <- 0 until MAX_VLMUL / 2) { 439 csBundle(2 * i).lsrc(0) := src1 440 csBundle(2 * i).lsrc(1) := src2 + (2 * i).U 441 csBundle(2 * i).lsrc(2) := dest + (2 * i).U 442 csBundle(2 * i).ldest := dest + (2 * i).U 443 csBundle(2 * i).uopIdx := (2 * i).U 444 csBundle(2 * i + 1).lsrc(0) := src1 445 csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i + 1).U 446 csBundle(2 * i + 1).lsrc(2) := dest + (2 * i + 1).U 447 csBundle(2 * i + 1).ldest := dest + (2 * i + 1).U 448 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 449 } 450 } 451 
is(UopSplitType.VEC_WXV) { 452 /* 453 FMV.D.X 454 */ 455 csBundle(0).srcType(0) := SrcType.reg 456 csBundle(0).srcType(1) := SrcType.imm 457 csBundle(0).lsrc(1) := 0.U 458 csBundle(0).ldest := FP_TMP_REG_MV.U 459 csBundle(0).fuType := FuType.i2f.U 460 csBundle(0).rfWen := false.B 461 csBundle(0).fpWen := true.B 462 csBundle(0).vecWen := false.B 463 csBundle(0).fpu.isAddSub := false.B 464 csBundle(0).fpu.typeTagIn := FPU.D 465 csBundle(0).fpu.typeTagOut := FPU.D 466 csBundle(0).fpu.fromInt := true.B 467 csBundle(0).fpu.wflags := false.B 468 csBundle(0).fpu.fpWen := true.B 469 csBundle(0).fpu.div := false.B 470 csBundle(0).fpu.sqrt := false.B 471 csBundle(0).fpu.fcvt := false.B 472 473 for (i <- 0 until MAX_VLMUL / 2) { 474 csBundle(2 * i + 1).srcType(0) := SrcType.fp 475 csBundle(2 * i + 1).lsrc(0) := FP_TMP_REG_MV.U 476 csBundle(2 * i + 1).lsrc(1) := src2 + (2 * i).U 477 csBundle(2 * i + 1).lsrc(2) := dest + i.U 478 csBundle(2 * i + 1).ldest := dest + i.U 479 csBundle(2 * i + 1).uopIdx := (2 * i).U 480 csBundle(2 * i + 2).srcType(0) := SrcType.fp 481 csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U 482 csBundle(2 * i + 2).lsrc(1) := src2 + (2 * i + 1).U 483 csBundle(2 * i + 2).lsrc(2) := dest + i.U 484 csBundle(2 * i + 2).ldest := dest + i.U 485 csBundle(2 * i + 2).uopIdx := (2 * i + 1).U 486 } 487 } 488 is(UopSplitType.VEC_VVM) { 489 csBundle(0).lsrc(2) := dest 490 csBundle(0).ldest := dest 491 csBundle(0).uopIdx := 0.U 492 for (i <- 1 until MAX_VLMUL) { 493 csBundle(i).lsrc(0) := src1 + i.U 494 csBundle(i).lsrc(1) := src2 + i.U 495 csBundle(i).lsrc(2) := dest 496 csBundle(i).ldest := dest 497 csBundle(i).uopIdx := i.U 498 } 499 csBundle(numOfUop - 1.U).ldest := dest 500 } 501 is(UopSplitType.VEC_VFM) { 502 csBundle(0).lsrc(2) := dest 503 csBundle(0).ldest := dest 504 csBundle(0).uopIdx := 0.U 505 for (i <- 1 until MAX_VLMUL) { 506 csBundle(i).lsrc(0) := src1 507 csBundle(i).lsrc(1) := src2 + i.U 508 csBundle(i).lsrc(2) := dest 509 csBundle(i).ldest := dest 510 
csBundle(i).uopIdx := i.U 511 } 512 csBundle(numOfUop - 1.U).ldest := dest 513 } 514 is(UopSplitType.VEC_VXM) { 515 /* 516 FMV.D.X 517 */ 518 csBundle(0).srcType(0) := SrcType.reg 519 csBundle(0).srcType(1) := SrcType.imm 520 csBundle(0).lsrc(1) := 0.U 521 csBundle(0).ldest := FP_TMP_REG_MV.U 522 csBundle(0).fuType := FuType.i2f.U 523 csBundle(0).rfWen := false.B 524 csBundle(0).fpWen := true.B 525 csBundle(0).vecWen := false.B 526 csBundle(0).fpu.isAddSub := false.B 527 csBundle(0).fpu.typeTagIn := FPU.D 528 csBundle(0).fpu.typeTagOut := FPU.D 529 csBundle(0).fpu.fromInt := true.B 530 csBundle(0).fpu.wflags := false.B 531 csBundle(0).fpu.fpWen := true.B 532 csBundle(0).fpu.div := false.B 533 csBundle(0).fpu.sqrt := false.B 534 csBundle(0).fpu.fcvt := false.B 535 //LMUL 536 csBundle(1).srcType(0) := SrcType.fp 537 csBundle(1).lsrc(0) := FP_TMP_REG_MV.U 538 csBundle(1).lsrc(2) := dest 539 csBundle(1).ldest := dest 540 csBundle(1).uopIdx := 0.U 541 for (i <- 1 until MAX_VLMUL) { 542 csBundle(i + 1).srcType(0) := SrcType.fp 543 csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U 544 csBundle(i + 1).lsrc(1) := src2 + i.U 545 csBundle(i + 1).lsrc(2) := dest 546 csBundle(i + 1).ldest := dest 547 csBundle(i + 1).uopIdx := i.U 548 } 549 csBundle(numOfUop - 1.U).ldest := dest 550 } 551 is(UopSplitType.VEC_SLIDE1UP) { 552 /* 553 FMV.D.X 554 */ 555 csBundle(0).srcType(0) := SrcType.reg 556 csBundle(0).srcType(1) := SrcType.imm 557 csBundle(0).lsrc(1) := 0.U 558 csBundle(0).ldest := FP_TMP_REG_MV.U 559 csBundle(0).fuType := FuType.i2f.U 560 csBundle(0).rfWen := false.B 561 csBundle(0).fpWen := true.B 562 csBundle(0).vecWen := false.B 563 csBundle(0).fpu.isAddSub := false.B 564 csBundle(0).fpu.typeTagIn := FPU.D 565 csBundle(0).fpu.typeTagOut := FPU.D 566 csBundle(0).fpu.fromInt := true.B 567 csBundle(0).fpu.wflags := false.B 568 csBundle(0).fpu.fpWen := true.B 569 csBundle(0).fpu.div := false.B 570 csBundle(0).fpu.sqrt := false.B 571 csBundle(0).fpu.fcvt := false.B 572 //LMUL 573 
csBundle(1).srcType(0) := SrcType.fp 574 csBundle(1).lsrc(0) := FP_TMP_REG_MV.U 575 csBundle(1).lsrc(2) := dest 576 csBundle(1).ldest := dest 577 csBundle(1).uopIdx := 0.U 578 for (i <- 1 until MAX_VLMUL) { 579 csBundle(i + 1).srcType(0) := SrcType.vp 580 csBundle(i + 1).lsrc(0) := src2 + (i - 1).U 581 csBundle(i + 1).lsrc(1) := src2 + i.U 582 csBundle(i + 1).lsrc(2) := dest + i.U 583 csBundle(i + 1).ldest := dest + i.U 584 csBundle(i + 1).uopIdx := i.U 585 } 586 } 587 is(UopSplitType.VEC_FSLIDE1UP) { 588 //LMUL 589 csBundle(0).srcType(0) := SrcType.fp 590 csBundle(0).lsrc(0) := src1 591 csBundle(0).lsrc(1) := src2 592 csBundle(0).lsrc(2) := dest 593 csBundle(0).ldest := dest 594 csBundle(0).uopIdx := 0.U 595 for (i <- 1 until MAX_VLMUL) { 596 csBundle(i).srcType(0) := SrcType.vp 597 csBundle(i).lsrc(0) := src2 + (i - 1).U 598 csBundle(i).lsrc(1) := src2 + i.U 599 csBundle(i).lsrc(2) := dest + i.U 600 csBundle(i).ldest := dest + i.U 601 csBundle(i).uopIdx := i.U 602 } 603 } 604 is(UopSplitType.VEC_SLIDE1DOWN) { // lmul+lmul = 16 605 /* 606 FMV.D.X 607 */ 608 csBundle(0).srcType(0) := SrcType.reg 609 csBundle(0).srcType(1) := SrcType.imm 610 csBundle(0).lsrc(1) := 0.U 611 csBundle(0).ldest := FP_TMP_REG_MV.U 612 csBundle(0).fuType := FuType.i2f.U 613 csBundle(0).rfWen := false.B 614 csBundle(0).fpWen := true.B 615 csBundle(0).vecWen := false.B 616 csBundle(0).fpu.isAddSub := false.B 617 csBundle(0).fpu.typeTagIn := FPU.D 618 csBundle(0).fpu.typeTagOut := FPU.D 619 csBundle(0).fpu.fromInt := true.B 620 csBundle(0).fpu.wflags := false.B 621 csBundle(0).fpu.fpWen := true.B 622 csBundle(0).fpu.div := false.B 623 csBundle(0).fpu.sqrt := false.B 624 csBundle(0).fpu.fcvt := false.B 625 //LMUL 626 for (i <- 0 until MAX_VLMUL) { 627 csBundle(2 * i + 1).srcType(0) := SrcType.vp 628 csBundle(2 * i + 1).srcType(1) := SrcType.vp 629 csBundle(2 * i + 1).lsrc(0) := src2 + (i + 1).U 630 csBundle(2 * i + 1).lsrc(1) := src2 + i.U 631 csBundle(2 * i + 1).lsrc(2) := dest + i.U 632 
csBundle(2 * i + 1).ldest := VECTOR_TMP_REG_LMUL.U 633 csBundle(2 * i + 1).uopIdx := (2 * i).U 634 if (2 * i + 2 < MAX_VLMUL * 2) { 635 csBundle(2 * i + 2).srcType(0) := SrcType.fp 636 csBundle(2 * i + 2).lsrc(0) := FP_TMP_REG_MV.U 637 // csBundle(2 * i + 2).lsrc(1) := src2 + i.U // DontCare 638 csBundle(2 * i + 2).lsrc(2) := VECTOR_TMP_REG_LMUL.U 639 csBundle(2 * i + 2).ldest := dest + i.U 640 csBundle(2 * i + 2).uopIdx := (2 * i + 1).U 641 } 642 } 643 csBundle(numOfUop - 1.U).srcType(0) := SrcType.fp 644 csBundle(numOfUop - 1.U).lsrc(0) := FP_TMP_REG_MV.U 645 csBundle(numOfUop - 1.U).ldest := dest + lmul - 1.U 646 } 647 is(UopSplitType.VEC_FSLIDE1DOWN) { 648 //LMUL 649 for (i <- 0 until MAX_VLMUL) { 650 csBundle(2 * i).srcType(0) := SrcType.vp 651 csBundle(2 * i).srcType(1) := SrcType.vp 652 csBundle(2 * i).lsrc(0) := src2 + (i + 1).U 653 csBundle(2 * i).lsrc(1) := src2 + i.U 654 csBundle(2 * i).lsrc(2) := dest + i.U 655 csBundle(2 * i).ldest := VECTOR_TMP_REG_LMUL.U 656 csBundle(2 * i).uopIdx := (2 * i).U 657 csBundle(2 * i + 1).srcType(0) := SrcType.fp 658 csBundle(2 * i + 1).lsrc(0) := src1 659 csBundle(2 * i + 1).lsrc(2) := VECTOR_TMP_REG_LMUL.U 660 csBundle(2 * i + 1).ldest := dest + i.U 661 csBundle(2 * i + 1).uopIdx := (2 * i + 1).U 662 } 663 csBundle(numOfUop - 1.U).srcType(0) := SrcType.fp 664 csBundle(numOfUop - 1.U).lsrc(0) := src1 665 csBundle(numOfUop - 1.U).ldest := dest + lmul - 1.U 666 } 667 is(UopSplitType.VEC_VRED) { 668 when(simple.io.enq.vtype.vlmul === "b001".U) { 669 csBundle(0).srcType(2) := SrcType.DC 670 csBundle(0).lsrc(0) := src2 + 1.U 671 csBundle(0).lsrc(1) := src2 672 csBundle(0).ldest := VECTOR_TMP_REG_LMUL.U 673 csBundle(0).uopIdx := 0.U 674 } 675 when(simple.io.enq.vtype.vlmul === "b010".U) { 676 csBundle(0).srcType(2) := SrcType.DC 677 csBundle(0).lsrc(0) := src2 + 1.U 678 csBundle(0).lsrc(1) := src2 679 csBundle(0).ldest := VECTOR_TMP_REG_LMUL.U 680 csBundle(0).uopIdx := 0.U 681 682 csBundle(1).srcType(2) := SrcType.DC 683 
csBundle(1).lsrc(0) := src2 + 3.U 684 csBundle(1).lsrc(1) := src2 + 2.U 685 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 686 csBundle(1).uopIdx := 1.U 687 688 csBundle(2).srcType(2) := SrcType.DC 689 csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U 690 csBundle(2).lsrc(1) := VECTOR_TMP_REG_LMUL.U 691 csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U 692 csBundle(2).uopIdx := 2.U 693 } 694 when(simple.io.enq.vtype.vlmul === "b011".U) { 695 for (i <- 0 until MAX_VLMUL) { 696 if (i < MAX_VLMUL - MAX_VLMUL / 2) { 697 csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U 698 csBundle(i).lsrc(1) := src2 + (i * 2).U 699 csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U 700 } else if (i < MAX_VLMUL - MAX_VLMUL / 4) { 701 csBundle(i).lsrc(0) := (VECTOR_TMP_REG_LMUL + (i - MAX_VLMUL / 2) * 2 + 1).U 702 csBundle(i).lsrc(1) := (VECTOR_TMP_REG_LMUL + (i - MAX_VLMUL / 2) * 2).U 703 csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U 704 } else if (i < MAX_VLMUL - MAX_VLMUL / 8) { 705 csBundle(6).lsrc(0) := (VECTOR_TMP_REG_LMUL + 5).U 706 csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U 707 csBundle(6).ldest := (VECTOR_TMP_REG_LMUL + 6).U 708 } 709 csBundle(i).srcType(2) := SrcType.DC 710 csBundle(i).uopIdx := i.U 711 } 712 } 713 when(simple.io.enq.vtype.vlmul.orR()) { 714 csBundle(numOfUop - 1.U).srcType(2) := SrcType.vp 715 csBundle(numOfUop - 1.U).lsrc(0) := src1 716 csBundle(numOfUop - 1.U).lsrc(1) := VECTOR_TMP_REG_LMUL.U + numOfUop - 2.U 717 csBundle(numOfUop - 1.U).lsrc(2) := dest 718 csBundle(numOfUop - 1.U).ldest := dest 719 csBundle(numOfUop - 1.U).uopIdx := numOfUop - 1.U 720 } 721 } 722 is(UopSplitType.VEC_VFRED) { 723 val vlmul = simple.io.enq.vtype.vlmul 724 val vsew = simple.io.enq.vtype.vsew 725 when(vlmul === VLmul.m8){ 726 for (i <- 0 until 4) { 727 csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U 728 csBundle(i).lsrc(1) := src2 + (i * 2).U 729 csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U 730 csBundle(i).uopIdx := i.U 731 } 732 for (i <- 4 until 6) { 733 
csBundle(i).lsrc(0) := (VECTOR_TMP_REG_LMUL + (i - 4) * 2 + 1).U 734 csBundle(i).lsrc(1) := (VECTOR_TMP_REG_LMUL + (i - 4) * 2).U 735 csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U 736 csBundle(i).uopIdx := i.U 737 } 738 csBundle(6).lsrc(0) := (VECTOR_TMP_REG_LMUL + 5).U 739 csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U 740 csBundle(6).ldest := (VECTOR_TMP_REG_LMUL + 6).U 741 csBundle(6).uopIdx := 6.U 742 when(vsew === VSew.e64) { 743 csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U 744 csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U 745 csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U 746 csBundle(7).vpu.fpu.isFoldTo1_2 := true.B 747 csBundle(7).uopIdx := 7.U 748 csBundle(8).lsrc(0) := src1 749 csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U 750 csBundle(8).ldest := dest 751 csBundle(8).uopIdx := 8.U 752 } 753 when(vsew === VSew.e32) { 754 csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U 755 csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U 756 csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U 757 csBundle(7).vpu.fpu.isFoldTo1_2 := true.B 758 csBundle(7).uopIdx := 7.U 759 csBundle(8).lsrc(0) := (VECTOR_TMP_REG_LMUL + 7).U 760 csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U 761 csBundle(8).ldest := (VECTOR_TMP_REG_LMUL + 8).U 762 csBundle(8).vpu.fpu.isFoldTo1_4 := true.B 763 csBundle(8).uopIdx := 8.U 764 csBundle(9).lsrc(0) := src1 765 csBundle(9).lsrc(1) := (VECTOR_TMP_REG_LMUL + 8).U 766 csBundle(9).ldest := dest 767 csBundle(9).uopIdx := 9.U 768 } 769 when(vsew === VSew.e16) { 770 csBundle(7).lsrc(0) := (VECTOR_TMP_REG_LMUL + 6).U 771 csBundle(7).lsrc(1) := (VECTOR_TMP_REG_LMUL + 6).U 772 csBundle(7).ldest := (VECTOR_TMP_REG_LMUL + 7).U 773 csBundle(7).vpu.fpu.isFoldTo1_2 := true.B 774 csBundle(7).uopIdx := 7.U 775 csBundle(8).lsrc(0) := (VECTOR_TMP_REG_LMUL + 7).U 776 csBundle(8).lsrc(1) := (VECTOR_TMP_REG_LMUL + 7).U 777 csBundle(8).ldest := (VECTOR_TMP_REG_LMUL + 8).U 778 csBundle(8).vpu.fpu.isFoldTo1_4 := true.B 779 csBundle(8).uopIdx := 
8.U 780 csBundle(9).lsrc(0) := (VECTOR_TMP_REG_LMUL + 8).U 781 csBundle(9).lsrc(1) := (VECTOR_TMP_REG_LMUL + 8).U 782 csBundle(9).ldest := (VECTOR_TMP_REG_LMUL + 9).U 783 csBundle(9).vpu.fpu.isFoldTo1_8 := true.B 784 csBundle(9).uopIdx := 9.U 785 csBundle(10).lsrc(0) := src1 786 csBundle(10).lsrc(1) := (VECTOR_TMP_REG_LMUL + 9).U 787 csBundle(10).ldest := dest 788 csBundle(10).uopIdx := 10.U 789 } 790 } 791 when(vlmul === VLmul.m4) { 792 for (i <- 0 until 2) { 793 csBundle(i).lsrc(0) := src2 + (i * 2 + 1).U 794 csBundle(i).lsrc(1) := src2 + (i * 2).U 795 csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U 796 csBundle(i).uopIdx := i.U 797 } 798 csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U 799 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 800 csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U 801 csBundle(2).uopIdx := 2.U 802 when(vsew === VSew.e64) { 803 csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U 804 csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 805 csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U 806 csBundle(3).vpu.fpu.isFoldTo1_2 := true.B 807 csBundle(3).uopIdx := 3.U 808 csBundle(4).lsrc(0) := src1 809 csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U 810 csBundle(4).ldest := dest 811 csBundle(4).uopIdx := 4.U 812 } 813 when(vsew === VSew.e32) { 814 csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U 815 csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 816 csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U 817 csBundle(3).vpu.fpu.isFoldTo1_2 := true.B 818 csBundle(3).uopIdx := 3.U 819 csBundle(4).lsrc(0) := (VECTOR_TMP_REG_LMUL + 3).U 820 csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U 821 csBundle(4).ldest := (VECTOR_TMP_REG_LMUL + 4).U 822 csBundle(4).vpu.fpu.isFoldTo1_4 := true.B 823 csBundle(4).uopIdx := 4.U 824 csBundle(5).lsrc(0) := src1 825 csBundle(5).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U 826 csBundle(5).ldest := dest 827 csBundle(5).uopIdx := 5.U 828 } 829 when(vsew === VSew.e16) { 830 csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL 
+ 2).U 831 csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 832 csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U 833 csBundle(3).vpu.fpu.isFoldTo1_2 := true.B 834 csBundle(3).uopIdx := 3.U 835 csBundle(4).lsrc(0) := (VECTOR_TMP_REG_LMUL + 3).U 836 csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U 837 csBundle(4).ldest := (VECTOR_TMP_REG_LMUL + 4).U 838 csBundle(4).vpu.fpu.isFoldTo1_4 := true.B 839 csBundle(4).uopIdx := 4.U 840 csBundle(5).lsrc(0) := (VECTOR_TMP_REG_LMUL + 4).U 841 csBundle(5).lsrc(1) := (VECTOR_TMP_REG_LMUL + 4).U 842 csBundle(5).ldest := (VECTOR_TMP_REG_LMUL + 5).U 843 csBundle(5).vpu.fpu.isFoldTo1_8 := true.B 844 csBundle(5).uopIdx := 5.U 845 csBundle(6).lsrc(0) := src1 846 csBundle(6).lsrc(1) := (VECTOR_TMP_REG_LMUL + 5).U 847 csBundle(6).ldest := dest 848 csBundle(6).uopIdx := 6.U 849 } 850 } 851 when(vlmul === VLmul.m2) { 852 csBundle(0).lsrc(0) := src2 + 1.U 853 csBundle(0).lsrc(1) := src2 + 0.U 854 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 855 csBundle(0).uopIdx := 0.U 856 when(vsew === VSew.e64) { 857 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 858 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 859 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 860 csBundle(1).vpu.fpu.isFoldTo1_2 := true.B 861 csBundle(1).uopIdx := 1.U 862 csBundle(2).lsrc(0) := src1 863 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 864 csBundle(2).ldest := dest 865 csBundle(2).uopIdx := 2.U 866 } 867 when(vsew === VSew.e32) { 868 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 869 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 870 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 871 csBundle(1).vpu.fpu.isFoldTo1_2 := true.B 872 csBundle(1).uopIdx := 1.U 873 csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U 874 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 875 csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U 876 csBundle(2).vpu.fpu.isFoldTo1_4 := true.B 877 csBundle(2).uopIdx := 2.U 878 csBundle(3).lsrc(0) := src1 879 
csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 880 csBundle(3).ldest := dest 881 csBundle(3).uopIdx := 3.U 882 } 883 when(vsew === VSew.e16) { 884 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 885 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 886 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 887 csBundle(1).vpu.fpu.isFoldTo1_2 := true.B 888 csBundle(1).uopIdx := 1.U 889 csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U 890 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 891 csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U 892 csBundle(2).vpu.fpu.isFoldTo1_4 := true.B 893 csBundle(2).uopIdx := 2.U 894 csBundle(3).lsrc(0) := (VECTOR_TMP_REG_LMUL + 2).U 895 csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 896 csBundle(3).ldest := (VECTOR_TMP_REG_LMUL + 3).U 897 csBundle(3).vpu.fpu.isFoldTo1_8 := true.B 898 csBundle(3).uopIdx := 3.U 899 csBundle(4).lsrc(0) := src1 900 csBundle(4).lsrc(1) := (VECTOR_TMP_REG_LMUL + 3).U 901 csBundle(4).ldest := dest 902 csBundle(4).uopIdx := 4.U 903 } 904 } 905 when(vlmul === VLmul.m1) { 906 when(vsew === VSew.e64) { 907 csBundle(0).lsrc(0) := src2 908 csBundle(0).lsrc(1) := src2 909 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 910 csBundle(0).vpu.fpu.isFoldTo1_2 := true.B 911 csBundle(0).uopIdx := 0.U 912 csBundle(1).lsrc(0) := src1 913 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 914 csBundle(1).ldest := dest 915 csBundle(1).uopIdx := 1.U 916 } 917 when(vsew === VSew.e32) { 918 csBundle(0).lsrc(0) := src2 919 csBundle(0).lsrc(1) := src2 920 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 921 csBundle(0).vpu.fpu.isFoldTo1_2 := true.B 922 csBundle(0).uopIdx := 0.U 923 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 924 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 925 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 926 csBundle(1).vpu.fpu.isFoldTo1_4 := true.B 927 csBundle(1).uopIdx := 1.U 928 csBundle(2).lsrc(0) := src1 929 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 930 
csBundle(2).ldest := dest 931 csBundle(2).uopIdx := 2.U 932 } 933 when(vsew === VSew.e16) { 934 csBundle(0).lsrc(0) := src2 935 csBundle(0).lsrc(1) := src2 936 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 937 csBundle(0).vpu.fpu.isFoldTo1_2 := true.B 938 csBundle(0).uopIdx := 0.U 939 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 940 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 941 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 942 csBundle(1).vpu.fpu.isFoldTo1_4 := true.B 943 csBundle(1).uopIdx := 1.U 944 csBundle(2).lsrc(0) := (VECTOR_TMP_REG_LMUL + 1).U 945 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 946 csBundle(2).ldest := (VECTOR_TMP_REG_LMUL + 2).U 947 csBundle(2).vpu.fpu.isFoldTo1_8 := true.B 948 csBundle(2).uopIdx := 2.U 949 csBundle(3).lsrc(0) := src1 950 csBundle(3).lsrc(1) := (VECTOR_TMP_REG_LMUL + 2).U 951 csBundle(3).ldest := dest 952 csBundle(3).uopIdx := 3.U 953 } 954 } 955 when(vlmul === VLmul.mf2) { 956 when(vsew === VSew.e32) { 957 csBundle(0).lsrc(0) := src2 958 csBundle(0).lsrc(1) := src2 959 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 960 csBundle(0).vpu.fpu.isFoldTo1_4 := true.B 961 csBundle(0).uopIdx := 0.U 962 csBundle(1).lsrc(0) := src1 963 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 964 csBundle(1).ldest := dest 965 csBundle(1).uopIdx := 1.U 966 } 967 when(vsew === VSew.e16) { 968 csBundle(0).lsrc(0) := src2 969 csBundle(0).lsrc(1) := src2 970 csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U 971 csBundle(0).vpu.fpu.isFoldTo1_4 := true.B 972 csBundle(0).uopIdx := 0.U 973 csBundle(1).lsrc(0) := (VECTOR_TMP_REG_LMUL + 0).U 974 csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U 975 csBundle(1).ldest := (VECTOR_TMP_REG_LMUL + 1).U 976 csBundle(1).vpu.fpu.isFoldTo1_8 := true.B 977 csBundle(1).uopIdx := 1.U 978 csBundle(2).lsrc(0) := src1 979 csBundle(2).lsrc(1) := (VECTOR_TMP_REG_LMUL + 1).U 980 csBundle(2).ldest := dest 981 csBundle(2).uopIdx := 2.U 982 } 983 } 984 when(vlmul === VLmul.mf4) { 985 when(vsew 
=== VSew.e16) {
          // Tail of a split case whose header lies above this excerpt; statements are unchanged.
          // uop 0 reads src2 on both sources with isFoldTo1_8 set and writes the first temporary;
          // uop 1 reads src1 together with that temporary and writes dest.
          csBundle(0).lsrc(0) := src2
          csBundle(0).lsrc(1) := src2
          csBundle(0).ldest := (VECTOR_TMP_REG_LMUL + 0).U
          csBundle(0).vpu.fpu.isFoldTo1_8 := true.B
          csBundle(0).uopIdx := 0.U
          csBundle(1).lsrc(0) := src1
          csBundle(1).lsrc(1) := (VECTOR_TMP_REG_LMUL + 0).U
          csBundle(1).ldest := dest
          csBundle(1).uopIdx := 1.U
        }
      }
    }

    is(UopSplitType.VEC_SLIDEUP) {
      // Slot 0 holds the scalar-move uop (FMV.D.X): it is sent to the i2f unit, takes an
      // integer register as source 0 and writes the FP temporary FP_TMP_REG_MV.
      val moveUop = csBundle(0)
      moveUop.srcType(0) := SrcType.reg
      moveUop.srcType(1) := SrcType.imm
      moveUop.lsrc(1) := 0.U
      moveUop.ldest := FP_TMP_REG_MV.U
      moveUop.fuType := FuType.i2f.U
      moveUop.rfWen := false.B
      moveUop.fpWen := true.B
      moveUop.vecWen := false.B
      val moveFpu = moveUop.fpu
      moveFpu.isAddSub := false.B
      moveFpu.typeTagIn := FPU.D
      moveFpu.typeTagOut := FPU.D
      moveFpu.fromInt := true.B
      moveFpu.wflags := false.B
      moveFpu.fpWen := true.B
      moveFpu.div := false.B
      moveFpu.sqrt := false.B
      moveFpu.fcvt := false.B

      // Triangular expansion: destination register i is produced by a chain of i + 1 uops.
      // The first link reads dest + i as the old value, intermediate links hand the partial
      // result over through the temporaries, and the last link writes dest + i.
      for {
        i <- 0 until MAX_VLMUL
        j <- 0 to i
      } {
        val seqNo = i * (i + 1) / 2 + j
        // Slots are shifted by one because slot 0 is the move uop; uopIdx is not shifted.
        val uop = csBundle(seqNo + 1)
        val chainIn = if (j == 0) dest + i.U else (VECTOR_TMP_REG_LMUL + j - 1).U
        val chainOut = if (j == i) dest + i.U else (VECTOR_TMP_REG_LMUL + j).U
        uop.srcType(0) := SrcType.fp
        uop.lsrc(0) := FP_TMP_REG_MV.U
        uop.lsrc(1) := src2 + j.U
        uop.lsrc(2) := chainIn
        uop.ldest := chainOut
        uop.uopIdx := seqNo.U
      }
    }

    is(UopSplitType.VEC_ISLIDEUP) {
      // Same triangular chain as VEC_SLIDEUP, but without the leading move uop:
      // slot number and uopIdx coincide, and source 0 is left as decoded.
      for {
        i <- 0 until MAX_VLMUL
        j <- 0 to i
      } {
        val seqNo = i * (i + 1) / 2 + j
        val uop = csBundle(seqNo)
        val chainIn = if (j == 0) dest + i.U else (VECTOR_TMP_REG_LMUL + j - 1).U
        val chainOut = if (j == i) dest + i.U else (VECTOR_TMP_REG_LMUL + j).U
        uop.lsrc(1) := src2 + j.U
        uop.lsrc(2) := chainIn
        uop.ldest := chainOut
        uop.uopIdx := seqNo.U
      }
    }

    is(UopSplitType.VEC_SLIDEDOWN) {
      // Slot 0 holds the scalar-move uop (FMV.D.X), configured exactly as in VEC_SLIDEUP.
      val moveUop = csBundle(0)
      moveUop.srcType(0) := SrcType.reg
      moveUop.srcType(1) := SrcType.imm
      moveUop.lsrc(1) := 0.U
      moveUop.ldest := FP_TMP_REG_MV.U
      moveUop.fuType := FuType.i2f.U
      moveUop.rfWen := false.B
      moveUop.fpWen := true.B
      moveUop.vecWen := false.B
      val moveFpu = moveUop.fpu
      moveFpu.isAddSub := false.B
      moveFpu.typeTagIn := FPU.D
      moveFpu.typeTagOut := FPU.D
      moveFpu.fromInt := true.B
      moveFpu.wflags := false.B
      moveFpu.fpWen := true.B
      moveFpu.div := false.B
      moveFpu.sqrt := false.B
      moveFpu.fcvt := false.B

      // The chains are laid out backwards from the last slot (numOfUop - 1): chain i targets
      // register dest + lmul - 1 - i and walks the source group from its top register
      // downwards. Only chains with i < lmul are generated.
      for {
        i <- 0 until MAX_VLMUL
        j <- i to 0 by -1
      } {
        when(i.U < lmul) {
          val fromEnd = i * (i + 1) / 2 + i - j + 1
          val uop = csBundle(numOfUop - fromEnd.U)
          val chainIn = if (j == 0) dest + lmul - 1.U - i.U else (VECTOR_TMP_REG_LMUL + j - 1).U
          val chainOut = if (j == i) dest + lmul - 1.U - i.U else (VECTOR_TMP_REG_LMUL + j).U
          uop.srcType(0) := SrcType.fp
          uop.lsrc(0) := FP_TMP_REG_MV.U
          uop.lsrc(1) := src2 + lmul - 1.U - j.U
          uop.lsrc(2) := chainIn
          uop.ldest := chainOut
          // uopIdx is one lower than the slot number because the move uop occupies slot 0.
          uop.uopIdx := numOfUop - (fromEnd + 1).U
        }
      }
    }

    is(UopSplitType.VEC_ISLIDEDOWN) {
      // Backwards-laid chains as in VEC_SLIDEDOWN, without the move uop:
      // uopIdx equals the slot number and source 0 is left as decoded.
      for {
        i <- 0 until MAX_VLMUL
        j <- i to 0 by -1
      } {
        when(i.U < lmul) {
          val fromEnd = i * (i + 1) / 2 + i - j + 1
          val uop = csBundle(numOfUop - fromEnd.U)
          val chainIn = if (j == 0) dest + lmul - 1.U - i.U else (VECTOR_TMP_REG_LMUL + j - 1).U
          val chainOut = if (j == i) dest + lmul - 1.U - i.U else (VECTOR_TMP_REG_LMUL + j).U
          uop.lsrc(1) := src2 + lmul - 1.U - j.U
          uop.lsrc(2) := chainIn
          uop.ldest := chainOut
          uop.uopIdx := numOfUop - fromEnd.U
        }
      }
    }

    is(UopSplitType.VEC_M0X) {
      // One vector uop per slot i: it reads the previous temporary (source 0 is don't-care
      // for the first uop) and src2, and writes temporary i. lsrc(2) is deliberately not driven.
      for (i <- 0 until MAX_VLMUL) {
        val uop = csBundle(i)
        uop.srcType(0) := (if (i == 0) SrcType.DC else SrcType.vp)
        uop.srcType(1) := SrcType.vp
        uop.rfWen := false.B
        uop.vecWen := true.B
        uop.lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
        uop.lsrc(1) := src2
        uop.ldest := (VECTOR_TMP_REG_LMUL + i).U
        uop.uopIdx := i.U
      }

      // These connections come after the loop so that they override it:
      // uop lmul - 1 writes the FP temporary instead of a vector temporary.
      val lastVecUop = csBundle(lmul - 1.U)
      lastVecUop.vecWen := false.B
      lastVecUop.fpWen := true.B
      lastVecUop.ldest := FP_TMP_REG_MV.U

      // Slot lmul is the FMV_X_D uop: fmisc unit, reads the FP temporary, writes integer dest.
      val toIntUop = csBundle(lmul)
      toIntUop.srcType(0) := SrcType.fp
      toIntUop.srcType(1) := SrcType.imm
      toIntUop.lsrc(0) := FP_TMP_REG_MV.U
      toIntUop.lsrc(1) := 0.U
      toIntUop.ldest := dest
      toIntUop.fuType := FuType.fmisc.U
      toIntUop.rfWen := true.B
      toIntUop.fpWen := false.B
      toIntUop.vecWen := false.B
      val toIntFpu = toIntUop.fpu
      toIntFpu.isAddSub := false.B
      toIntFpu.typeTagIn := FPU.D
      toIntFpu.typeTagOut := FPU.D
      toIntFpu.fromInt := false.B
      toIntFpu.wflags := false.B
      toIntFpu.fpWen := false.B
      toIntFpu.div := false.B
      toIntFpu.sqrt := false.B
      toIntFpu.fcvt := false.B
    }

is(UopSplitType.VEC_MVV) {
      // Two uops per index i. Both read temporary i - 1 (don't-care for i == 0) and src2.
      // The even slot also reads dest + i as old value and writes dest + i;
      // the odd slot writes temporary i and leaves lsrc(2) undriven.
      for (i <- 0 until MAX_VLMUL) {
        val srcType0 = if (i == 0) SrcType.DC else SrcType.vp
        csBundle(i * 2 + 0).srcType(0) := srcType0
        csBundle(i * 2 + 0).srcType(1) := SrcType.vp
        csBundle(i * 2 + 0).lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
        csBundle(i * 2 + 0).lsrc(1) := src2
        csBundle(i * 2 + 0).lsrc(2) := dest + i.U
        csBundle(i * 2 + 0).ldest := dest + i.U
        csBundle(i * 2 + 0).uopIdx := (i * 2 + 0).U

        csBundle(i * 2 + 1).srcType(0) := srcType0
        csBundle(i * 2 + 1).srcType(1) := SrcType.vp
        csBundle(i * 2 + 1).lsrc(0) := (VECTOR_TMP_REG_LMUL + i - 1).U
        csBundle(i * 2 + 1).lsrc(1) := src2
        // lsrc(2) intentionally left as decoded (don't-care for this uop)
        csBundle(i * 2 + 1).ldest := (VECTOR_TMP_REG_LMUL + i).U
        csBundle(i * 2 + 1).uopIdx := (i * 2 + 1).U
      }
    }

    is(UopSplitType.VEC_M0X_VFIRST) {
      // uop 0: redirect the result to the FP temporary instead of the integer register file.
      csBundle(0).rfWen := false.B
      csBundle(0).fpWen := true.B
      csBundle(0).ldest := FP_TMP_REG_MV.U
      // uop 1: FMV_X_D -- fmisc unit, reads the FP temporary and writes integer register dest.
      csBundle(1).srcType(0) := SrcType.fp
      csBundle(1).srcType(1) := SrcType.imm
      csBundle(1).lsrc(0) := FP_TMP_REG_MV.U
      csBundle(1).lsrc(1) := 0.U
      csBundle(1).ldest := dest
      csBundle(1).fuType := FuType.fmisc.U
      csBundle(1).rfWen := true.B
      csBundle(1).fpWen := false.B
      csBundle(1).vecWen := false.B
      csBundle(1).fpu.isAddSub := false.B
      csBundle(1).fpu.typeTagIn := FPU.D
      csBundle(1).fpu.typeTagOut := FPU.D
      csBundle(1).fpu.fromInt := false.B
      csBundle(1).fpu.wflags := false.B
      csBundle(1).fpu.fpWen := false.B
      csBundle(1).fpu.div := false.B
      csBundle(1).fpu.sqrt := false.B
      csBundle(1).fpu.fcvt := false.B
    }

    is(UopSplitType.VEC_VWW) {
      // Slots below lmul read register src2 + i on both sources and write temporary i.
      // Slots at or above lmul pair up earlier temporaries: slot i reads temporaries
      // 2 * (i - lmul) + 1 and 2 * (i - lmul) and writes temporary i.
      for (i <- 0 until MAX_VLMUL * 2) {
        when(i.U < lmul) {
          csBundle(i).srcType(2) := SrcType.DC
          csBundle(i).lsrc(0) := src2 + i.U
          csBundle(i).lsrc(1) := src2 + i.U
          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
          csBundle(i).uopIdx := i.U
        } otherwise {
          csBundle(i).srcType(2) := SrcType.DC
          // Cat(x, 0.U(1.W)) is x shifted left by one, i.e. 2 * (i - lmul).
          csBundle(i).lsrc(0) := VECTOR_TMP_REG_LMUL.U + Cat((i.U - lmul), 0.U(1.W)) + 1.U
          csBundle(i).lsrc(1) := VECTOR_TMP_REG_LMUL.U + Cat((i.U - lmul), 0.U(1.W))
          csBundle(i).ldest := (VECTOR_TMP_REG_LMUL + i).U
          csBundle(i).uopIdx := i.U
        }
      }
      // The last uop reads src1 and the old dest and writes dest. These connections do not
      // depend on the loop index, so they are issued once after the loop; under last-connect
      // semantics this yields the same result as re-issuing them on every iteration.
      csBundle(numOfUop - 1.U).srcType(2) := SrcType.vp
      csBundle(numOfUop - 1.U).lsrc(0) := src1
      csBundle(numOfUop - 1.U).lsrc(2) := dest
      csBundle(numOfUop - 1.U).ldest := dest
    }

    is(UopSplitType.VEC_RGATHER) {
      /** Emits len * len uops. For each index i, a chain over j = 0 until len reads
        * src1 + i and src2 + j; the first link takes dest + i as old value, intermediate
        * links pass the result through temporaries, and the last link writes dest + i.
        * Source types are left as decoded.
        *
        * @param len number of registers in the group (2, 4 or 8 at the call sites below)
        */
      def genCsBundle_VEC_RGATHER(len: Int): Unit = {
        for (i <- 0 until len)
          for (j <- 0 until len) {
            csBundle(i * len + j).lsrc(0) := src1 + i.U
            csBundle(i * len + j).lsrc(1) := src2 + j.U
            val vd_old = if (j == 0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j - 1).U
            csBundle(i * len + j).lsrc(2) := vd_old
            val vd = if (j == len - 1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
            csBundle(i * len + j).ldest := vd
            csBundle(i * len + j).uopIdx := (i * len + j).U
          }
      }
      // Only the vlmul encodings b001/b010/b011 are expanded here.
      switch(simple.io.enq.vtype.vlmul) {
        is("b001".U) {
          genCsBundle_VEC_RGATHER(2)
        }
        is("b010".U) {
          genCsBundle_VEC_RGATHER(4)
        }
        is("b011".U) {
          genCsBundle_VEC_RGATHER(8)
        }
      }
    }

    is(UopSplitType.VEC_RGATHER_VX) {
      /** Same len * len chaining as the vector-indexed gather, except that source 0 of every
        * uop is the FP temporary written by the move uop in slot 0. Slots are therefore
        * shifted by one while uopIdx is not.
        *
        * @param len number of registers in the group (1, 2, 4 or 8 at the call sites below)
        */
      def genCsBundle_RGATHER_VX(len: Int): Unit = {
        for (i <- 0 until len)
          for (j <- 0 until len) {
            csBundle(i * len + j + 1).srcType(0) := SrcType.fp
            csBundle(i * len + j + 1).lsrc(0) := FP_TMP_REG_MV.U
            csBundle(i * len + j + 1).lsrc(1) := src2 + j.U
            val vd_old = if (j == 0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j - 1).U
            csBundle(i * len + j + 1).lsrc(2) := vd_old
            val vd = if (j == len - 1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
            csBundle(i * len + j + 1).ldest := vd
            csBundle(i * len + j + 1).uopIdx := (i * len + j).U
          }
      }
      // Slot 0: FMV.D.X -- i2f unit, integer register source, writes the FP temporary.
      csBundle(0).srcType(0) := SrcType.reg
      csBundle(0).srcType(1) := SrcType.imm
      csBundle(0).lsrc(1) := 0.U
      csBundle(0).ldest := FP_TMP_REG_MV.U
      csBundle(0).fuType := FuType.i2f.U
      csBundle(0).rfWen := false.B
      csBundle(0).fpWen := true.B
      csBundle(0).vecWen := false.B
      csBundle(0).fpu.isAddSub := false.B
      csBundle(0).fpu.typeTagIn := FPU.D
      csBundle(0).fpu.typeTagOut := FPU.D
      csBundle(0).fpu.fromInt := true.B
      csBundle(0).fpu.wflags := false.B
      csBundle(0).fpu.fpWen := true.B
      csBundle(0).fpu.div := false.B
      csBundle(0).fpu.sqrt := false.B
      csBundle(0).fpu.fcvt := false.B
      switch(simple.io.enq.vtype.vlmul) {
        is("b000".U) {
          genCsBundle_RGATHER_VX(1)
        }
        is("b001".U) {
          genCsBundle_RGATHER_VX(2)
        }
        is("b010".U) {
          genCsBundle_RGATHER_VX(4)
        }
        is("b011".U) {
          genCsBundle_RGATHER_VX(8)
        }
      }
    }

    is(UopSplitType.VEC_RGATHEREI16) {
      /** Variant selected when vsew is all-zero: every (i, j) pair expands to two uops that
        * read src1 + 2i and src1 + 2i + 1 respectively, chained through temporaries
        * 2j and 2j + 1. The first uop of a chain takes dest + i as old value and the last
        * uop writes dest + i.
        *
        * @param len number of registers in the group (1, 2 or 4 at the call sites below)
        */
      def genCsBundle_VEC_RGATHEREI16_SEW8(len: Int): Unit = {
        for (i <- 0 until len)
          for (j <- 0 until len) {
            val vd_old0 = if (j == 0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j * 2 - 1).U
            val vd0 = (VECTOR_TMP_REG_LMUL + j * 2).U
            csBundle((i * len + j) * 2 + 0).lsrc(0) := src1 + (i * 2 + 0).U
            csBundle((i * len + j) * 2 + 0).lsrc(1) := src2 + j.U
            csBundle((i * len + j) * 2 + 0).lsrc(2) := vd_old0
            csBundle((i * len + j) * 2 + 0).ldest := vd0
            csBundle((i * len + j) * 2 + 0).uopIdx := ((i * len + j) * 2 + 0).U
            val vd_old1 = (VECTOR_TMP_REG_LMUL + j * 2).U
            val vd1 = if (j == len - 1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j * 2 + 1).U
            csBundle((i * len + j) * 2 + 1).lsrc(0) := src1 + (i * 2 + 1).U
            csBundle((i * len + j) * 2 + 1).lsrc(1) := src2 + j.U
            csBundle((i * len + j) * 2 + 1).lsrc(2) := vd_old1
            csBundle((i * len + j) * 2 + 1).ldest := vd1
            csBundle((i * len + j) * 2 + 1).uopIdx := ((i * len + j) * 2 + 1).U
          }
      }

      /** Variant for every other vsew: one uop per (i, j) pair, chained through temporaries
        * in the same way as the plain gather expansion.
        *
        * @param len number of registers in the group (1, 2, 4 or 8 at the call sites below)
        */
      def genCsBundle_VEC_RGATHEREI16(len: Int): Unit = {
        for (i <- 0 until len)
          for (j <- 0 until len) {
            val vd_old = if (j == 0) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j - 1).U
            val vd = if (j == len - 1) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j).U
            csBundle(i * len + j).lsrc(0) := src1 + i.U
            csBundle(i * len + j).lsrc(1) := src2 + j.U
            csBundle(i * len + j).lsrc(2) := vd_old
            csBundle(i * len + j).ldest := vd
            csBundle(i * len + j).uopIdx := (i * len + j).U
          }
      }
      switch(simple.io.enq.vtype.vlmul) {
        is("b000".U) {
          when(!simple.io.enq.vtype.vsew.orR) {
            genCsBundle_VEC_RGATHEREI16_SEW8(1)
          }.otherwise {
            genCsBundle_VEC_RGATHEREI16(1)
          }
        }
        is("b001".U) {
          when(!simple.io.enq.vtype.vsew.orR) {
            genCsBundle_VEC_RGATHEREI16_SEW8(2)
          }.otherwise {
            genCsBundle_VEC_RGATHEREI16(2)
          }
        }
        is("b010".U) {
          when(!simple.io.enq.vtype.vsew.orR) {
            genCsBundle_VEC_RGATHEREI16_SEW8(4)
          }.otherwise {
            genCsBundle_VEC_RGATHEREI16(4)
          }
        }
        // b011 has no vsew == 0 variant in this expansion.
        is("b011".U) {
          genCsBundle_VEC_RGATHEREI16(8)
        }
      }
    }

    is(UopSplitType.VEC_COMPRESS) {
      /** Emits the compress expansion. Row i contributes i + 2 uops, or i + 1 for the last
        * row, so row i starts at slot i * (i + 3) / 2. Every uop reads src1 and src2 + i.
        * In the extra uop of a row (j == i + 1), source types 1 and 2 are DontCare and the
        * result goes to temporary 0. In the last row the uops write dest + j directly.
        *
        * @param len number of registers in the group (2, 4 or 8 at the call sites below)
        */
      def genCsBundle_VEC_COMPRESS(len: Int): Unit = {
        for (i <- 0 until len) {
          val jlen = if (i == len - 1) i + 1 else i + 2
          for (j <- 0 until jlen) {
            val vd_old = if (i == j) (dest + i.U) else (VECTOR_TMP_REG_LMUL + j + 1).U
            val vd = if (i == len - 1) (dest + j.U) else {
              if (j == i + 1) VECTOR_TMP_REG_LMUL.U else (VECTOR_TMP_REG_LMUL + j + 1).U
            }
            val src23Type = if (j == i + 1) DontCare else SrcType.vp
            csBundle(i * (i + 3) / 2 + j).srcType(0) := SrcType.vp
            csBundle(i * (i + 3) / 2 + j).srcType(1) := src23Type
            csBundle(i * (i + 3) / 2 + j).srcType(2) := src23Type
            csBundle(i * (i + 3) / 2 + j).lsrc(0) := src1
            csBundle(i * (i + 3) / 2 + j).lsrc(1) := src2 + i.U
            csBundle(i * (i + 3) / 2 + j).lsrc(2) := vd_old
            csBundle(i * (i + 3) / 2 + j).ldest := vd
            csBundle(i * (i + 3) / 2 + j).uopIdx := (i * (i + 3) / 2 + j).U
          }
        }
      }
      switch(simple.io.enq.vtype.vlmul) {
        is("b001".U) {
          genCsBundle_VEC_COMPRESS(2)
        }
        is("b010".U) {
          genCsBundle_VEC_COMPRESS(4)
        }
        is("b011".U) {
          genCsBundle_VEC_COMPRESS(8)
        }
      }
    }

    is(UopSplitType.VEC_US_LD) {
      // Slot 0: FMV.D.X -- i2f unit, integer register source, writes the FP temporary.
      csBundle(0).srcType(0) := SrcType.reg
      csBundle(0).srcType(1) := SrcType.imm
      csBundle(0).lsrc(1) := 0.U
      csBundle(0).ldest := FP_TMP_REG_MV.U
      csBundle(0).fuType := FuType.i2f.U
      csBundle(0).rfWen := false.B
      csBundle(0).fpWen := true.B
      csBundle(0).vecWen := false.B
      csBundle(0).fpu.isAddSub := false.B
      csBundle(0).fpu.typeTagIn := FPU.D
      csBundle(0).fpu.typeTagOut := FPU.D
      csBundle(0).fpu.fromInt := true.B
      csBundle(0).fpu.wflags := false.B
      csBundle(0).fpu.fpWen := true.B
      csBundle(0).fpu.div := false.B
      csBundle(0).fpu.sqrt := false.B
      csBundle(0).fpu.fcvt := false.B
      // Slots 1..MAX_VLMUL: one uop per destination register, each reading the FP temporary.
      for (i <- 0 until MAX_VLMUL) {
        csBundle(i + 1).srcType(0) := SrcType.fp
        csBundle(i + 1).lsrc(0) := FP_TMP_REG_MV.U
        csBundle(i + 1).ldest := dest + i.U
        csBundle(i + 1).uopIdx := i.U
      }
    }
  }

  // ---------------------------------------------------------------------------
  // uop dispatch
  //   s_normal : the uops of the head instruction are issued starting from csBundle(0)
  //   s_ext    : a previous cycle could not issue all uops; issue resumes at
  //              offset numOfUop - uopRes
  // ---------------------------------------------------------------------------
  val s_normal :: s_ext :: Nil = Enum(2)
  val state = RegInit(s_normal)
  val state_next = WireDefault(state)
  // Number of uops of the current instruction that are still to be issued.
  val uopRes = RegInit(0.U)

  // readyFromRename counter.
  // NOTE(review): presumably the index of the first rename port that is NOT ready, or
  // RenameWidth when all are ready -- confirm against PriorityMuxDefault's definition.
  val readyCounter = PriorityMuxDefault(io.readyFromRename.map(x => !x).zip((0 to (RenameWidth - 1)).map(_.U)), RenameWidth.U)

  switch(state) {
    is(s_normal) {
      // Go to s_ext when the head is valid, readyCounter is non-zero, and the
      // instruction has more uops than readyCounter.
      state_next := Mux(io.validFromIBuf(0) && (numOfUop > readyCounter) && (readyCounter =/= 0.U), s_ext, s_normal)
    }
    is(s_ext) {
      // Stay in s_ext while the remaining uops still exceed readyCounter.
      state_next := Mux(io.validFromIBuf(0) && (uopRes > readyCounter), s_ext, s_normal)
    }
  }

  state := state_next

  // Uops outstanding at the start of this cycle.
  val uopRes0 = Mux(state === s_normal, numOfUop, uopRes)
  // True when uops remain after this cycle's issue.
  val uopResJudge = Mux(state === s_normal,
    io.validFromIBuf(0) && (readyCounter =/= 0.U) && (uopRes0 > readyCounter),
    io.validFromIBuf(0) && (uopRes0 > readyCounter))
  uopRes := Mux(uopResJudge, uopRes0 - readyCounter, 0.U)

  for (i <- 0 until RenameWidth) {
    // In s_ext the read window starts at numOfUop - uopRes; out-of-range reads use the
    // last csBundle entry. In every other state the output is csBundle(i).
    decodedInsts(i) := Mux(state === s_ext,
      Mux((i.U + numOfUop - uopRes) < maxUopSize.U, csBundle(i.U + numOfUop - uopRes), csBundle(maxUopSize - 1)),
      csBundle(i))
  }

  // validSimple(k): IBuf entry k + 1 is valid and not flagged complex.
  val validSimple = Wire(Vec(DecodeWidth - 1, Bool()))
  validSimple.zip(io.validFromIBuf.drop(1).zip(io.isComplex)).foreach {
    case (dst, (ibufValid, complexFlag)) => dst := ibufValid && !complexFlag
  }
  // notInf(k): IBuf entry k + 1 is either invalid or a valid simple instruction.
  val notInf = Wire(Vec(DecodeWidth - 1, Bool()))
  notInf.zip(io.validFromIBuf.drop(1).zip(validSimple)).foreach {
    case (dst, (ibufValid, simpleValid)) => dst := !ibufValid || simpleValid
  }
  // notInfVec(0) is true; notInfVec(k) for k >= 1 is the AND of notInf(0) .. notInf(k - 1).
  val notInfVec = Wire(Vec(DecodeWidth, Bool()))
  notInfVec.drop(1).zip(0 until DecodeWidth - 1).foreach {
    case (dst, i) => dst := Cat(notInf.take(i + 1)).andR
  }
  notInfVec(0) := true.B

  // With a valid head and non-zero readyCounter: min(uopRes0, readyCounter); otherwise 1.
  complexNum := Mux(io.validFromIBuf(0) && readyCounter.orR,
    Mux(uopRes0 > readyCounter, readyCounter, uopRes0),
    1.U)

  validToRename.zipWithIndex.foreach {
    case (dst, i) =>
      dst := MuxCase(false.B, Seq(
        // More uops pending than readyCounter: only the first readyCounter outputs are valid.
        (io.validFromIBuf(0) && uopRes0 > readyCounter) -> (readyCounter > i.U),
        // Otherwise the first complexNum outputs are valid unconditionally; later outputs
        // take validSimple/notInfVec at offset i - complexNum, gated by the port's ready.
        (io.validFromIBuf(0) && !(uopRes0 > readyCounter)) -> Mux(complexNum > i.U, true.B, validSimple(i.U - complexNum) && notInfVec(i.U - complexNum) && io.readyFromRename(i))
      ))
  }

  readyToIBuf.zipWithIndex.foreach {
    case (dst, i) =>
      dst := MuxCase(true.B, Seq(
        // Uops of the head instruction remain after this cycle: accept nothing.
        (io.validFromIBuf(0) && uopRes0 > readyCounter) -> false.B,
        // Head completes this cycle: entry 0 is accepted; entry i > 0 is accepted when
        // RenameWidth - complexNum >= i and entry i is a valid simple instruction with
        // notInfVec(i - 1) set and rename port i ready.
        (io.validFromIBuf(0) && !(uopRes0 > readyCounter)) -> (if (i == 0) true.B else Mux(RenameWidth.U - complexNum >= i.U, notInfVec(i - 1) && validSimple(i - 1) && io.readyFromRename(i), false.B))
      ))
  }

  io.deq.decodedInsts := decodedInsts
  io.deq.isVset := isVsetSimple
  io.deq.complexNum := complexNum
  io.deq.validToRename := validToRename
  io.deq.readyToIBuf := readyToIBuf

}