package xiangshan.backend.datapath import org.chipsalliance.cde.config.Parameters import chisel3._ import chisel3.util._ import difftest.{DiffFpWriteback, DiffIntWriteback, DiffVecV0Writeback, DiffVecWriteback, DifftestModule} import utility.XSError import xiangshan.backend.BackendParams import xiangshan.backend.Bundles.{ExuOutput, WriteBackBundle} import xiangshan.backend.datapath.DataConfig._ import xiangshan.backend.regfile.RfWritePortWithConfig import xiangshan.{Redirect, XSBundle, XSModule} import xiangshan.SrcType.v0 import xiangshan.backend.fu.vector.Bundles.Vstart class WbArbiterDispatcherIO[T <: Data](private val gen: T, n: Int) extends Bundle { val in = Flipped(DecoupledIO(gen)) val out = Vec(n, DecoupledIO(gen)) } class WbArbiterDispatcher[T <: Data](private val gen: T, n: Int, acceptCond: T => (Seq[Bool], Bool)) (implicit p: Parameters) extends Module { val io = IO(new WbArbiterDispatcherIO(gen, n)) private val acceptVec: Vec[Bool] = VecInit(acceptCond(io.in.bits)._1) XSError(io.in.valid && PopCount(acceptVec) > 1.U, p"[ExeUnit] accept vec should no more than 1, ${Binary(acceptVec.asUInt)} ") io.out.zipWithIndex.foreach { case (out, i) => out.valid := acceptVec(i) && io.in.valid out.bits := io.in.bits } io.in.ready := Cat(io.out.zip(acceptVec).map{ case(out, canAccept) => out.ready && canAccept}).orR || acceptCond(io.in.bits)._2 } class WbArbiterIO()(implicit p: Parameters, params: WbArbiterParams) extends XSBundle { val flush = Flipped(ValidIO(new Redirect)) val in: MixedVec[DecoupledIO[WriteBackBundle]] = Flipped(params.genInput) val out: MixedVec[ValidIO[WriteBackBundle]] = params.genOutput def inGroup: Map[Int, Seq[DecoupledIO[WriteBackBundle]]] = in.groupBy(_.bits.params.port).map(x => (x._1, x._2.sortBy(_.bits.params.priority).toSeq)) } class RealWBCollideChecker(params: WbArbiterParams)(implicit p: Parameters) extends XSModule { val io = IO(new WbArbiterIO()(p, params)) private val inGroup: Map[Int, Seq[DecoupledIO[WriteBackBundle]]] = io.inGroup private val arbiters: Seq[Option[RealWBArbiter[WriteBackBundle]]] = Seq.tabulate(params.numOut) { x => { if (inGroup.contains(x)) { Some(Module(new RealWBArbiter(new WriteBackBundle(inGroup.values.head.head.bits.params, backendParams), inGroup(x).length))) } else { None } }} arbiters.zipWithIndex.foreach { case (arb, i) => if (arb.nonEmpty) { arb.get.io.in.zip(inGroup(i)).foreach { case (arbIn, wbIn) => arbIn <> wbIn } } } io.out.zip(arbiters).foreach { case (wbOut, arb) => if (arb.nonEmpty) { val arbOut = arb.get.io.out arbOut.ready := true.B wbOut.valid := arbOut.valid wbOut.bits := arbOut.bits } else { wbOut := 0.U.asTypeOf(wbOut) } } def getInOutMap: Map[Int, Int] = { (params.wbCfgs.indices zip params.wbCfgs.map(_.port)).toMap } } class WbDataPathIO()(implicit p: Parameters, params: BackendParams) extends XSBundle { val flush = Flipped(ValidIO(new Redirect())) val fromTop = new Bundle { val hartId = Input(UInt(8.W)) } val fromIntExu: MixedVec[MixedVec[DecoupledIO[ExuOutput]]] = Flipped(params.intSchdParams.get.genExuOutputDecoupledBundle) val fromFpExu: MixedVec[MixedVec[DecoupledIO[ExuOutput]]] = Flipped(params.fpSchdParams.get.genExuOutputDecoupledBundle) val fromVfExu: MixedVec[MixedVec[DecoupledIO[ExuOutput]]] = Flipped(params.vfSchdParams.get.genExuOutputDecoupledBundle) val fromMemExu: MixedVec[MixedVec[DecoupledIO[ExuOutput]]] = Flipped(params.memSchdParams.get.genExuOutputDecoupledBundle) val fromCSR = Input(new Bundle { val vstart = Vstart() }) val toIntPreg = Flipped(MixedVec(Vec(params.numPregWb(IntData()), new RfWritePortWithConfig(params.intPregParams.dataCfg, params.intPregParams.addrWidth)))) val toFpPreg = Flipped(MixedVec(Vec(params.numPregWb(FpData()), new RfWritePortWithConfig(params.fpPregParams.dataCfg, params.fpPregParams.addrWidth)))) val toVfPreg = Flipped(MixedVec(Vec(params.numPregWb(VecData()), new RfWritePortWithConfig(params.vfPregParams.dataCfg, params.vfPregParams.addrWidth)))) val toV0Preg = Flipped(MixedVec(Vec(params.numPregWb(V0Data()), new RfWritePortWithConfig(params.v0PregParams.dataCfg, params.v0PregParams.addrWidth)))) val toVlPreg = Flipped(MixedVec(Vec(params.numPregWb(VlData()), new RfWritePortWithConfig(params.vlPregParams.dataCfg, params.vlPregParams.addrWidth)))) val toCtrlBlock = new Bundle { val writeback: MixedVec[ValidIO[ExuOutput]] = params.genWrite2CtrlBundles } } class WbDataPath(params: BackendParams)(implicit p: Parameters) extends XSModule { val io = IO(new WbDataPathIO()(p, params)) // split val fromExuPre = collection.mutable.Seq() ++ (io.fromIntExu ++ io.fromFpExu ++ io.fromVfExu ++ io.fromMemExu).flatten val fromExuVld: Seq[DecoupledIO[ExuOutput]] = fromExuPre.filter(_.bits.params.hasVLoadFu).toSeq val vldMgu: Seq[VldMergeUnit] = fromExuVld.map(x => Module(new VldMergeUnit(x.bits.params))) vldMgu.zip(fromExuVld).foreach{ case (mgu, exu) => mgu.io.flush := io.flush mgu.io.writeback <> exu // Since xs will flush pipe, when vstart is not 0 and execute vector mem inst, the value of vstart in CSR is the // first element of this vector instruction. When exception occurs, the vstart in writeback bundle is the new one, // So this vstart should never be used as the beginning of vector mem operation. mgu.io.writeback.bits.vls.get.vpu.vstart := io.fromCSR.vstart } val wbReplaceVld = fromExuPre val vldIdx: Seq[Int] = vldMgu.map(x => fromExuPre.indexWhere(_.bits.params == x.params)) println("vldIdx: " + vldIdx) vldIdx.zip(vldMgu).foreach{ case (id, wb) => wbReplaceVld.update(id, wb.io.writebackAfterMerge) } val fromExu = Wire(chiselTypeOf(MixedVecInit(wbReplaceVld.toSeq))) // io.fromExuPre ------------------------------------------------------------> fromExu // \ / // -> vldMgu.io.writeback -> vldMgu.io.writebackAfterMerge / (fromExu zip wbReplaceVld).foreach { case (sink, source) => sink.valid := source.valid sink.bits := source.bits source.ready := sink.ready } // fromExu -> ArbiterInput val intArbiterInputsWire = Wire(chiselTypeOf(fromExu)) val intArbiterInputsWireY = intArbiterInputsWire.filter(_.bits.params.writeIntRf) val intArbiterInputsWireN = intArbiterInputsWire.filterNot(_.bits.params.writeIntRf) val fpArbiterInputsWire = Wire(chiselTypeOf(fromExu)) val fpArbiterInputsWireY = fpArbiterInputsWire.filter(_.bits.params.writeFpRf) val fpArbiterInputsWireN = fpArbiterInputsWire.filterNot(_.bits.params.writeFpRf) val vfArbiterInputsWire = Wire(chiselTypeOf(fromExu)) val vfArbiterInputsWireY = vfArbiterInputsWire.filter(_.bits.params.writeVfRf) val vfArbiterInputsWireN = vfArbiterInputsWire.filterNot(_.bits.params.writeVfRf) val v0ArbiterInputsWire = Wire(chiselTypeOf(fromExu)) val v0ArbiterInputsWireY = v0ArbiterInputsWire.filter(_.bits.params.writeV0Rf) val v0ArbiterInputsWireN = v0ArbiterInputsWire.filterNot(_.bits.params.writeV0Rf) val vlArbiterInputsWire = Wire(chiselTypeOf(fromExu)) val vlArbiterInputsWireY = vlArbiterInputsWire.filter(_.bits.params.writeVlRf) val vlArbiterInputsWireN = vlArbiterInputsWire.filterNot(_.bits.params.writeVlRf) def acceptCond(exuOutput: ExuOutput): (Seq[Bool], Bool) = { val intWen = exuOutput.intWen.getOrElse(false.B) val fpwen = exuOutput.fpWen.getOrElse(false.B) val vecWen = exuOutput.vecWen.getOrElse(false.B) val v0Wen = exuOutput.v0Wen.getOrElse(false.B) val vlWen = exuOutput.vlWen.getOrElse(false.B) (Seq(intWen, fpwen, vecWen, v0Wen, vlWen), !intWen && !fpwen && !vecWen && !v0Wen && !vlWen) } intArbiterInputsWire.zip(fpArbiterInputsWire).zip(vfArbiterInputsWire).zip(v0ArbiterInputsWire).zip(vlArbiterInputsWire).zip(fromExu).foreach { case (((((intArbiterInput, fpArbiterInput), vfArbiterInput), v0ArbiterInput), vlArbiterInput), exuOut) => val writeCond = acceptCond(exuOut.bits) val intWrite = Wire(Bool()) val fpWrite = Wire(Bool()) val vfWrite = Wire(Bool()) val v0Write = Wire(Bool()) val vlWrite = Wire(Bool()) val notWrite = Wire(Bool()) intWrite := exuOut.valid && writeCond._1(0) fpWrite := exuOut.valid && writeCond._1(1) vfWrite := exuOut.valid && writeCond._1(2) v0Write := exuOut.valid && writeCond._1(3) vlWrite := exuOut.valid && writeCond._1(4) notWrite := writeCond._2 intArbiterInput.valid := intWrite intArbiterInput.bits := exuOut.bits fpArbiterInput.valid := fpWrite fpArbiterInput.bits := exuOut.bits vfArbiterInput.valid := vfWrite vfArbiterInput.bits := exuOut.bits v0ArbiterInput.valid := v0Write v0ArbiterInput.bits := exuOut.bits vlArbiterInput.valid := vlWrite vlArbiterInput.bits := exuOut.bits if (exuOut.bits.params.writeIntRf && exuOut.bits.params.isVfExeUnit) { intWrite := RegNext(exuOut.valid && writeCond._1(0)) intArbiterInput.bits := RegEnable(exuOut.bits, exuOut.valid) } println(s"[WbDataPath] exu: ${exuOut.bits.params.exuIdx}, uncertain: ${exuOut.bits.params.hasUncertainLatency}, certain: ${exuOut.bits.params.latencyCertain}") // only EXUs with uncertain latency need result of arbiter // the result data can be maintained until getting success in arbiter if (exuOut.bits.params.hasUncertainLatency) { exuOut.ready := intArbiterInput.ready && intWrite || fpArbiterInput.ready && fpWrite || vfArbiterInput.ready && vfWrite || v0ArbiterInput.ready && v0Write || vlArbiterInput.ready && vlWrite || notWrite } else { exuOut.ready := true.B // for EXUs with certain latency, if the request fails in arbiter, the result data will be permanently lost when (intWrite) { assert(intArbiterInput.ready, s"exu ${exuOut.bits.params.exuIdx} failed to write int regfile\n") } when(fpWrite) { assert(fpArbiterInput.ready, s"exu ${exuOut.bits.params.exuIdx} failed to write fp regfile\n") } when (vfWrite) { assert(vfArbiterInput.ready, s"exu ${exuOut.bits.params.exuIdx} failed to write vf regfile\n") } when (v0Write) { assert(v0ArbiterInput.ready, s"exu ${exuOut.bits.params.exuIdx} failed to write v0 regfile\n") } when (vlWrite) { assert(vlArbiterInput.ready, s"exu ${exuOut.bits.params.exuIdx} failed to write vl regfile\n") } } // the ports not writting back pregs are always ready // the ports set highest priority are always ready if (exuOut.bits.params.hasNoDataWB || exuOut.bits.params.isHighestWBPriority) { exuOut.ready := true.B } } intArbiterInputsWireN.foreach(_.ready := false.B) fpArbiterInputsWireN.foreach(_.ready := false.B) vfArbiterInputsWireN.foreach(_.ready := false.B) v0ArbiterInputsWireN.foreach(_.ready := false.B) vlArbiterInputsWireN.foreach(_.ready := false.B) println(s"[WbDataPath] write int preg: " + s"IntExu(${io.fromIntExu.flatten.count(_.bits.params.writeIntRf)}) " + s"FpExu(${io.fromFpExu.flatten.count(_.bits.params.writeIntRf)}) " + s"VfExu(${io.fromVfExu.flatten.count(_.bits.params.writeIntRf)}) " + s"MemExu(${io.fromMemExu.flatten.count(_.bits.params.writeIntRf)})" ) println(s"[WbDataPath] write fp preg: " + s"IntExu(${io.fromIntExu.flatten.count(_.bits.params.writeFpRf)}) " + s"FpExu(${io.fromFpExu.flatten.count(_.bits.params.writeFpRf)}) " + s"VfExu(${io.fromVfExu.flatten.count(_.bits.params.writeFpRf)}) " + s"MemExu(${io.fromMemExu.flatten.count(_.bits.params.writeFpRf)})" ) println(s"[WbDataPath] write vf preg: " + s"IntExu(${io.fromIntExu.flatten.count(_.bits.params.writeVfRf)}) " + s"FpExu(${io.fromFpExu.flatten.count(_.bits.params.writeVfRf)}) " + s"VfExu(${io.fromVfExu.flatten.count(_.bits.params.writeVfRf)}) " + s"MemExu(${io.fromMemExu.flatten.count(_.bits.params.writeVfRf)})" ) println(s"[WbDataPath] write v0 preg: " + s"IntExu(${io.fromIntExu.flatten.count(_.bits.params.writeV0Rf)}) " + s"FpExu(${io.fromFpExu.flatten.count(_.bits.params.writeV0Rf)}) " + s"VfExu(${io.fromVfExu.flatten.count(_.bits.params.writeV0Rf)}) " + s"MemExu(${io.fromMemExu.flatten.count(_.bits.params.writeV0Rf)})" ) println(s"[WbDataPath] write vl preg: " + s"IntExu(${io.fromIntExu.flatten.count(_.bits.params.writeVlRf)}) " + s"FpExu(${io.fromFpExu.flatten.count(_.bits.params.writeVlRf)}) " + s"VfExu(${io.fromVfExu.flatten.count(_.bits.params.writeVlRf)}) " + s"MemExu(${io.fromMemExu.flatten.count(_.bits.params.writeVlRf)})" ) // wb arbiter private val intWbArbiter = Module(new RealWBCollideChecker(params.getIntWbArbiterParams)) private val fpWbArbiter = Module(new RealWBCollideChecker(params.getFpWbArbiterParams)) private val vfWbArbiter = Module(new RealWBCollideChecker(params.getVfWbArbiterParams)) private val v0WbArbiter = Module(new RealWBCollideChecker(params.getV0WbArbiterParams)) private val vlWbArbiter = Module(new RealWBCollideChecker(params.getVlWbArbiterParams)) println(s"[WbDataPath] int preg write back port num: ${intWbArbiter.io.out.size}, active port: ${intWbArbiter.io.inGroup.keys.toSeq.sorted}") println(s"[WbDataPath] fp preg write back port num: ${fpWbArbiter.io.out.size}, active port: ${fpWbArbiter.io.inGroup.keys.toSeq.sorted}") println(s"[WbDataPath] vf preg write back port num: ${vfWbArbiter.io.out.size}, active port: ${vfWbArbiter.io.inGroup.keys.toSeq.sorted}") println(s"[WbDataPath] v0 preg write back port num: ${v0WbArbiter.io.out.size}, active port: ${v0WbArbiter.io.inGroup.keys.toSeq.sorted}") println(s"[WbDataPath] vl preg write back port num: ${vlWbArbiter.io.out.size}, active port: ${vlWbArbiter.io.inGroup.keys.toSeq.sorted}") // module assign intWbArbiter.io.flush <> io.flush require(intWbArbiter.io.in.size == intArbiterInputsWireY.size, s"intWbArbiter input size: ${intWbArbiter.io.in.size}, all int wb size: ${intArbiterInputsWireY.size}") intWbArbiter.io.in.zip(intArbiterInputsWireY).foreach { case (arbiterIn, in) => arbiterIn.valid := in.valid && in.bits.intWen.get in.ready := arbiterIn.ready arbiterIn.bits.fromExuOutput(in.bits, "int") } private val intWbArbiterOut = intWbArbiter.io.out fpWbArbiter.io.flush <> io.flush require(fpWbArbiter.io.in.size == fpArbiterInputsWireY.size, s"fpWbArbiter input size: ${fpWbArbiter.io.in.size}, all fp wb size: ${fpArbiterInputsWireY.size}") fpWbArbiter.io.in.zip(fpArbiterInputsWireY).foreach { case (arbiterIn, in) => arbiterIn.valid := in.valid && (in.bits.fpWen.getOrElse(false.B)) in.ready := arbiterIn.ready arbiterIn.bits.fromExuOutput(in.bits, "fp") } private val fpWbArbiterOut = fpWbArbiter.io.out vfWbArbiter.io.flush <> io.flush require(vfWbArbiter.io.in.size == vfArbiterInputsWireY.size, s"vfWbArbiter input size: ${vfWbArbiter.io.in.size}, all vf wb size: ${vfArbiterInputsWireY.size}") vfWbArbiter.io.in.zip(vfArbiterInputsWireY).foreach { case (arbiterIn, in) => arbiterIn.valid := in.valid && (in.bits.vecWen.getOrElse(false.B)) in.ready := arbiterIn.ready arbiterIn.bits.fromExuOutput(in.bits, "vf") } private val vfWbArbiterOut = vfWbArbiter.io.out v0WbArbiter.io.flush <> io.flush require(v0WbArbiter.io.in.size == v0ArbiterInputsWireY.size, s"v0WbArbiter input size: ${v0WbArbiter.io.in.size}, all v0 wb size: ${v0ArbiterInputsWireY.size}") v0WbArbiter.io.in.zip(v0ArbiterInputsWireY).foreach { case (arbiterIn, in) => arbiterIn.valid := in.valid && (in.bits.v0Wen.getOrElse(false.B)) in.ready := arbiterIn.ready arbiterIn.bits.fromExuOutput(in.bits, "v0") } private val v0WbArbiterOut = v0WbArbiter.io.out vlWbArbiter.io.flush <> io.flush require(vlWbArbiter.io.in.size == vlArbiterInputsWireY.size, s"vlWbArbiter input size: ${vlWbArbiter.io.in.size}, all vl wb size: ${vlArbiterInputsWireY.size}") vlWbArbiter.io.in.zip(vlArbiterInputsWireY).foreach { case (arbiterIn, in) => arbiterIn.valid := in.valid && (in.bits.vlWen.getOrElse(false.B)) in.ready := arbiterIn.ready arbiterIn.bits.fromExuOutput(in.bits, "vl") } private val vlWbArbiterOut = vlWbArbiter.io.out // WB -> CtrlBlock private val intExuInputs = io.fromIntExu.flatten.toSeq private val intExuWBs = WireInit(MixedVecInit(intExuInputs)) private val fpExuInputs = io.fromFpExu.flatten.toSeq private val fpExuWBs = WireInit(MixedVecInit(fpExuInputs)) private val vfExuInputs = io.fromVfExu.flatten.toSeq private val vfExuWBs = WireInit(MixedVecInit(vfExuInputs)) private val memExuInputs = io.fromMemExu.flatten.toSeq private val memExuWBs = WireInit(MixedVecInit(memExuInputs)) // only fired port can write back to ctrl block (intExuWBs zip intExuInputs).foreach { case (wb, input) => wb.valid := input.fire } (fpExuWBs zip fpExuInputs).foreach { case (wb, input) => wb.valid := input.fire } (vfExuWBs zip vfExuInputs).foreach { case (wb, input) => wb.valid := input.fire } (memExuWBs zip memExuInputs).foreach { case (wb, input) => wb.valid := input.fire } // io assign private val toIntPreg: MixedVec[RfWritePortWithConfig] = MixedVecInit(intWbArbiterOut.map(x => x.bits.asIntRfWriteBundle(x.fire)).toSeq) private val toFpPreg: MixedVec[RfWritePortWithConfig] = MixedVecInit(fpWbArbiterOut.map(x => x.bits.asFpRfWriteBundle(x.fire)).toSeq) private val toVfPreg: MixedVec[RfWritePortWithConfig] = MixedVecInit(vfWbArbiterOut.map(x => x.bits.asVfRfWriteBundle(x.fire)).toSeq) private val toV0Preg: MixedVec[RfWritePortWithConfig] = MixedVecInit(v0WbArbiterOut.map(x => x.bits.asV0RfWriteBundle(x.fire)).toSeq) private val toVlPreg: MixedVec[RfWritePortWithConfig] = MixedVecInit(vlWbArbiterOut.map(x => x.bits.asVlRfWriteBundle(x.fire)).toSeq) private val wb2Ctrl = intExuWBs ++ fpExuWBs ++ vfExuWBs ++ memExuWBs io.toIntPreg := toIntPreg io.toFpPreg := toFpPreg io.toVfPreg := toVfPreg io.toV0Preg := toV0Preg io.toVlPreg := toVlPreg io.toCtrlBlock.writeback.zip(wb2Ctrl).foreach { case (sink, source) => sink.valid := source.valid sink.bits := source.bits source.ready := true.B } // debug if(backendParams.debugEn) { dontTouch(intArbiterInputsWire) dontTouch(fpArbiterInputsWire) dontTouch(vfArbiterInputsWire) dontTouch(v0ArbiterInputsWire) dontTouch(vlArbiterInputsWire) } // difftest if (env.EnableDifftest || env.AlwaysBasicDiff) { intWbArbiterOut.foreach(out => { val difftest = DifftestModule(new DiffIntWriteback(IntPhyRegs)) difftest.coreid := io.fromTop.hartId difftest.valid := out.fire && out.bits.rfWen difftest.address := out.bits.pdest difftest.data := out.bits.data }) } if (env.EnableDifftest || env.AlwaysBasicDiff) { fpWbArbiterOut.foreach(out => { val difftest = DifftestModule(new DiffFpWriteback(FpPhyRegs)) difftest.coreid := io.fromTop.hartId difftest.valid := out.fire // all fp instr will write fp rf difftest.address := out.bits.pdest difftest.data := out.bits.data }) } if (env.EnableDifftest || env.AlwaysBasicDiff) { vfWbArbiterOut.foreach(out => { val difftest = DifftestModule(new DiffVecWriteback(VfPhyRegs)) difftest.coreid := io.fromTop.hartId difftest.valid := out.fire difftest.address := out.bits.pdest difftest.data(0) := out.bits.data(63, 0) difftest.data(1) := out.bits.data(127, 64) }) } if (env.EnableDifftest || env.AlwaysBasicDiff) { v0WbArbiterOut.foreach(out => { val difftest = DifftestModule(new DiffVecV0Writeback(V0PhyRegs)) difftest.coreid := io.fromTop.hartId difftest.valid := out.fire difftest.address := out.bits.pdest difftest.data(0) := out.bits.data(63, 0) difftest.data(1) := out.bits.data(127, 64) }) } }