1/*************************************************************************************** 2* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3* Copyright (c) 2020-2021 Peng Cheng Laboratory 4* 5* XiangShan is licensed under Mulan PSL v2. 6* You can use this software according to the terms and conditions of the Mulan PSL v2. 7* You may obtain a copy of Mulan PSL v2 at: 8* http://license.coscl.org.cn/MulanPSL2 9* 10* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13* 14* See the Mulan PSL v2 for more details. 15***************************************************************************************/ 16 17package xiangshan.backend.exu 18 19import org.chipsalliance.cde.config.Parameters 20import chisel3._ 21import chisel3.experimental.hierarchy.{Definition, instantiable} 22import chisel3.util._ 23import freechips.rocketchip.diplomacy.{LazyModule, LazyModuleImp} 24import utility.DelayN 25import utils._ 26import xiangshan.backend.fu.{CSRFileIO, FenceIO, FuncUnitInput} 27import xiangshan.backend.Bundles.{ExuInput, ExuOutput, MemExuInput, MemExuOutput} 28import xiangshan.{FPUCtrlSignals, HasXSParameter, Redirect, XSBundle, XSModule} 29import xiangshan.backend.datapath.WbConfig.{PregWB, _} 30import xiangshan.backend.fu.FuType 31 32class ExeUnitIO(params: ExeUnitParams)(implicit p: Parameters) extends XSBundle { 33 val flush = Flipped(ValidIO(new Redirect())) 34 val in = Flipped(DecoupledIO(new ExuInput(params))) 35 val out = DecoupledIO(new ExuOutput(params)) 36 val csrio = if (params.hasCSR) Some(new CSRFileIO) else None 37 val fenceio = if (params.hasFence) Some(new FenceIO) else None 38 val frm = if (params.needSrcFrm) Some(Input(UInt(3.W))) else None 39} 40 41class ExeUnit(exuParams: ExeUnitParams)(implicit p: Parameters) extends LazyModule { 42 override def shouldBeInlined: Boolean = false 43 44 lazy val module = new ExeUnitImp(this)(p, exuParams) 45} 46 47class ExeUnitImp( 48 override val wrapper: ExeUnit 49)(implicit 50 p: Parameters, exuParams: ExeUnitParams 51) extends LazyModuleImp(wrapper) with HasXSParameter{ 52 private val fuCfgs = exuParams.fuConfigs 53 54 val io = IO(new ExeUnitIO(exuParams)) 55 56 val funcUnit = fuCfgs.map(cfg => { 57 assert(cfg.fuGen != null, cfg.name + "Cfg'fuGen is null !!!") 58 val module = cfg.fuGen(p, cfg) 59 module 60 }) 61 62 val funcUnits = fuCfgs.zip(funcUnit).map{case(cfg, fu) => 63 val clk_en = WireInit(false.B) 64 val fuVld_en = WireInit(false.B) 65 val fuVld_en_reg = RegInit(false.B) 66 val uncer_en_reg = RegInit(false.B) 67 68 val lat0 = FuType.isLat0(io.in.bits.fuType) 69 val latN = FuType.isLatN(io.in.bits.fuType) 70 val uncerLat = FuType.isUncerLat(io.in.bits.fuType) 71 72 def lat: Int = cfg.latency.latencyVal.getOrElse(0) 73 74 val fuVldVec = (io.in.valid && latN) +: Seq.fill(lat)(RegInit(false.B)) 75 val fuRdyVec = Seq.fill(lat)(Wire(Bool())) :+ io.out.ready 76 77 for (i <- 0 until lat) { 78 fuRdyVec(i) := !fuVldVec(i + 1) || fuRdyVec(i + 1) 79 } 80 81 for (i <- 1 to lat) { 82 when(fuRdyVec(i - 1) && fuVldVec(i - 1)) { 83 fuVldVec(i) := fuVldVec(i - 1) 84 }.elsewhen(fuRdyVec(i)) { 85 fuVldVec(i) := false.B 86 } 87 } 88 fuVld_en := fuVldVec.map(v => v).reduce(_ || _) 89 fuVld_en_reg := fuVld_en 90 91 when(uncerLat && io.in.fire) { 92 uncer_en_reg := true.B 93 }.elsewhen(uncerLat && io.out.fire) { 94 uncer_en_reg := false.B 95 } 96 97 when(lat0 && io.in.fire) { 98 clk_en := true.B 99 }.elsewhen(latN && fuVld_en || fuVld_en_reg) { 100 clk_en := true.B 101 }.elsewhen(uncerLat && io.in.fire || uncer_en_reg) { 102 clk_en := true.B 103 } 104 105 if (cfg.ckAlwaysEn) { 106 clk_en := true.B 107 } 108 109 val clk_gate = Module(new ClockGate) 110 clk_gate.io.TE := false.B 111 clk_gate.io.E := clk_en 112 clk_gate.io.CK := clock 113 fu.clock := clk_gate.io.Q 114 fu 115 } 116 117 val busy = RegInit(false.B) 118 val robIdx = RegEnable(io.in.bits.robIdx, io.in.fire) 119 when (io.in.fire && io.in.bits.robIdx.needFlush(io.flush)) { 120 busy := false.B 121 }.elsewhen(busy && robIdx.needFlush(io.flush)){ 122 busy := false.B 123 }.elsewhen(io.out.fire) { 124 busy := false.B 125 }.elsewhen(io.in.fire) { 126 busy := true.B 127 } 128 129 if (exuParams.latencyCertain){ 130 busy := false.B 131 } 132 133 exuParams.wbPortConfigs.map{ 134 x => x match { 135 case IntWB(port, priority) => assert(priority >= 0 && priority <= 2, 136 s"${exuParams.name}: WbPort must priority=0 or priority=1") 137 case VfWB (port, priority) => assert(priority >= 0 && priority <= 2, 138 s"${exuParams.name}: WbPort must priority=0 or priority=1") 139 case _ => 140 } 141 } 142 val intWbPort = exuParams.getIntWBPort 143 if (intWbPort.isDefined){ 144 val sameIntPortExuParam = backendParams.allExuParams.filter(_.getIntWBPort.isDefined) 145 .filter(_.getIntWBPort.get.port == intWbPort.get.port) 146 val samePortOneCertainOneUncertain = sameIntPortExuParam.map(_.latencyCertain).contains(true) && sameIntPortExuParam.map(_.latencyCertain).contains(false) 147 if (samePortOneCertainOneUncertain) sameIntPortExuParam.map(samePort => 148 samePort.wbPortConfigs.map( 149 x => x match { 150 case IntWB(port, priority) => { 151 if (!samePort.latencyCertain) assert(priority == 1, 152 s"${samePort.name}: IntWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=1") 153 else assert(priority == 0, 154 s"${samePort.name}: IntWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=1") 155 } 156 case _ => 157 } 158 ) 159 ) 160 } 161 val vfWbPort = exuParams.getVfWBPort 162 if (vfWbPort.isDefined) { 163 val sameVfPortExuParam = backendParams.allExuParams.filter(_.getVfWBPort.isDefined) 164 .filter(_.getVfWBPort.get.port == vfWbPort.get.port) 165 val samePortOneCertainOneUncertain = sameVfPortExuParam.map(_.latencyCertain).contains(true) && sameVfPortExuParam.map(_.latencyCertain).contains(false) 166 if (samePortOneCertainOneUncertain) sameVfPortExuParam.map(samePort => 167 samePort.wbPortConfigs.map( 168 x => x match { 169 case VfWB(port, priority) => { 170 if (!samePort.latencyCertain) assert(priority == 1, 171 s"${samePort.name}: VfWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=1") 172 else assert(priority == 0, 173 s"${samePort.name}: VfWbPort $port must latencyCertain priority=0 or latencyUnCertain priority=1") 174 } 175 case _ => 176 } 177 ) 178 ) 179 } 180 if(backendParams.debugEn) { 181 dontTouch(io.out.ready) 182 } 183 // rob flush --> funcUnits 184 funcUnits.zipWithIndex.foreach { case (fu, i) => 185 fu.io.flush <> io.flush 186 } 187 188 def acceptCond(input: ExuInput): Seq[Bool] = { 189 input.params.fuConfigs.map(_.fuSel(input)) 190 } 191 192 val in1ToN = Module(new Dispatcher(new ExuInput(exuParams), funcUnits.length, acceptCond)) 193 194 // ExeUnit.in <---> Dispatcher.in 195 in1ToN.io.in.valid := io.in.valid && !busy 196 in1ToN.io.in.bits := io.in.bits 197 io.in.ready := !busy && in1ToN.io.in.ready 198 199 // Dispatcher.out <---> FunctionUnits 200 in1ToN.io.out.zip(funcUnits.map(_.io.in)).foreach { 201 case (source: DecoupledIO[ExuInput], sink: DecoupledIO[FuncUnitInput]) => 202 sink.valid := source.valid 203 source.ready := sink.ready 204 205 sink.bits.data.src.zip(source.bits.src).foreach { case(fuSrc, exuSrc) => fuSrc := exuSrc } 206 sink.bits.data.pc .foreach(x => x := source.bits.pc.get) 207 sink.bits.data.imm := source.bits.imm 208 sink.bits.ctrl.fuOpType := source.bits.fuOpType 209 sink.bits.ctrl.robIdx := source.bits.robIdx 210 sink.bits.ctrl.pdest := source.bits.pdest 211 sink.bits.ctrl.rfWen .foreach(x => x := source.bits.rfWen.get) 212 sink.bits.ctrl.fpWen .foreach(x => x := source.bits.fpWen.get) 213 sink.bits.ctrl.vecWen .foreach(x => x := source.bits.vecWen.get) 214 sink.bits.ctrl.flushPipe .foreach(x => x := source.bits.flushPipe.get) 215 sink.bits.ctrl.preDecode .foreach(x => x := source.bits.preDecode.get) 216 sink.bits.ctrl.ftqIdx .foreach(x => x := source.bits.ftqIdx.get) 217 sink.bits.ctrl.ftqOffset .foreach(x => x := source.bits.ftqOffset.get) 218 sink.bits.ctrl.predictInfo .foreach(x => x := source.bits.predictInfo.get) 219 sink.bits.ctrl.fpu .foreach(x => x := source.bits.fpu.get) 220 sink.bits.ctrl.vpu .foreach(x => x := source.bits.vpu.get) 221 sink.bits.perfDebugInfo := source.bits.perfDebugInfo 222 } 223 224 private val fuOutValidOH = funcUnits.map(_.io.out.valid) 225 XSError(PopCount(fuOutValidOH) > 1.U, p"fuOutValidOH ${Binary(VecInit(fuOutValidOH).asUInt)} should be one-hot)\n") 226 private val fuOutBitsVec = funcUnits.map(_.io.out.bits) 227 private val fuRedirectVec: Seq[Option[ValidIO[Redirect]]] = funcUnits.map(_.io.out.bits.res.redirect) 228 229 // Assume that one fu can only write int or fp or vec, 230 // otherwise, wenVec should be assigned to wen in fu. 231 private val fuIntWenVec = funcUnits.map(x => x.cfg.writeIntRf.B && x.io.out.bits.ctrl.rfWen.getOrElse(false.B)) 232 private val fuFpWenVec = funcUnits.map(x => x.cfg.writeFpRf.B && x.io.out.bits.ctrl.fpWen.getOrElse(false.B)) 233 private val fuVecWenVec = funcUnits.map(x => x.cfg.writeVecRf.B && x.io.out.bits.ctrl.vecWen.getOrElse(false.B)) 234 // FunctionUnits <---> ExeUnit.out 235 io.out.valid := Cat(fuOutValidOH).orR 236 funcUnits.foreach(fu => fu.io.out.ready := io.out.ready) 237 238 // select one fu's result 239 io.out.bits.data := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.res.data)) 240 io.out.bits.robIdx := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.robIdx)) 241 io.out.bits.pdest := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.pdest)) 242 io.out.bits.intWen.foreach(x => x := Mux1H(fuOutValidOH, fuIntWenVec)) 243 io.out.bits.fpWen.foreach(x => x := Mux1H(fuOutValidOH, fuFpWenVec)) 244 io.out.bits.vecWen.foreach(x => x := Mux1H(fuOutValidOH, fuVecWenVec)) 245 io.out.bits.redirect.foreach(x => x := Mux1H((fuOutValidOH zip fuRedirectVec).filter(_._2.isDefined).map(x => (x._1, x._2.get)))) 246 io.out.bits.fflags.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.res.fflags.getOrElse(0.U.asTypeOf(io.out.bits.fflags.get))))) 247 io.out.bits.wflags.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.fpu.getOrElse(0.U.asTypeOf(new FPUCtrlSignals)).wflags))) 248 io.out.bits.vxsat.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.res.vxsat.getOrElse(0.U.asTypeOf(io.out.bits.vxsat.get))))) 249 io.out.bits.exceptionVec.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.exceptionVec.getOrElse(0.U.asTypeOf(io.out.bits.exceptionVec.get))))) 250 io.out.bits.flushPipe.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.flushPipe.getOrElse(0.U.asTypeOf(io.out.bits.flushPipe.get))))) 251 io.out.bits.replay.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.replay.getOrElse(0.U.asTypeOf(io.out.bits.replay.get))))) 252 io.out.bits.predecodeInfo.foreach(x => x := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.ctrl.preDecode.getOrElse(0.U.asTypeOf(io.out.bits.predecodeInfo.get))))) 253 254 io.csrio.foreach(exuio => funcUnits.foreach(fu => fu.io.csrio.foreach{ 255 fuio => 256 exuio <> fuio 257 fuio.exception := DelayN(exuio.exception, 2) 258 })) 259 io.fenceio.foreach(exuio => funcUnits.foreach(fu => fu.io.fenceio.foreach(fuio => fuio <> exuio))) 260 io.frm.foreach(exuio => funcUnits.foreach(fu => fu.io.frm.foreach(fuio => fuio <> exuio))) 261 262 // debug info 263 io.out.bits.debug := 0.U.asTypeOf(io.out.bits.debug) 264 io.out.bits.debug.isPerfCnt := funcUnits.map(_.io.csrio.map(_.isPerfCnt)).map(_.getOrElse(false.B)).reduce(_ || _) 265 io.out.bits.debugInfo := Mux1H(fuOutValidOH, fuOutBitsVec.map(_.perfDebugInfo)) 266} 267 268class DispatcherIO[T <: Data](private val gen: T, n: Int) extends Bundle { 269 val in = Flipped(DecoupledIO(gen)) 270 271 val out = Vec(n, DecoupledIO(gen)) 272} 273 274class Dispatcher[T <: Data](private val gen: T, n: Int, acceptCond: T => Seq[Bool]) 275 (implicit p: Parameters) 276 extends Module { 277 278 val io = IO(new DispatcherIO(gen, n)) 279 280 private val acceptVec: Vec[Bool] = VecInit(acceptCond(io.in.bits)) 281 282 XSError(io.in.valid && PopCount(acceptVec) > 1.U, s"s[ExeUnit] accept vec should no more than 1, ${Binary(acceptVec.asUInt)} ") 283 XSError(io.in.valid && PopCount(acceptVec) === 0.U, "[ExeUnit] there is a inst not dispatched to any fu") 284 285 io.out.zipWithIndex.foreach { case (out, i) => 286 out.valid := acceptVec(i) && io.in.valid 287 out.bits := io.in.bits 288 } 289 290 io.in.ready := Mux1H(acceptVec,io.out.map(_.ready)) 291} 292 293class MemExeUnitIO (implicit p: Parameters) extends XSBundle { 294 val flush = Flipped(ValidIO(new Redirect())) 295 val in = Flipped(DecoupledIO(new MemExuInput())) 296 val out = DecoupledIO(new MemExuOutput()) 297} 298 299class MemExeUnit(exuParams: ExeUnitParams)(implicit p: Parameters) extends XSModule { 300 val io = IO(new MemExeUnitIO) 301 val fu = exuParams.fuConfigs.head.fuGen(p, exuParams.fuConfigs.head) 302 fu.io.flush := io.flush 303 fu.io.in.valid := io.in.valid 304 io.in.ready := fu.io.in.ready 305 306 fu.io.in.bits.ctrl.robIdx := io.in.bits.uop.robIdx 307 fu.io.in.bits.ctrl.pdest := io.in.bits.uop.pdest 308 fu.io.in.bits.ctrl.fuOpType := io.in.bits.uop.fuOpType 309 fu.io.in.bits.data.imm := io.in.bits.uop.imm 310 fu.io.in.bits.data.src.zip(io.in.bits.src).foreach(x => x._1 := x._2) 311 fu.io.in.bits.perfDebugInfo := io.in.bits.uop.debugInfo 312 313 io.out.valid := fu.io.out.valid 314 fu.io.out.ready := io.out.ready 315 316 io.out.bits := 0.U.asTypeOf(io.out.bits) // dontCare other fields 317 io.out.bits.data := fu.io.out.bits.res.data 318 io.out.bits.uop.robIdx := fu.io.out.bits.ctrl.robIdx 319 io.out.bits.uop.pdest := fu.io.out.bits.ctrl.pdest 320 io.out.bits.uop.fuType := io.in.bits.uop.fuType 321 io.out.bits.uop.fuOpType:= io.in.bits.uop.fuOpType 322 io.out.bits.uop.sqIdx := io.in.bits.uop.sqIdx 323 io.out.bits.uop.debugInfo := fu.io.out.bits.perfDebugInfo 324 325 io.out.bits.debug := 0.U.asTypeOf(io.out.bits.debug) 326} 327