xref: /XiangShan/src/main/scala/xiangshan/backend/CtrlBlock.scala (revision d8a66f7ecacc2b3538a1083b0716b7066c77ba3f)
1package xiangshan.backend
2
3import chisel3._
4import chisel3.util._
5import utils._
6import xiangshan._
7import xiangshan.backend.decode.{DecodeStage, ImmUnion}
8import xiangshan.backend.rename.{BusyTable, Rename}
9import xiangshan.backend.dispatch.Dispatch
10import xiangshan.backend.exu._
11import xiangshan.backend.exu.Exu.exuConfigs
12import xiangshan.backend.ftq.{Ftq, FtqRead, GetPcByFtq}
13import xiangshan.backend.regfile.RfReadPort
14import xiangshan.backend.roq.{Roq, RoqCSRIO, RoqLsqIO, RoqPtr}
15import xiangshan.mem.LsqEnqIO
16
17class CtrlToIntBlockIO extends XSBundle {
18  val enqIqCtrl = Vec(exuParameters.IntExuCnt, DecoupledIO(new MicroOp))
19  val readRf = Vec(NRIntReadPorts, Output(UInt(PhyRegIdxWidth.W)))
20  val jumpPc = Output(UInt(VAddrBits.W))
21  val jalr_target = Output(UInt(VAddrBits.W))
22  // int block only uses port 0~7
23  val readPortIndex = Vec(exuParameters.IntExuCnt, Output(UInt(log2Ceil(8 / 2).W))) // TODO parameterize 8 here
24  val redirect = ValidIO(new Redirect)
25  val flush = Output(Bool())
26}
27
28class CtrlToFpBlockIO extends XSBundle {
29  val enqIqCtrl = Vec(exuParameters.FpExuCnt, DecoupledIO(new MicroOp))
30  val readRf = Vec(NRFpReadPorts, Output(UInt(PhyRegIdxWidth.W)))
31  // fp block uses port 0~11
32  val readPortIndex = Vec(exuParameters.FpExuCnt, Output(UInt(log2Ceil((NRFpReadPorts - exuParameters.StuCnt) / 3).W)))
33  val redirect = ValidIO(new Redirect)
34  val flush = Output(Bool())
35}
36
37class CtrlToLsBlockIO extends XSBundle {
38  val enqIqCtrl = Vec(exuParameters.LsExuCnt, DecoupledIO(new MicroOp))
39  val enqLsq = Flipped(new LsqEnqIO)
40  val redirect = ValidIO(new Redirect)
41  val flush = Output(Bool())
42}
43
44class RedirectGenerator extends XSModule with HasCircularQueuePtrHelper {
45  val io = IO(new Bundle() {
46    val loadRelay = Flipped(ValidIO(new Redirect))
47    val exuMispredict = Vec(exuParameters.JmpCnt + exuParameters.AluCnt, Flipped(ValidIO(new ExuOutput)))
48    val flush = Input(Bool())
49    val stage2FtqRead = new FtqRead
50    val stage2Redirect = ValidIO(new Redirect)
51    val stage3Redirect = ValidIO(new Redirect)
52  })
53  /*
54        LoadQueue  Jump  ALU0  ALU1  ALU2  ALU3   exception    Stage1
55          |         |      |    |     |     |         |
56          |============= reg & compare =====|         |       ========
57                            |                         |
58                            |                         |
59                            |                         |        Stage2
60                            |                         |
61                    redirect (flush backend)          |
62                    |                                 |
63               === reg ===                            |       ========
64                    |                                 |
65                    |----- mux (exception first) -----|        Stage3
66                            |
67                redirect (send to frontend)
68   */
69  def selectOlderRedirect(x: Valid[Redirect], y: Valid[Redirect]): Valid[Redirect] = {
70    Mux(x.valid,
71      Mux(y.valid,
72        Mux(isAfter(x.bits.roqIdx, y.bits.roqIdx), y, x),
73        x
74      ),
75      y
76    )
77  }
78  def selectOlderExuOutWithFlag(x: Valid[ExuOutput], y: Valid[ExuOutput]): (Valid[ExuOutput], Bool) = {
79    val yIsOlder = Mux(x.valid,
80      Mux(y.valid,
81        Mux(isAfter(x.bits.redirect.roqIdx, y.bits.redirect.roqIdx), true.B, false.B),
82        false.B
83      ),
84      true.B
85    )
86    val sel = Mux(yIsOlder, y, x)
87    (sel, yIsOlder)
88  }
89  def selectOlderExuOut(x: Valid[ExuOutput], y: Valid[ExuOutput]): Valid[ExuOutput] = {
90    selectOlderExuOutWithFlag(x, y)._1
91  }
92  val jumpOut = io.exuMispredict.head
93  val oldestAluOut = ParallelOperation(io.exuMispredict.tail, selectOlderExuOut)
94  val (oldestExuOut, jumpIsOlder) = selectOlderExuOutWithFlag(oldestAluOut, jumpOut) // select between jump and alu
95
96  val oldestMispredict = selectOlderRedirect(io.loadRelay, {
97    val redirect = Wire(Valid(new Redirect))
98    redirect.valid := oldestExuOut.valid
99    redirect.bits := oldestExuOut.bits.redirect
100    redirect
101  })
102
103  XSDebug(oldestExuOut.valid, p"exuMispredict: ${Binary(Cat(io.exuMispredict.map(_.valid)))}\n")
104
105  val s1_isJump = RegNext(jumpIsOlder, init = false.B)
106  val s1_jumpTarget = RegEnable(jumpOut.bits.redirect.cfiUpdate.target, jumpOut.valid)
107  val s1_imm12_reg = RegEnable(oldestExuOut.bits.uop.ctrl.imm(11, 0), oldestExuOut.valid)
108  val s1_pd = RegEnable(oldestExuOut.bits.uop.cf.pd, oldestExuOut.valid)
109  val s1_redirect_bits_reg = Reg(new Redirect)
110  val s1_redirect_valid_reg = RegInit(false.B)
111
112  // stage1 -> stage2
113  when(oldestMispredict.valid && !oldestMispredict.bits.roqIdx.needFlush(io.stage2Redirect, io.flush)){
114    s1_redirect_bits_reg := oldestMispredict.bits
115    s1_redirect_valid_reg := true.B
116  }.otherwise({
117    s1_redirect_valid_reg := false.B
118  })
119  io.stage2Redirect.valid := s1_redirect_valid_reg && !io.flush
120  io.stage2Redirect.bits := s1_redirect_bits_reg
121  io.stage2Redirect.bits.cfiUpdate := DontCare
122  // at stage2, we read ftq to get pc
123  io.stage2FtqRead.ptr := s1_redirect_bits_reg.ftqIdx
124
125  // stage3, calculate redirect target
126  val s2_isJump = RegNext(s1_isJump)
127  val s2_jumpTarget = RegEnable(s1_jumpTarget, s1_redirect_valid_reg)
128  val s2_imm12_reg = RegEnable(s1_imm12_reg, s1_redirect_valid_reg)
129  val s2_pd = RegEnable(s1_pd, s1_redirect_valid_reg)
130  val s2_redirect_bits_reg = RegEnable(s1_redirect_bits_reg, enable = s1_redirect_valid_reg)
131  val s2_redirect_valid_reg = RegNext(s1_redirect_valid_reg && !io.flush, init = false.B)
132
133  val ftqRead = io.stage2FtqRead.entry
134  val cfiUpdate_pc =
135    Cat(ftqRead.ftqPC.head(VAddrBits - s2_redirect_bits_reg.ftqOffset.getWidth - instOffsetBits),
136        s2_redirect_bits_reg.ftqOffset,
137        0.U(instOffsetBits.W))
138  val real_pc =
139    GetPcByFtq(ftqRead.ftqPC, s2_redirect_bits_reg.ftqOffset,
140               ftqRead.lastPacketPC.valid,
141               ftqRead.lastPacketPC.bits)
142  val brTarget = real_pc + SignExt(ImmUnion.B.toImm32(s2_imm12_reg), XLEN)
143  val snpc = real_pc + Mux(s2_pd.isRVC, 2.U, 4.U)
144  val isReplay = RedirectLevel.flushItself(s2_redirect_bits_reg.level)
145  val target = Mux(isReplay,
146    real_pc, // repaly from itself
147    Mux(s2_redirect_bits_reg.cfiUpdate.taken,
148      Mux(s2_isJump, s2_jumpTarget, brTarget),
149      snpc
150    )
151  )
152  io.stage3Redirect.valid := s2_redirect_valid_reg
153  io.stage3Redirect.bits := s2_redirect_bits_reg
154  val stage3CfiUpdate = io.stage3Redirect.bits.cfiUpdate
155  stage3CfiUpdate.pc := cfiUpdate_pc
156  stage3CfiUpdate.pd := s2_pd
157  stage3CfiUpdate.rasSp := ftqRead.rasSp
158  stage3CfiUpdate.rasEntry := ftqRead.rasTop
159  stage3CfiUpdate.hist := ftqRead.hist
160  stage3CfiUpdate.predHist := ftqRead.predHist
161  stage3CfiUpdate.specCnt := ftqRead.specCnt(s2_redirect_bits_reg.ftqOffset)
162  stage3CfiUpdate.predTaken := s2_redirect_bits_reg.cfiUpdate.predTaken
163  stage3CfiUpdate.sawNotTakenBranch := VecInit((0 until PredictWidth).map{ i =>
164    if(i == 0) false.B else Cat(ftqRead.br_mask.take(i)).orR()
165  })(s2_redirect_bits_reg.ftqOffset)
166  stage3CfiUpdate.target := target
167  stage3CfiUpdate.taken := s2_redirect_bits_reg.cfiUpdate.taken
168  stage3CfiUpdate.isMisPred := s2_redirect_bits_reg.cfiUpdate.isMisPred
169}
170
171class CtrlBlock extends XSModule with HasCircularQueuePtrHelper {
172  val io = IO(new Bundle {
173    val frontend = Flipped(new FrontendToBackendIO)
174    val fromIntBlock = Flipped(new IntBlockToCtrlIO)
175    val fromFpBlock = Flipped(new FpBlockToCtrlIO)
176    val fromLsBlock = Flipped(new LsBlockToCtrlIO)
177    val toIntBlock = new CtrlToIntBlockIO
178    val toFpBlock = new CtrlToFpBlockIO
179    val toLsBlock = new CtrlToLsBlockIO
180    val roqio = new Bundle {
181      // to int block
182      val toCSR = new RoqCSRIO
183      val exception = ValidIO(new ExceptionInfo)
184      // to mem block
185      val lsq = new RoqLsqIO
186    }
187  })
188
189  val difftestIO = IO(new Bundle() {
190    val fromRoq = new Bundle() {
191      val commit = Output(UInt(32.W))
192      val thisPC = Output(UInt(XLEN.W))
193      val thisINST = Output(UInt(32.W))
194      val skip = Output(UInt(32.W))
195      val wen = Output(UInt(32.W))
196      val wdata = Output(Vec(CommitWidth, UInt(XLEN.W))) // set difftest width to 6
197      val wdst = Output(Vec(CommitWidth, UInt(32.W))) // set difftest width to 6
198      val wpc = Output(Vec(CommitWidth, UInt(XLEN.W))) // set difftest width to 6
199      val isRVC = Output(UInt(32.W))
200      val scFailed = Output(Bool())
201    }
202  })
203  difftestIO <> DontCare
204
205  val ftq = Module(new Ftq)
206  val trapIO = IO(new TrapIO())
207  trapIO <> DontCare
208
209  val decode = Module(new DecodeStage)
210  val rename = Module(new Rename)
211  val dispatch = Module(new Dispatch)
212  val intBusyTable = Module(new BusyTable(NRIntReadPorts, NRIntWritePorts))
213  val fpBusyTable = Module(new BusyTable(NRFpReadPorts, NRFpWritePorts))
214  val redirectGen = Module(new RedirectGenerator)
215
216  val roqWbSize = NRIntWritePorts + NRFpWritePorts + exuParameters.StuCnt
217
218  val roq = Module(new Roq(roqWbSize))
219
220  val backendRedirect = redirectGen.io.stage2Redirect
221  val frontendRedirect = redirectGen.io.stage3Redirect
222  val flush = roq.io.flushOut.valid
223  val flushReg = RegNext(flush)
224
225  redirectGen.io.exuMispredict.zip(io.fromIntBlock.exuRedirect).map({case (x, y) =>
226    x.valid := y.valid && y.bits.redirect.cfiUpdate.isMisPred
227    x.bits := y.bits
228  })
229  redirectGen.io.loadRelay := io.fromLsBlock.replay
230  redirectGen.io.flush := flushReg
231
232  ftq.io.enq <> io.frontend.fetchInfo
233  for(i <- 0 until CommitWidth){
234    ftq.io.roq_commits(i).valid := roq.io.commits.valid(i) && !roq.io.commits.isWalk
235    ftq.io.roq_commits(i).bits := roq.io.commits.info(i)
236  }
237  ftq.io.redirect <> backendRedirect
238  ftq.io.flush := flushReg
239  ftq.io.flushIdx := RegNext(roq.io.flushOut.bits.ftqIdx)
240  ftq.io.flushOffset := RegNext(roq.io.flushOut.bits.ftqOffset)
241  ftq.io.frontendRedirect <> frontendRedirect
242  ftq.io.exuWriteback <> io.fromIntBlock.exuRedirect
243
244  ftq.io.ftqRead(1) <> redirectGen.io.stage2FtqRead
245  ftq.io.ftqRead(2).ptr := roq.io.flushOut.bits.ftqIdx
246  val flushPC = GetPcByFtq(
247    ftq.io.ftqRead(2).entry.ftqPC,
248    RegEnable(roq.io.flushOut.bits.ftqOffset, roq.io.flushOut.valid),
249    ftq.io.ftqRead(2).entry.lastPacketPC.valid,
250    ftq.io.ftqRead(2).entry.lastPacketPC.bits
251  )
252
253  val flushRedirect = Wire(Valid(new Redirect))
254  flushRedirect.valid := flushReg
255  flushRedirect.bits := DontCare
256  flushRedirect.bits.ftqIdx := RegEnable(roq.io.flushOut.bits.ftqIdx, flush)
257  flushRedirect.bits.interrupt := true.B
258  flushRedirect.bits.cfiUpdate.target := Mux(io.roqio.toCSR.isXRet || roq.io.exception.valid,
259    io.roqio.toCSR.trapTarget,
260    flushPC + 4.U // flush pipe
261  )
262
263  io.frontend.redirect_cfiUpdate := Mux(flushRedirect.valid, flushRedirect, frontendRedirect)
264  io.frontend.commit_cfiUpdate := ftq.io.commit_ftqEntry
265  io.frontend.ftqEnqPtr := ftq.io.enqPtr
266  io.frontend.ftqLeftOne := ftq.io.leftOne
267
268  decode.io.in <> io.frontend.cfVec
269
270  val jumpInst = dispatch.io.enqIQCtrl(0).bits
271  val ftqOffsetReg = Reg(UInt(log2Up(PredictWidth).W))
272  ftqOffsetReg := jumpInst.cf.ftqOffset
273  ftq.io.ftqRead(0).ptr := jumpInst.cf.ftqPtr // jump
274  io.toIntBlock.jumpPc := GetPcByFtq(
275    ftq.io.ftqRead(0).entry.ftqPC, ftqOffsetReg,
276    ftq.io.ftqRead(0).entry.lastPacketPC.valid,
277    ftq.io.ftqRead(0).entry.lastPacketPC.bits
278  )
279  io.toIntBlock.jalr_target := ftq.io.ftqRead(0).entry.target
280
281  // pipeline between decode and dispatch
282  for (i <- 0 until RenameWidth) {
283    PipelineConnect(decode.io.out(i), rename.io.in(i), rename.io.in(i).ready,
284      io.frontend.redirect_cfiUpdate.valid)
285  }
286
287  rename.io.redirect <> backendRedirect
288  rename.io.flush := flushReg
289  rename.io.roqCommits <> roq.io.commits
290  rename.io.out <> dispatch.io.fromRename
291  rename.io.renameBypass <> dispatch.io.renameBypass
292
293  dispatch.io.redirect <> backendRedirect
294  dispatch.io.flush := flushReg
295  dispatch.io.enqRoq <> roq.io.enq
296  dispatch.io.enqLsq <> io.toLsBlock.enqLsq
297  dispatch.io.readIntRf <> io.toIntBlock.readRf
298  dispatch.io.readFpRf <> io.toFpBlock.readRf
299  dispatch.io.allocPregs.zipWithIndex.foreach { case (preg, i) =>
300    intBusyTable.io.allocPregs(i).valid := preg.isInt
301    fpBusyTable.io.allocPregs(i).valid := preg.isFp
302    intBusyTable.io.allocPregs(i).bits := preg.preg
303    fpBusyTable.io.allocPregs(i).bits := preg.preg
304  }
305  dispatch.io.numExist <> io.fromIntBlock.numExist ++ io.fromFpBlock.numExist ++ io.fromLsBlock.numExist
306  dispatch.io.enqIQCtrl <> io.toIntBlock.enqIqCtrl ++ io.toFpBlock.enqIqCtrl ++ io.toLsBlock.enqIqCtrl
307//  dispatch.io.enqIQData <> io.toIntBlock.enqIqData ++ io.toFpBlock.enqIqData ++ io.toLsBlock.enqIqData
308
309
310  fpBusyTable.io.flush := flushReg
311  intBusyTable.io.flush := flushReg
312  for((wb, setPhyRegRdy) <- io.fromIntBlock.wbRegs.zip(intBusyTable.io.wbPregs)){
313    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.rfWen
314    setPhyRegRdy.bits := wb.bits.uop.pdest
315  }
316  for((wb, setPhyRegRdy) <- io.fromFpBlock.wbRegs.zip(fpBusyTable.io.wbPregs)){
317    setPhyRegRdy.valid := wb.valid && wb.bits.uop.ctrl.fpWen
318    setPhyRegRdy.bits := wb.bits.uop.pdest
319  }
320  intBusyTable.io.read <> dispatch.io.readIntState
321  fpBusyTable.io.read <> dispatch.io.readFpState
322
323  roq.io.redirect <> backendRedirect
324  roq.io.exeWbResults.zip(
325    io.fromIntBlock.wbRegs ++ io.fromFpBlock.wbRegs ++ io.fromLsBlock.stOut
326  ).foreach{
327    case(x, y) =>
328      x.bits := y.bits
329      x.valid := y.valid
330  }
331
332  // TODO: is 'backendRedirect' necesscary?
333  io.toIntBlock.redirect <> backendRedirect
334  io.toIntBlock.flush <> flushReg
335  io.toFpBlock.redirect <> backendRedirect
336  io.toFpBlock.flush <> flushReg
337  io.toLsBlock.redirect <> backendRedirect
338  io.toLsBlock.flush <> flushReg
339
340  if (env.DualCoreDifftest) {
341    difftestIO.fromRoq <> roq.difftestIO
342    trapIO <> roq.trapIO
343  }
344
345  dispatch.io.readPortIndex.intIndex <> io.toIntBlock.readPortIndex
346  dispatch.io.readPortIndex.fpIndex <> io.toFpBlock.readPortIndex
347
348  // roq to int block
349  io.roqio.toCSR <> roq.io.csr
350  io.roqio.exception := roq.io.exception
351  io.roqio.exception.bits.uop.cf.pc := flushPC
352  // roq to mem block
353  io.roqio.lsq <> roq.io.lsq
354}
355