xref: /XiangShan/src/main/scala/xiangshan/mem/lsqueue/LoadQueueUncache.scala (revision a035c20d751f9db7891973ed1a6f0184093e7b6e)
1e9e6cd09SYanqin Li/***************************************************************************************
2e9e6cd09SYanqin Li * Copyright (c) 2024 Beijing Institute of Open Source Chip (BOSC)
3e9e6cd09SYanqin Li * Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences
4e9e6cd09SYanqin Li * Copyright (c) 2020-2021 Peng Cheng Laboratory
5e9e6cd09SYanqin Li *
6e9e6cd09SYanqin Li * XiangShan is licensed under Mulan PSL v2.
7e9e6cd09SYanqin Li * You can use this software according to the terms and conditions of the Mulan PSL v2.
8e9e6cd09SYanqin Li * You may obtain a copy of Mulan PSL v2 at:
9e9e6cd09SYanqin Li *          http://license.coscl.org.cn/MulanPSL2
10e9e6cd09SYanqin Li *
11e9e6cd09SYanqin Li * THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
12e9e6cd09SYanqin Li * EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
13e9e6cd09SYanqin Li * MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
14e9e6cd09SYanqin Li *
15e9e6cd09SYanqin Li * See the Mulan PSL v2 for more details.
16e9e6cd09SYanqin Li ***************************************************************************************/
17e9e6cd09SYanqin Lipackage xiangshan.mem
18e9e6cd09SYanqin Li
19e9e6cd09SYanqin Liimport chisel3._
20e9e6cd09SYanqin Liimport chisel3.util._
21e9e6cd09SYanqin Liimport org.chipsalliance.cde.config._
22e9e6cd09SYanqin Liimport xiangshan._
23e9e6cd09SYanqin Liimport xiangshan.backend.rob.{RobPtr, RobLsqIO}
24e9e6cd09SYanqin Liimport xiangshan.ExceptionNO._
25e9e6cd09SYanqin Liimport xiangshan.cache._
26e9e6cd09SYanqin Liimport utils._
27e9e6cd09SYanqin Liimport utility._
28e9e6cd09SYanqin Liimport xiangshan.backend.Bundles
29e9e6cd09SYanqin Liimport xiangshan.backend.Bundles.{DynInst, MemExuOutput}
30e9e6cd09SYanqin Liimport xiangshan.backend.fu.FuConfig.LduCfg
31e10e20c6SYanqin Liimport xiangshan.backend.HasMemBlockParameters
32e9e6cd09SYanqin Li
33e9e6cd09SYanqin Liclass UncacheEntry(entryIndex: Int)(implicit p: Parameters) extends XSModule
34e9e6cd09SYanqin Li  with HasCircularQueuePtrHelper
35e9e6cd09SYanqin Li  with HasLoadHelper
36e9e6cd09SYanqin Li{
37e9e6cd09SYanqin Li  val io = IO(new Bundle() {
38e9e6cd09SYanqin Li    /* control */
39e9e6cd09SYanqin Li    val redirect = Flipped(Valid(new Redirect))
40e9e6cd09SYanqin Li    // redirect flush
41e9e6cd09SYanqin Li    val flush = Output(Bool())
42e9e6cd09SYanqin Li    // mmio commit
43e9e6cd09SYanqin Li    val rob = Flipped(new RobLsqIO)
44e9e6cd09SYanqin Li    // mmio select
45e9e6cd09SYanqin Li    val mmioSelect = Output(Bool())
46e9e6cd09SYanqin Li
47e9e6cd09SYanqin Li    /* transaction */
48e9e6cd09SYanqin Li    // from ldu
49e9e6cd09SYanqin Li    val req = Flipped(Valid(new LqWriteBundle))
50e9e6cd09SYanqin Li    // to ldu: mmio, data
51e9e6cd09SYanqin Li    val mmioOut = DecoupledIO(new MemExuOutput)
52e9e6cd09SYanqin Li    val mmioRawData = Output(new LoadDataFromLQBundle)
53e9e6cd09SYanqin Li    // to ldu: nc with data
54e9e6cd09SYanqin Li    val ncOut = DecoupledIO(new LsPipelineBundle)
55e9e6cd09SYanqin Li    // <=> uncache
56e9e6cd09SYanqin Li    val uncache = new UncacheWordIO
57e9e6cd09SYanqin Li    // exception generated by outer bus
58e9e6cd09SYanqin Li    val exception = Valid(new LqWriteBundle)
59e9e6cd09SYanqin Li  })
60e9e6cd09SYanqin Li
61e9e6cd09SYanqin Li  val req_valid = RegInit(false.B)
62e9e6cd09SYanqin Li  val isNC = RegInit(false.B)
63e9e6cd09SYanqin Li  val req = Reg(new LqWriteBundle)
64e9e6cd09SYanqin Li
65e9e6cd09SYanqin Li  val s_idle :: s_req :: s_resp :: s_wait :: Nil = Enum(4)
66e9e6cd09SYanqin Li  val uncacheState = RegInit(s_idle)
67e9e6cd09SYanqin Li  val uncacheData = Reg(io.uncache.resp.bits.data.cloneType)
68e9e6cd09SYanqin Li  val nderr = RegInit(false.B)
69e9e6cd09SYanqin Li
70e9e6cd09SYanqin Li  val writeback = Mux(req.nc, io.ncOut.fire, io.mmioOut.fire)
71e9e6cd09SYanqin Li
72e9e6cd09SYanqin Li  /**
73e9e6cd09SYanqin Li    * Flush
74e9e6cd09SYanqin Li    *
75e9e6cd09SYanqin Li    * 1. direct flush during idle
76e9e6cd09SYanqin Li    * 2. otherwise delayed flush until receiving uncache resp
77e9e6cd09SYanqin Li    */
78e9e6cd09SYanqin Li  val needFlushReg = RegInit(false.B)
79e9e6cd09SYanqin Li  val needFlush = req_valid && req.uop.robIdx.needFlush(io.redirect)
80e9e6cd09SYanqin Li  val flush = (needFlush && uncacheState===s_idle) || (io.uncache.resp.fire && needFlushReg)
81e9e6cd09SYanqin Li  when(flush){
82e9e6cd09SYanqin Li    needFlushReg := false.B
83e9e6cd09SYanqin Li  }.elsewhen(needFlush){
84e9e6cd09SYanqin Li    needFlushReg := true.B
85e9e6cd09SYanqin Li  }
86e9e6cd09SYanqin Li
87e9e6cd09SYanqin Li  /* enter req */
88e9e6cd09SYanqin Li  when (flush) {
89e9e6cd09SYanqin Li    req_valid := false.B
90e9e6cd09SYanqin Li  } .elsewhen (io.req.valid) {
91e9e6cd09SYanqin Li    req_valid := true.B
92e9e6cd09SYanqin Li    req := io.req.bits
93e9e6cd09SYanqin Li    nderr := false.B
94e9e6cd09SYanqin Li  } .elsewhen (writeback) {
95e9e6cd09SYanqin Li    req_valid := false.B
96e9e6cd09SYanqin Li  }
978b33cd30Sklin02  XSError(!flush && io.req.valid && req_valid, p"LoadQueueUncache: You can not write an valid entry: $entryIndex")
98e9e6cd09SYanqin Li
99e9e6cd09SYanqin Li  /**
100e9e6cd09SYanqin Li    * Memory mapped IO / NC operations
101e9e6cd09SYanqin Li    *
102e9e6cd09SYanqin Li    * States:
103e9e6cd09SYanqin Li    * (1) s_idle: wait for mmio reaching ROB's head / nc req valid from loadunit
104e9e6cd09SYanqin Li    * (2) s_req: wait to be sent to uncache channel until req selected and uncache ready
105e9e6cd09SYanqin Li    * (3) s_resp: wait for response from uncache channel
106e9e6cd09SYanqin Li    * (4) s_wait: wait for loadunit to receive writeback req
107e9e6cd09SYanqin Li    */
108e9e6cd09SYanqin Li  val pendingld = GatedValidRegNext(io.rob.pendingMMIOld)
109e9e6cd09SYanqin Li  val pendingPtr = GatedRegNext(io.rob.pendingPtr)
110e9e6cd09SYanqin Li  val canSendReq = req_valid && !needFlush && Mux(
111e9e6cd09SYanqin Li    req.nc, true.B,
112e9e6cd09SYanqin Li    pendingld && req.uop.robIdx === pendingPtr
113e9e6cd09SYanqin Li  )
114e9e6cd09SYanqin Li  switch (uncacheState) {
115e9e6cd09SYanqin Li    is (s_idle) {
116e9e6cd09SYanqin Li      when (canSendReq) {
117e9e6cd09SYanqin Li        uncacheState := s_req
118e9e6cd09SYanqin Li      }
119e9e6cd09SYanqin Li    }
120e9e6cd09SYanqin Li    is (s_req) {
121e9e6cd09SYanqin Li      when (io.uncache.req.fire) {
122e9e6cd09SYanqin Li        uncacheState := s_resp
123e9e6cd09SYanqin Li      }
124e9e6cd09SYanqin Li    }
125e9e6cd09SYanqin Li    is (s_resp) {
126e9e6cd09SYanqin Li      when (io.uncache.resp.fire) {
127e9e6cd09SYanqin Li        when (needFlushReg) {
128e9e6cd09SYanqin Li          uncacheState := s_idle
129e9e6cd09SYanqin Li        }.otherwise{
130e9e6cd09SYanqin Li          uncacheState := s_wait
131e9e6cd09SYanqin Li        }
132e9e6cd09SYanqin Li      }
133e9e6cd09SYanqin Li    }
134e9e6cd09SYanqin Li    is (s_wait) {
135e9e6cd09SYanqin Li      when (writeback) {
136e9e6cd09SYanqin Li        uncacheState := s_idle
137e9e6cd09SYanqin Li      }
138e9e6cd09SYanqin Li    }
139e9e6cd09SYanqin Li  }
140e9e6cd09SYanqin Li
141e9e6cd09SYanqin Li  /* control */
142e9e6cd09SYanqin Li  io.flush := flush
143e9e6cd09SYanqin Li  io.rob.mmio := DontCare
144e9e6cd09SYanqin Li  io.rob.uop := DontCare
145e9e6cd09SYanqin Li  io.mmioSelect := (uncacheState =/= s_idle) && req.mmio
146e9e6cd09SYanqin Li
147e9e6cd09SYanqin Li  /* uncahce req */
148e9e6cd09SYanqin Li  io.uncache.req.valid     := uncacheState === s_req
149e9e6cd09SYanqin Li  io.uncache.req.bits      := DontCare
150e9e6cd09SYanqin Li  io.uncache.req.bits.cmd  := MemoryOpConstants.M_XRD
151e9e6cd09SYanqin Li  io.uncache.req.bits.data := DontCare
152e9e6cd09SYanqin Li  io.uncache.req.bits.addr := req.paddr
153e9e6cd09SYanqin Li  io.uncache.req.bits.vaddr:= req.vaddr
154e9e6cd09SYanqin Li  io.uncache.req.bits.mask := Mux(req.paddr(3), req.mask(15, 8), req.mask(7, 0))
155e9e6cd09SYanqin Li  io.uncache.req.bits.id   := entryIndex.U
156e9e6cd09SYanqin Li  io.uncache.req.bits.instrtype := DontCare
157e9e6cd09SYanqin Li  io.uncache.req.bits.replayCarry := DontCare
158e9e6cd09SYanqin Li  io.uncache.req.bits.atomic := req.atomic
159e9e6cd09SYanqin Li  io.uncache.req.bits.nc := req.nc
160519244c7SYanqin Li  io.uncache.req.bits.memBackTypeMM := req.memBackTypeMM
161e9e6cd09SYanqin Li
162e9e6cd09SYanqin Li  io.uncache.resp.ready := true.B
163e9e6cd09SYanqin Li
164e9e6cd09SYanqin Li  /* uncahce resp */
165e9e6cd09SYanqin Li  when (io.uncache.resp.fire) {
166e9e6cd09SYanqin Li    uncacheData := io.uncache.resp.bits.data
167e9e6cd09SYanqin Li    nderr := io.uncache.resp.bits.nderr
168e9e6cd09SYanqin Li  }
169e9e6cd09SYanqin Li
170e9e6cd09SYanqin Li  /* uncahce writeback */
171e9e6cd09SYanqin Li  val selUop = req.uop
172e9e6cd09SYanqin Li  val func = selUop.fuOpType
173e9e6cd09SYanqin Li  val raddr = req.paddr
174e9e6cd09SYanqin Li  val rdataSel = LookupTree(raddr(2, 0), List(
175e9e6cd09SYanqin Li      "b000".U -> uncacheData(63,  0),
176e9e6cd09SYanqin Li      "b001".U -> uncacheData(63,  8),
177e9e6cd09SYanqin Li      "b010".U -> uncacheData(63, 16),
178e9e6cd09SYanqin Li      "b011".U -> uncacheData(63, 24),
179e9e6cd09SYanqin Li      "b100".U -> uncacheData(63, 32),
180e9e6cd09SYanqin Li      "b101".U -> uncacheData(63, 40),
181e9e6cd09SYanqin Li      "b110".U -> uncacheData(63, 48),
182e9e6cd09SYanqin Li      "b111".U -> uncacheData(63, 56)
183e9e6cd09SYanqin Li    ))
184e9e6cd09SYanqin Li  val rdataPartialLoad = rdataHelper(selUop, rdataSel)
185e9e6cd09SYanqin Li
186e9e6cd09SYanqin Li  io.mmioOut.valid := false.B
187e9e6cd09SYanqin Li  io.mmioOut.bits := DontCare
188e9e6cd09SYanqin Li  io.mmioRawData := DontCare
189e9e6cd09SYanqin Li  io.ncOut.valid := false.B
190e9e6cd09SYanqin Li  io.ncOut.bits := DontCare
191e9e6cd09SYanqin Li
192e9e6cd09SYanqin Li  when(req.nc){
193e9e6cd09SYanqin Li    io.ncOut.valid := (uncacheState === s_wait)
194e9e6cd09SYanqin Li    io.ncOut.bits := DontCare
195e9e6cd09SYanqin Li    io.ncOut.bits.uop := selUop
196e9e6cd09SYanqin Li    io.ncOut.bits.uop.lqIdx := req.uop.lqIdx
197e9e6cd09SYanqin Li    io.ncOut.bits.uop.exceptionVec(loadAccessFault) := nderr
198e9e6cd09SYanqin Li    io.ncOut.bits.data := rdataPartialLoad
199e9e6cd09SYanqin Li    io.ncOut.bits.paddr := req.paddr
200e9e6cd09SYanqin Li    io.ncOut.bits.vaddr := req.vaddr
201e9e6cd09SYanqin Li    io.ncOut.bits.nc := true.B
202e9e6cd09SYanqin Li    io.ncOut.bits.mask := Mux(req.paddr(3), req.mask(15, 8), req.mask(7, 0))
203e9e6cd09SYanqin Li    io.ncOut.bits.schedIndex := req.schedIndex
204e9e6cd09SYanqin Li    io.ncOut.bits.isvec := req.isvec
205e9e6cd09SYanqin Li    io.ncOut.bits.is128bit := req.is128bit
206e9e6cd09SYanqin Li    io.ncOut.bits.vecActive := req.vecActive
207e9e6cd09SYanqin Li  }.otherwise{
208e9e6cd09SYanqin Li    io.mmioOut.valid := (uncacheState === s_wait)
209e9e6cd09SYanqin Li    io.mmioOut.bits := DontCare
210e9e6cd09SYanqin Li    io.mmioOut.bits.uop := selUop
211e9e6cd09SYanqin Li    io.mmioOut.bits.uop.lqIdx := req.uop.lqIdx
212e9e6cd09SYanqin Li    io.mmioOut.bits.uop.exceptionVec(loadAccessFault) := nderr
213e9e6cd09SYanqin Li    io.mmioOut.bits.data := rdataPartialLoad
214e9e6cd09SYanqin Li    io.mmioOut.bits.debug.isMMIO := true.B
215e9e6cd09SYanqin Li    io.mmioOut.bits.debug.isNC := false.B
216e9e6cd09SYanqin Li    io.mmioOut.bits.debug.paddr := req.paddr
217e9e6cd09SYanqin Li    io.mmioOut.bits.debug.vaddr := req.vaddr
218e9e6cd09SYanqin Li    io.mmioRawData.lqData := uncacheData
219e9e6cd09SYanqin Li    io.mmioRawData.uop := req.uop
220e9e6cd09SYanqin Li    io.mmioRawData.addrOffset := req.paddr
221e9e6cd09SYanqin Li  }
222e9e6cd09SYanqin Li
223e9e6cd09SYanqin Li  io.exception.valid := writeback
224e9e6cd09SYanqin Li  io.exception.bits := req
225e9e6cd09SYanqin Li  io.exception.bits.uop.exceptionVec(loadAccessFault) := nderr
226e9e6cd09SYanqin Li
227e9e6cd09SYanqin Li  /* debug log */
2288b33cd30Sklin02  XSDebug(io.uncache.req.fire,
2298b33cd30Sklin02    "uncache req: pc %x addr %x data %x op %x mask %x\n",
230e9e6cd09SYanqin Li    req.uop.pc,
231e9e6cd09SYanqin Li    io.uncache.req.bits.addr,
232e9e6cd09SYanqin Li    io.uncache.req.bits.data,
233e9e6cd09SYanqin Li    io.uncache.req.bits.cmd,
234e9e6cd09SYanqin Li    io.uncache.req.bits.mask
235e9e6cd09SYanqin Li  )
2368b33cd30Sklin02  XSInfo(io.ncOut.fire,
2378b33cd30Sklin02    "int load miss write to cbd robidx %d lqidx %d pc 0x%x mmio %x\n",
238e9e6cd09SYanqin Li    io.ncOut.bits.uop.robIdx.asUInt,
239e9e6cd09SYanqin Li    io.ncOut.bits.uop.lqIdx.asUInt,
240e9e6cd09SYanqin Li    io.ncOut.bits.uop.pc,
241e9e6cd09SYanqin Li    true.B
242e9e6cd09SYanqin Li  )
2438b33cd30Sklin02  XSInfo(io.mmioOut.fire,
2448b33cd30Sklin02    "int load miss write to cbd robidx %d lqidx %d pc 0x%x mmio %x\n",
245e9e6cd09SYanqin Li    io.mmioOut.bits.uop.robIdx.asUInt,
246e9e6cd09SYanqin Li    io.mmioOut.bits.uop.lqIdx.asUInt,
247e9e6cd09SYanqin Li    io.mmioOut.bits.uop.pc,
248e9e6cd09SYanqin Li    true.B
249e9e6cd09SYanqin Li  )
250e9e6cd09SYanqin Li
251e9e6cd09SYanqin Li}
252e9e6cd09SYanqin Li
253e9e6cd09SYanqin Liclass LoadQueueUncache(implicit p: Parameters) extends XSModule
254e9e6cd09SYanqin Li  with HasCircularQueuePtrHelper
255e9e6cd09SYanqin Li  with HasMemBlockParameters
256e9e6cd09SYanqin Li{
257e9e6cd09SYanqin Li  val io = IO(new Bundle() {
258e9e6cd09SYanqin Li    /* control */
259e9e6cd09SYanqin Li    val redirect = Flipped(Valid(new Redirect))
260e9e6cd09SYanqin Li    // mmio commit
261e9e6cd09SYanqin Li    val rob = Flipped(new RobLsqIO)
262e9e6cd09SYanqin Li
263e9e6cd09SYanqin Li    /* transaction */
264e9e6cd09SYanqin Li    // enqueue: from ldu s3
265e9e6cd09SYanqin Li    val req = Vec(LoadPipelineWidth, Flipped(Decoupled(new LqWriteBundle)))
266e9e6cd09SYanqin Li    // writeback: mmio to ldu s0, s3
267e9e6cd09SYanqin Li    val mmioOut = Vec(LoadPipelineWidth, DecoupledIO(new MemExuOutput))
268e9e6cd09SYanqin Li    val mmioRawData = Vec(LoadPipelineWidth, Output(new LoadDataFromLQBundle))
269e9e6cd09SYanqin Li    // writeback: nc to ldu s0--s3
270e9e6cd09SYanqin Li    val ncOut = Vec(LoadPipelineWidth, Decoupled(new LsPipelineBundle))
271e9e6cd09SYanqin Li    // <=>uncache
272e9e6cd09SYanqin Li    val uncache = new UncacheWordIO
273e9e6cd09SYanqin Li
274e9e6cd09SYanqin Li    /* except */
275e9e6cd09SYanqin Li    // rollback from frontend when buffer is full
276e9e6cd09SYanqin Li    val rollback = Output(Valid(new Redirect))
277e9e6cd09SYanqin Li    // exception generated by outer bus
278e9e6cd09SYanqin Li    val exception = Valid(new LqWriteBundle)
279e9e6cd09SYanqin Li  })
280e9e6cd09SYanqin Li
281e9e6cd09SYanqin Li  /******************************************************************
282e9e6cd09SYanqin Li   * Structure
283e9e6cd09SYanqin Li   ******************************************************************/
284e9e6cd09SYanqin Li  val entries = Seq.tabulate(LoadUncacheBufferSize)(i => Module(new UncacheEntry(i)))
285e9e6cd09SYanqin Li
286e9e6cd09SYanqin Li  val freeList = Module(new FreeList(
287e9e6cd09SYanqin Li    size = LoadUncacheBufferSize,
288e9e6cd09SYanqin Li    allocWidth = LoadPipelineWidth,
289e9e6cd09SYanqin Li    freeWidth = 4,
290e9e6cd09SYanqin Li    enablePreAlloc = true,
291e9e6cd09SYanqin Li    moduleName = "LoadQueueUncache freelist"
292e9e6cd09SYanqin Li  ))
293e9e6cd09SYanqin Li  freeList.io := DontCare
294e9e6cd09SYanqin Li
295e9e6cd09SYanqin Li  // set default IO
296e9e6cd09SYanqin Li  entries.foreach {
297e9e6cd09SYanqin Li    case (e) =>
298e9e6cd09SYanqin Li      e.io.req.valid := false.B
299e9e6cd09SYanqin Li      e.io.req.bits := DontCare
300e9e6cd09SYanqin Li      e.io.uncache.req.ready := false.B
301e9e6cd09SYanqin Li      e.io.uncache.resp.valid := false.B
302e9e6cd09SYanqin Li      e.io.uncache.resp.bits := DontCare
303e9e6cd09SYanqin Li      e.io.ncOut.ready := false.B
304e9e6cd09SYanqin Li      e.io.mmioOut.ready := false.B
305e9e6cd09SYanqin Li  }
306e9e6cd09SYanqin Li  io.uncache.req.valid := false.B
307e9e6cd09SYanqin Li  io.uncache.req.bits := DontCare
308e9e6cd09SYanqin Li  io.uncache.resp.ready := false.B
309e9e6cd09SYanqin Li  for (w <- 0 until LoadPipelineWidth) {
310e9e6cd09SYanqin Li    io.mmioOut(w).valid := false.B
311e9e6cd09SYanqin Li    io.mmioOut(w).bits := DontCare
312e9e6cd09SYanqin Li    io.mmioRawData(w) := DontCare
313e9e6cd09SYanqin Li    io.ncOut(w).valid := false.B
314e9e6cd09SYanqin Li    io.ncOut(w).bits := DontCare
315e9e6cd09SYanqin Li  }
316e9e6cd09SYanqin Li
317e9e6cd09SYanqin Li
318e9e6cd09SYanqin Li  /******************************************************************
319e9e6cd09SYanqin Li   * Enqueue
320e9e6cd09SYanqin Li   *
321e9e6cd09SYanqin Li   * s1: hold
322e9e6cd09SYanqin Li   * s2: confirm enqueue and write entry
323e9e6cd09SYanqin Li   *    valid: no redirect, no exception, no replay, is mmio/nc
324e9e6cd09SYanqin Li   *    ready: freelist can allocate
325e9e6cd09SYanqin Li   ******************************************************************/
326e9e6cd09SYanqin Li
327*a035c20dSYanqin Li  val s1_sortedVec = HwSort(VecInit(io.req.map { case x => DataWithPtr(x.valid, x.bits, x.bits.uop.robIdx) }))
328*a035c20dSYanqin Li  val s1_req = VecInit(s1_sortedVec.map(_.bits))
329*a035c20dSYanqin Li  val s1_valid = VecInit(s1_sortedVec.map(_.valid))
330e9e6cd09SYanqin Li  val s2_enqueue = Wire(Vec(LoadPipelineWidth, Bool()))
331e9e6cd09SYanqin Li  io.req.zipWithIndex.foreach{ case (r, i) =>
332*a035c20dSYanqin Li    r.ready := true.B
333e9e6cd09SYanqin Li  }
334e9e6cd09SYanqin Li
335e9e6cd09SYanqin Li  // s2: enqueue
336e9e6cd09SYanqin Li  val s2_req = (0 until LoadPipelineWidth).map(i => {RegEnable(s1_req(i), s1_valid(i))})
337e9e6cd09SYanqin Li  val s2_valid = (0 until LoadPipelineWidth).map(i => {
338e9e6cd09SYanqin Li    RegNext(s1_valid(i)) &&
339e9e6cd09SYanqin Li    !s2_req(i).uop.robIdx.needFlush(RegNext(io.redirect)) &&
340e9e6cd09SYanqin Li    !s2_req(i).uop.robIdx.needFlush(io.redirect)
341e9e6cd09SYanqin Li  })
342e9e6cd09SYanqin Li  val s2_has_exception = s2_req.map(x => ExceptionNO.selectByFu(x.uop.exceptionVec, LduCfg).asUInt.orR)
343e9e6cd09SYanqin Li  val s2_need_replay = s2_req.map(_.rep_info.need_rep)
344e9e6cd09SYanqin Li
345e9e6cd09SYanqin Li  for (w <- 0 until LoadPipelineWidth) {
346e9e6cd09SYanqin Li    s2_enqueue(w) := s2_valid(w) && !s2_has_exception(w) && !s2_need_replay(w) && (s2_req(w).mmio || s2_req(w).nc)
347e9e6cd09SYanqin Li  }
348e9e6cd09SYanqin Li
349e9e6cd09SYanqin Li  val s2_enqValidVec = Wire(Vec(LoadPipelineWidth, Bool()))
350e9e6cd09SYanqin Li  val s2_enqIndexVec = Wire(Vec(LoadPipelineWidth, UInt()))
351e9e6cd09SYanqin Li
352e9e6cd09SYanqin Li  for (w <- 0 until LoadPipelineWidth) {
353e9e6cd09SYanqin Li    freeList.io.allocateReq(w) := true.B
354e9e6cd09SYanqin Li  }
355e9e6cd09SYanqin Li
356e9e6cd09SYanqin Li  // freeList real-allocate
357e9e6cd09SYanqin Li  for (w <- 0 until LoadPipelineWidth) {
358e9e6cd09SYanqin Li    freeList.io.doAllocate(w) := s2_enqValidVec(w)
359e9e6cd09SYanqin Li  }
360e9e6cd09SYanqin Li
361e9e6cd09SYanqin Li  for (w <- 0 until LoadPipelineWidth) {
362e9e6cd09SYanqin Li    val offset = PopCount(s2_enqueue.take(w))
36354b55f34SYanqin Li    s2_enqValidVec(w) := s2_enqueue(w) && freeList.io.canAllocate(offset)
364e9e6cd09SYanqin Li    s2_enqIndexVec(w) := freeList.io.allocateSlot(offset)
365e9e6cd09SYanqin Li  }
366e9e6cd09SYanqin Li
367e9e6cd09SYanqin Li
368e9e6cd09SYanqin Li  /******************************************************************
369e9e6cd09SYanqin Li   * Uncache Transaction
370e9e6cd09SYanqin Li   *
371e9e6cd09SYanqin Li   * 1. uncache req
372e9e6cd09SYanqin Li   * 2. uncache resp
373e9e6cd09SYanqin Li   * 3. writeback
374e9e6cd09SYanqin Li   ******************************************************************/
375e9e6cd09SYanqin Li  private val NC_WB_MOD = NCWBPorts.length
376e9e6cd09SYanqin Li
377e9e6cd09SYanqin Li  val uncacheReq = Wire(DecoupledIO(io.uncache.req.bits.cloneType))
378e9e6cd09SYanqin Li  val mmioSelect = entries.map(e => e.io.mmioSelect).reduce(_ || _)
379e9e6cd09SYanqin Li  val mmioReq = Wire(DecoupledIO(io.uncache.req.bits.cloneType))
380e9e6cd09SYanqin Li  // TODO lyq: It's best to choose in robIdx order / the order in which they enter
381e9e6cd09SYanqin Li  val ncReqArb = Module(new RRArbiterInit(io.uncache.req.bits.cloneType, LoadUncacheBufferSize))
382e9e6cd09SYanqin Li
383e9e6cd09SYanqin Li  val mmioOut = Wire(DecoupledIO(io.mmioOut(0).bits.cloneType))
384e9e6cd09SYanqin Li  val mmioRawData = Wire(io.mmioRawData(0).cloneType)
385e9e6cd09SYanqin Li  val ncOut = Wire(chiselTypeOf(io.ncOut))
386e9e6cd09SYanqin Li  val ncOutValidVec = VecInit(entries.map(e => e.io.ncOut.valid))
387e9e6cd09SYanqin Li  val ncOutValidVecRem = SubVec.getMaskRem(ncOutValidVec, NC_WB_MOD)
388e9e6cd09SYanqin Li
389e9e6cd09SYanqin Li  // init
390e9e6cd09SYanqin Li  uncacheReq.valid := false.B
391e9e6cd09SYanqin Li  uncacheReq.bits  := DontCare
392e9e6cd09SYanqin Li  mmioReq.valid := false.B
393e9e6cd09SYanqin Li  mmioReq.bits := DontCare
394e9e6cd09SYanqin Li  mmioOut.valid := false.B
395e9e6cd09SYanqin Li  mmioOut.bits := DontCare
396e9e6cd09SYanqin Li  mmioRawData := DontCare
397e9e6cd09SYanqin Li  for (i <- 0 until LoadUncacheBufferSize) {
398e9e6cd09SYanqin Li    ncReqArb.io.in(i).valid := false.B
399e9e6cd09SYanqin Li    ncReqArb.io.in(i).bits := DontCare
400e9e6cd09SYanqin Li  }
401e9e6cd09SYanqin Li  for (i <- 0 until LoadPipelineWidth) {
402e9e6cd09SYanqin Li    ncOut(i).valid := false.B
403e9e6cd09SYanqin Li    ncOut(i).bits := DontCare
404e9e6cd09SYanqin Li  }
405e9e6cd09SYanqin Li
406e9e6cd09SYanqin Li  entries.zipWithIndex.foreach {
407e9e6cd09SYanqin Li    case (e, i) =>
408e9e6cd09SYanqin Li      // enqueue
409e9e6cd09SYanqin Li      for (w <- 0 until LoadPipelineWidth) {
410e9e6cd09SYanqin Li        when (s2_enqValidVec(w) && (i.U === s2_enqIndexVec(w))) {
411e9e6cd09SYanqin Li          e.io.req.valid := true.B
412e9e6cd09SYanqin Li          e.io.req.bits := s2_req(w)
413e9e6cd09SYanqin Li        }
414e9e6cd09SYanqin Li      }
415e9e6cd09SYanqin Li
416e9e6cd09SYanqin Li      // control
417e9e6cd09SYanqin Li      e.io.redirect <> io.redirect
418e9e6cd09SYanqin Li      e.io.rob <> io.rob
419e9e6cd09SYanqin Li
420e9e6cd09SYanqin Li      // uncache req, writeback
421e9e6cd09SYanqin Li      when (e.io.mmioSelect) {
422e9e6cd09SYanqin Li        mmioReq.valid := e.io.uncache.req.valid
423e9e6cd09SYanqin Li        mmioReq.bits := e.io.uncache.req.bits
424e9e6cd09SYanqin Li        e.io.uncache.req.ready := mmioReq.ready
425e9e6cd09SYanqin Li
426e9e6cd09SYanqin Li        e.io.mmioOut.ready := mmioOut.ready
427e9e6cd09SYanqin Li        mmioOut.valid := e.io.mmioOut.valid
428e9e6cd09SYanqin Li        mmioOut.bits := e.io.mmioOut.bits
429e9e6cd09SYanqin Li        mmioRawData := e.io.mmioRawData
430e9e6cd09SYanqin Li
431e9e6cd09SYanqin Li      }.otherwise{
432e9e6cd09SYanqin Li        ncReqArb.io.in(i).valid := e.io.uncache.req.valid
433e9e6cd09SYanqin Li        ncReqArb.io.in(i).bits := e.io.uncache.req.bits
434e9e6cd09SYanqin Li        e.io.uncache.req.ready := ncReqArb.io.in(i).ready
435e9e6cd09SYanqin Li
436e9e6cd09SYanqin Li        (0 until NC_WB_MOD).map { w =>
437e9e6cd09SYanqin Li          val (idx, ncOutValid) = PriorityEncoderWithFlag(ncOutValidVecRem(w))
438e9e6cd09SYanqin Li          val port = NCWBPorts(w)
439e9e6cd09SYanqin Li          when((i.U === idx) && ncOutValid) {
440e9e6cd09SYanqin Li            ncOut(port).valid := ncOutValid
441e9e6cd09SYanqin Li            ncOut(port).bits := e.io.ncOut.bits
442e9e6cd09SYanqin Li            e.io.ncOut.ready := ncOut(port).ready
443e9e6cd09SYanqin Li          }
444e9e6cd09SYanqin Li        }
445e9e6cd09SYanqin Li
446e9e6cd09SYanqin Li      }
447e9e6cd09SYanqin Li
448e9e6cd09SYanqin Li      // uncache resp
449e9e6cd09SYanqin Li      when (i.U === io.uncache.resp.bits.id) {
450e9e6cd09SYanqin Li        e.io.uncache.resp <> io.uncache.resp
451e9e6cd09SYanqin Li      }
452e9e6cd09SYanqin Li
453e9e6cd09SYanqin Li  }
454e9e6cd09SYanqin Li
455e9e6cd09SYanqin Li  mmioReq.ready := false.B
456e9e6cd09SYanqin Li  ncReqArb.io.out.ready := false.B
457e9e6cd09SYanqin Li  when(mmioSelect){
458e9e6cd09SYanqin Li    uncacheReq <> mmioReq
459e9e6cd09SYanqin Li  }.otherwise{
460e9e6cd09SYanqin Li    uncacheReq <> ncReqArb.io.out
461e9e6cd09SYanqin Li  }
462e9e6cd09SYanqin Li
463e9e6cd09SYanqin Li  // uncache Request
464e9e6cd09SYanqin Li  AddPipelineReg(uncacheReq, io.uncache.req, false.B)
465e9e6cd09SYanqin Li
466e9e6cd09SYanqin Li  // uncache Writeback
467e9e6cd09SYanqin Li  AddPipelineReg(mmioOut, io.mmioOut(UncacheWBPort), false.B)
468e9e6cd09SYanqin Li  io.mmioRawData(UncacheWBPort) := RegEnable(mmioRawData, mmioOut.fire)
469e9e6cd09SYanqin Li
470e9e6cd09SYanqin Li  (0 until LoadPipelineWidth).foreach { i => AddPipelineReg(ncOut(i), io.ncOut(i), false.B) }
471e9e6cd09SYanqin Li
472e9e6cd09SYanqin Li  // uncache exception
473e9e6cd09SYanqin Li  io.exception.valid := Cat(entries.map(_.io.exception.valid)).orR
474e9e6cd09SYanqin Li  io.exception.bits := ParallelPriorityMux(entries.map(e =>
475e9e6cd09SYanqin Li    (e.io.exception.valid, e.io.exception.bits)
476e9e6cd09SYanqin Li  ))
477e9e6cd09SYanqin Li
478e9e6cd09SYanqin Li  // rob
479e9e6cd09SYanqin Li  for (i <- 0 until LoadPipelineWidth) {
480e9e6cd09SYanqin Li    io.rob.mmio(i) := RegNext(s1_valid(i) && s1_req(i).mmio)
481e9e6cd09SYanqin Li    io.rob.uop(i) := RegEnable(s1_req(i).uop, s1_valid(i))
482e9e6cd09SYanqin Li  }
483e9e6cd09SYanqin Li
484e9e6cd09SYanqin Li
485e9e6cd09SYanqin Li  /******************************************************************
486e9e6cd09SYanqin Li   * Deallocate
487e9e6cd09SYanqin Li   ******************************************************************/
488e9e6cd09SYanqin Li  // UncacheBuffer deallocate
489e9e6cd09SYanqin Li  val freeMaskVec = Wire(Vec(LoadUncacheBufferSize, Bool()))
490e9e6cd09SYanqin Li
491e9e6cd09SYanqin Li  // init
492e9e6cd09SYanqin Li  freeMaskVec.map(e => e := false.B)
493e9e6cd09SYanqin Li
494e9e6cd09SYanqin Li  // dealloc logic
495e9e6cd09SYanqin Li  entries.zipWithIndex.foreach {
496e9e6cd09SYanqin Li    case (e, i) =>
497e9e6cd09SYanqin Li      when ((e.io.mmioSelect && e.io.mmioOut.fire) || e.io.ncOut.fire || e.io.flush) {
498e9e6cd09SYanqin Li        freeMaskVec(i) := true.B
499e9e6cd09SYanqin Li      }
500e9e6cd09SYanqin Li  }
501e9e6cd09SYanqin Li
502e9e6cd09SYanqin Li  freeList.io.free := freeMaskVec.asUInt
503e9e6cd09SYanqin Li
504e9e6cd09SYanqin Li
505e9e6cd09SYanqin Li  /******************************************************************
506e9e6cd09SYanqin Li   * Uncache rollback detection
507e9e6cd09SYanqin Li   *
508e9e6cd09SYanqin Li   * When uncache loads enqueue, it searches uncache loads, They can not enqueue and need re-execution.
509e9e6cd09SYanqin Li   *
510e9e6cd09SYanqin Li   * Cycle 0: uncache enqueue.
511e9e6cd09SYanqin Li   * Cycle 1: Select oldest uncache loads.
512e9e6cd09SYanqin Li   * Cycle 2: Redirect Fire.
513e9e6cd09SYanqin Li   *   Choose the oldest load from LoadPipelineWidth oldest loads.
514e9e6cd09SYanqin Li   *   Prepare redirect request according to the detected rejection.
515e9e6cd09SYanqin Li   *   Fire redirect request (if valid)
516e9e6cd09SYanqin Li   *
517e9e6cd09SYanqin Li   *               Load_S3  .... Load_S3
518e9e6cd09SYanqin Li   * stage 0:        lq            lq
519e9e6cd09SYanqin Li   *                 |             | (can not enqueue)
520e9e6cd09SYanqin Li   * stage 1:        lq            lq
521e9e6cd09SYanqin Li   *                 |             |
522e9e6cd09SYanqin Li   *                 ---------------
523e9e6cd09SYanqin Li   *                        |
524e9e6cd09SYanqin Li   * stage 2:               lq
525e9e6cd09SYanqin Li   *                        |
526e9e6cd09SYanqin Li   *                     rollback req
527e9e6cd09SYanqin Li   *
528e9e6cd09SYanqin Li   ******************************************************************/
529e9e6cd09SYanqin Li  def selectOldestRedirect(xs: Seq[Valid[Redirect]]): Vec[Bool] = {
530e9e6cd09SYanqin Li    val compareVec = (0 until xs.length).map(i => (0 until i).map(j => isAfter(xs(j).bits.robIdx, xs(i).bits.robIdx)))
531e9e6cd09SYanqin Li    val resultOnehot = VecInit((0 until xs.length).map(i => Cat((0 until xs.length).map(j =>
532e9e6cd09SYanqin Li      (if (j < i) !xs(j).valid || compareVec(i)(j)
533e9e6cd09SYanqin Li      else if (j == i) xs(i).valid
534e9e6cd09SYanqin Li      else !xs(j).valid || !compareVec(j)(i))
535e9e6cd09SYanqin Li    )).andR))
536e9e6cd09SYanqin Li    resultOnehot
537e9e6cd09SYanqin Li  }
538e9e6cd09SYanqin Li  val reqNeedCheck = VecInit((0 until LoadPipelineWidth).map(w =>
539e9e6cd09SYanqin Li    s2_enqueue(w) && !s2_enqValidVec(w)
540e9e6cd09SYanqin Li  ))
541e9e6cd09SYanqin Li  val reqSelUops = VecInit(s2_req.map(_.uop))
542e9e6cd09SYanqin Li  val allRedirect = (0 until LoadPipelineWidth).map(i => {
543e9e6cd09SYanqin Li    val redirect = Wire(Valid(new Redirect))
544e9e6cd09SYanqin Li    redirect.valid := reqNeedCheck(i)
545e9e6cd09SYanqin Li    redirect.bits             := DontCare
546e9e6cd09SYanqin Li    redirect.bits.isRVC       := reqSelUops(i).preDecodeInfo.isRVC
547e9e6cd09SYanqin Li    redirect.bits.robIdx      := reqSelUops(i).robIdx
548e9e6cd09SYanqin Li    redirect.bits.ftqIdx      := reqSelUops(i).ftqPtr
549e9e6cd09SYanqin Li    redirect.bits.ftqOffset   := reqSelUops(i).ftqOffset
550e9e6cd09SYanqin Li    redirect.bits.level       := RedirectLevel.flush
551e9e6cd09SYanqin Li    redirect.bits.cfiUpdate.target := reqSelUops(i).pc // TODO: check if need pc
552e9e6cd09SYanqin Li    redirect.bits.debug_runahead_checkpoint_id := reqSelUops(i).debugInfo.runahead_checkpoint_id
553e9e6cd09SYanqin Li    redirect
554e9e6cd09SYanqin Li  })
555e9e6cd09SYanqin Li  val oldestOneHot = selectOldestRedirect(allRedirect)
556e9e6cd09SYanqin Li  val oldestRedirect = Mux1H(oldestOneHot, allRedirect)
557e9e6cd09SYanqin Li  val lastCycleRedirect = Wire(Valid(new Redirect))
558e9e6cd09SYanqin Li  lastCycleRedirect.valid := RegNext(io.redirect.valid)
559e9e6cd09SYanqin Li  lastCycleRedirect.bits := RegEnable(io.redirect.bits, io.redirect.valid)
560e9e6cd09SYanqin Li  val lastLastCycleRedirect = Wire(Valid(new Redirect))
561e9e6cd09SYanqin Li  lastLastCycleRedirect.valid := RegNext(lastCycleRedirect.valid)
562e9e6cd09SYanqin Li  lastLastCycleRedirect.bits := RegEnable(lastCycleRedirect.bits, lastCycleRedirect.valid)
563e9e6cd09SYanqin Li  io.rollback.valid := GatedValidRegNext(oldestRedirect.valid &&
564e9e6cd09SYanqin Li                      !oldestRedirect.bits.robIdx.needFlush(io.redirect) &&
565e9e6cd09SYanqin Li                      !oldestRedirect.bits.robIdx.needFlush(lastCycleRedirect) &&
566e9e6cd09SYanqin Li                      !oldestRedirect.bits.robIdx.needFlush(lastLastCycleRedirect))
567e9e6cd09SYanqin Li  io.rollback.bits := RegEnable(oldestRedirect.bits, oldestRedirect.valid)
568e9e6cd09SYanqin Li
569e9e6cd09SYanqin Li
570e9e6cd09SYanqin Li  /******************************************************************
571e9e6cd09SYanqin Li   * Perf Counter
572e9e6cd09SYanqin Li   ******************************************************************/
573e9e6cd09SYanqin Li  val validCount = freeList.io.validCount
574e9e6cd09SYanqin Li  val allowEnqueue = !freeList.io.empty
575e9e6cd09SYanqin Li  QueuePerf(LoadUncacheBufferSize, validCount, !allowEnqueue)
576e9e6cd09SYanqin Li
577e9e6cd09SYanqin Li  XSPerfAccumulate("mmio_uncache_req", io.uncache.req.fire && !io.uncache.req.bits.nc)
578e9e6cd09SYanqin Li  XSPerfAccumulate("mmio_writeback_success", io.mmioOut(0).fire)
579e9e6cd09SYanqin Li  XSPerfAccumulate("mmio_writeback_blocked", io.mmioOut(0).valid && !io.mmioOut(0).ready)
580e9e6cd09SYanqin Li  XSPerfAccumulate("nc_uncache_req", io.uncache.req.fire && io.uncache.req.bits.nc)
581e9e6cd09SYanqin Li  XSPerfAccumulate("nc_writeback_success", io.ncOut(0).fire)
582e9e6cd09SYanqin Li  XSPerfAccumulate("nc_writeback_blocked", io.ncOut(0).valid && !io.ncOut(0).ready)
583e9e6cd09SYanqin Li  XSPerfAccumulate("uncache_full_rollback", io.rollback.valid)
584e9e6cd09SYanqin Li
585e9e6cd09SYanqin Li  val perfEvents: Seq[(String, UInt)] = Seq(
586e9e6cd09SYanqin Li    ("mmio_uncache_req", io.uncache.req.fire && !io.uncache.req.bits.nc),
587e9e6cd09SYanqin Li    ("mmio_writeback_success", io.mmioOut(0).fire),
588e9e6cd09SYanqin Li    ("mmio_writeback_blocked", io.mmioOut(0).valid && !io.mmioOut(0).ready),
589e9e6cd09SYanqin Li    ("nc_uncache_req", io.uncache.req.fire && io.uncache.req.bits.nc),
590e9e6cd09SYanqin Li    ("nc_writeback_success", io.ncOut(0).fire),
591e9e6cd09SYanqin Li    ("nc_writeback_blocked", io.ncOut(0).valid && !io.ncOut(0).ready),
592e9e6cd09SYanqin Li    ("uncache_full_rollback", io.rollback.valid)
593e9e6cd09SYanqin Li  )
594e9e6cd09SYanqin Li  // end
595e9e6cd09SYanqin Li}
596