xref: /XiangShan/src/main/scala/xiangshan/mem/pipeline/AtomicsUnit.scala (revision f97664b365f9dd3442b0c0e094348b2cfdb405e8)
1024ee227SWilliam Wangpackage xiangshan.mem
2024ee227SWilliam Wang
3024ee227SWilliam Wangimport chisel3._
4024ee227SWilliam Wangimport chisel3.util._
5024ee227SWilliam Wangimport utils._
6024ee227SWilliam Wangimport xiangshan._
7024ee227SWilliam Wangimport xiangshan.cache.{DCacheWordIO, TlbRequestIO, TlbCmd, MemoryOpConstants}
8024ee227SWilliam Wangimport xiangshan.backend.LSUOpType
9024ee227SWilliam Wang
10024ee227SWilliam Wangclass AtomicsUnit extends XSModule with MemoryOpConstants{
11024ee227SWilliam Wang  val io = IO(new Bundle() {
12024ee227SWilliam Wang    val in            = Flipped(Decoupled(new ExuInput))
13024ee227SWilliam Wang    val out           = Decoupled(new ExuOutput)
14024ee227SWilliam Wang    val dcache        = new DCacheWordIO
15024ee227SWilliam Wang    val dtlb          = new TlbRequestIO
16024ee227SWilliam Wang    val flush_sbuffer = new SbufferFlushBundle
17024ee227SWilliam Wang    val tlbFeedback   = ValidIO(new TlbFeedback)
18024ee227SWilliam Wang    val redirect      = Flipped(ValidIO(new Redirect))
1911131ea4SYinan Xu    val exceptionAddr = ValidIO(UInt(VAddrBits.W))
20024ee227SWilliam Wang  })
21024ee227SWilliam Wang
228a5bdd64Swangkaifan  val difftestIO = IO(new Bundle() {
238a5bdd64Swangkaifan    val atomicResp = Output(Bool())
248a5bdd64Swangkaifan    val atomicAddr = Output(UInt(64.W))
258a5bdd64Swangkaifan    val atomicData = Output(UInt(64.W))
268a5bdd64Swangkaifan    val atomicMask = Output(UInt(8.W))
27*f97664b3Swangkaifan    val atomicFuop = Output(UInt(8.W))
28*f97664b3Swangkaifan    val atomicOut  = Output(UInt(64.W))
298a5bdd64Swangkaifan  })
308a5bdd64Swangkaifan  difftestIO <> DontCare
318a5bdd64Swangkaifan
32024ee227SWilliam Wang  //-------------------------------------------------------
33024ee227SWilliam Wang  // Atomics Memory Accsess FSM
34024ee227SWilliam Wang  //-------------------------------------------------------
35024ee227SWilliam Wang  val s_invalid :: s_tlb  :: s_flush_sbuffer_req :: s_flush_sbuffer_resp :: s_cache_req :: s_cache_resp :: s_finish :: Nil = Enum(7)
36024ee227SWilliam Wang  val state = RegInit(s_invalid)
37024ee227SWilliam Wang  val in = Reg(new ExuInput())
380d045bd0SYinan Xu  val exceptionVec = RegInit(0.U.asTypeOf(ExceptionVec()))
39024ee227SWilliam Wang  val atom_override_xtval = RegInit(false.B)
40024ee227SWilliam Wang  // paddr after translation
41024ee227SWilliam Wang  val paddr = Reg(UInt())
42cff68e26SWilliam Wang  val is_mmio = Reg(Bool())
43024ee227SWilliam Wang  // dcache response data
44024ee227SWilliam Wang  val resp_data = Reg(UInt())
45*f97664b3Swangkaifan  val resp_data_wire = WireInit(0.U)
46024ee227SWilliam Wang  val is_lrsc_valid = Reg(Bool())
47024ee227SWilliam Wang
488a5bdd64Swangkaifan  // Difftest signals
498a5bdd64Swangkaifan  val paddr_reg = Reg(UInt(64.W))
508a5bdd64Swangkaifan  val data_reg = Reg(UInt(64.W))
518a5bdd64Swangkaifan  val mask_reg = Reg(UInt(8.W))
52*f97664b3Swangkaifan  val fuop_reg = Reg(UInt(8.W))
538a5bdd64Swangkaifan
5411131ea4SYinan Xu  io.exceptionAddr.valid := atom_override_xtval
5511131ea4SYinan Xu  io.exceptionAddr.bits  := in.src1
56024ee227SWilliam Wang
57024ee227SWilliam Wang  // assign default value to output signals
58024ee227SWilliam Wang  io.in.ready          := false.B
59024ee227SWilliam Wang  io.out.valid         := false.B
60024ee227SWilliam Wang  io.out.bits          := DontCare
61024ee227SWilliam Wang
62024ee227SWilliam Wang  io.dcache.req.valid  := false.B
63024ee227SWilliam Wang  io.dcache.req.bits   := DontCare
64024ee227SWilliam Wang  io.dcache.resp.ready := false.B
65024ee227SWilliam Wang
66024ee227SWilliam Wang  io.dtlb.req.valid    := false.B
67024ee227SWilliam Wang  io.dtlb.req.bits     := DontCare
680cab60cbSZhangZifei  io.dtlb.resp.ready   := false.B
69024ee227SWilliam Wang
70024ee227SWilliam Wang  io.flush_sbuffer.valid := false.B
71024ee227SWilliam Wang
72024ee227SWilliam Wang  XSDebug("state: %d\n", state)
73024ee227SWilliam Wang
74024ee227SWilliam Wang  when (state === s_invalid) {
75024ee227SWilliam Wang    io.in.ready := true.B
76024ee227SWilliam Wang    when (io.in.fire()) {
77024ee227SWilliam Wang      in := io.in.bits
78024ee227SWilliam Wang      state := s_tlb
79024ee227SWilliam Wang    }
80024ee227SWilliam Wang  }
81024ee227SWilliam Wang
82024ee227SWilliam Wang  // Send TLB feedback to store issue queue
83024ee227SWilliam Wang  // we send feedback right after we receives request
84024ee227SWilliam Wang  // also, we always treat amo as tlb hit
85024ee227SWilliam Wang  // since we will continue polling tlb all by ourself
86665ccb1fSYinan Xu  io.tlbFeedback.valid       := RegNext(RegNext(io.in.valid))
87024ee227SWilliam Wang  io.tlbFeedback.bits.hit    := true.B
88024ee227SWilliam Wang  io.tlbFeedback.bits.roqIdx := in.uop.roqIdx
89024ee227SWilliam Wang
90024ee227SWilliam Wang  // tlb translation, manipulating signals && deal with exception
91024ee227SWilliam Wang  when (state === s_tlb) {
92024ee227SWilliam Wang    // send req to dtlb
93024ee227SWilliam Wang    // keep firing until tlb hit
94024ee227SWilliam Wang    io.dtlb.req.valid       := true.B
95024ee227SWilliam Wang    io.dtlb.req.bits.vaddr  := in.src1
96024ee227SWilliam Wang    io.dtlb.req.bits.roqIdx := in.uop.roqIdx
97cd3bc62aSZhangZifei    io.dtlb.resp.ready      := true.B
98024ee227SWilliam Wang    val is_lr = in.uop.ctrl.fuOpType === LSUOpType.lr_w || in.uop.ctrl.fuOpType === LSUOpType.lr_d
99cff68e26SWilliam Wang    io.dtlb.req.bits.cmd    := Mux(is_lr, TlbCmd.atom_read, TlbCmd.atom_write)
100024ee227SWilliam Wang    io.dtlb.req.bits.debug.pc := in.uop.cf.pc
101024ee227SWilliam Wang
1020cab60cbSZhangZifei    when(io.dtlb.resp.fire && !io.dtlb.resp.bits.miss){
103024ee227SWilliam Wang      // exception handling
104024ee227SWilliam Wang      val addrAligned = LookupTree(in.uop.ctrl.fuOpType(1,0), List(
105024ee227SWilliam Wang        "b00".U   -> true.B,              //b
106024ee227SWilliam Wang        "b01".U   -> (in.src1(0) === 0.U),   //h
107024ee227SWilliam Wang        "b10".U   -> (in.src1(1,0) === 0.U), //w
108024ee227SWilliam Wang        "b11".U   -> (in.src1(2,0) === 0.U)  //d
109024ee227SWilliam Wang      ))
1100d045bd0SYinan Xu      exceptionVec(storeAddrMisaligned) := !addrAligned
1110d045bd0SYinan Xu      exceptionVec(storePageFault)      := io.dtlb.resp.bits.excp.pf.st
1120d045bd0SYinan Xu      exceptionVec(loadPageFault)       := io.dtlb.resp.bits.excp.pf.ld
113a8e04b1dSYinan Xu      exceptionVec(storeAccessFault)    := io.dtlb.resp.bits.excp.af.st
114a8e04b1dSYinan Xu      exceptionVec(loadAccessFault)     := io.dtlb.resp.bits.excp.af.ld
115cff68e26SWilliam Wang      val exception = !addrAligned ||
116cff68e26SWilliam Wang        io.dtlb.resp.bits.excp.pf.st ||
117cff68e26SWilliam Wang        io.dtlb.resp.bits.excp.pf.ld ||
118cff68e26SWilliam Wang        io.dtlb.resp.bits.excp.af.st ||
119cff68e26SWilliam Wang        io.dtlb.resp.bits.excp.af.ld
120cff68e26SWilliam Wang      is_mmio := io.dtlb.resp.bits.mmio
121024ee227SWilliam Wang      when (exception) {
122024ee227SWilliam Wang        // check for exceptions
123024ee227SWilliam Wang        // if there are exceptions, no need to execute it
124024ee227SWilliam Wang        state := s_finish
125024ee227SWilliam Wang        atom_override_xtval := true.B
126024ee227SWilliam Wang      } .otherwise {
127024ee227SWilliam Wang        paddr := io.dtlb.resp.bits.paddr
128024ee227SWilliam Wang        state := s_flush_sbuffer_req
129024ee227SWilliam Wang      }
130024ee227SWilliam Wang    }
131024ee227SWilliam Wang  }
132024ee227SWilliam Wang
133024ee227SWilliam Wang
134024ee227SWilliam Wang  when (state === s_flush_sbuffer_req) {
135024ee227SWilliam Wang    io.flush_sbuffer.valid := true.B
136024ee227SWilliam Wang    state := s_flush_sbuffer_resp
137024ee227SWilliam Wang  }
138024ee227SWilliam Wang
139024ee227SWilliam Wang  when (state === s_flush_sbuffer_resp) {
140024ee227SWilliam Wang    when (io.flush_sbuffer.empty) {
141024ee227SWilliam Wang      state := s_cache_req
142024ee227SWilliam Wang    }
143024ee227SWilliam Wang  }
144024ee227SWilliam Wang
145024ee227SWilliam Wang  when (state === s_cache_req) {
146024ee227SWilliam Wang    io.dcache.req.valid := true.B
147024ee227SWilliam Wang    io.dcache.req.bits.cmd := LookupTree(in.uop.ctrl.fuOpType, List(
148024ee227SWilliam Wang      LSUOpType.lr_w      -> M_XLR,
149024ee227SWilliam Wang      LSUOpType.sc_w      -> M_XSC,
150024ee227SWilliam Wang      LSUOpType.amoswap_w -> M_XA_SWAP,
151024ee227SWilliam Wang      LSUOpType.amoadd_w  -> M_XA_ADD,
152024ee227SWilliam Wang      LSUOpType.amoxor_w  -> M_XA_XOR,
153024ee227SWilliam Wang      LSUOpType.amoand_w  -> M_XA_AND,
154024ee227SWilliam Wang      LSUOpType.amoor_w   -> M_XA_OR,
155024ee227SWilliam Wang      LSUOpType.amomin_w  -> M_XA_MIN,
156024ee227SWilliam Wang      LSUOpType.amomax_w  -> M_XA_MAX,
157024ee227SWilliam Wang      LSUOpType.amominu_w -> M_XA_MINU,
158024ee227SWilliam Wang      LSUOpType.amomaxu_w -> M_XA_MAXU,
159024ee227SWilliam Wang
160024ee227SWilliam Wang      LSUOpType.lr_d      -> M_XLR,
161024ee227SWilliam Wang      LSUOpType.sc_d      -> M_XSC,
162024ee227SWilliam Wang      LSUOpType.amoswap_d -> M_XA_SWAP,
163024ee227SWilliam Wang      LSUOpType.amoadd_d  -> M_XA_ADD,
164024ee227SWilliam Wang      LSUOpType.amoxor_d  -> M_XA_XOR,
165024ee227SWilliam Wang      LSUOpType.amoand_d  -> M_XA_AND,
166024ee227SWilliam Wang      LSUOpType.amoor_d   -> M_XA_OR,
167024ee227SWilliam Wang      LSUOpType.amomin_d  -> M_XA_MIN,
168024ee227SWilliam Wang      LSUOpType.amomax_d  -> M_XA_MAX,
169024ee227SWilliam Wang      LSUOpType.amominu_d -> M_XA_MINU,
170024ee227SWilliam Wang      LSUOpType.amomaxu_d -> M_XA_MAXU
171024ee227SWilliam Wang    ))
172024ee227SWilliam Wang
173024ee227SWilliam Wang    io.dcache.req.bits.addr := paddr
174024ee227SWilliam Wang    io.dcache.req.bits.data := genWdata(in.src2, in.uop.ctrl.fuOpType(1,0))
175024ee227SWilliam Wang    // TODO: atomics do need mask: fix mask
176024ee227SWilliam Wang    io.dcache.req.bits.mask := genWmask(paddr, in.uop.ctrl.fuOpType(1,0))
177024ee227SWilliam Wang    io.dcache.req.bits.meta.id       := DontCare
178024ee227SWilliam Wang    io.dcache.req.bits.meta.paddr    := paddr
179024ee227SWilliam Wang    io.dcache.req.bits.meta.tlb_miss := false.B
180024ee227SWilliam Wang    io.dcache.req.bits.meta.replay   := false.B
181024ee227SWilliam Wang
182024ee227SWilliam Wang    when(io.dcache.req.fire()){
183024ee227SWilliam Wang      state := s_cache_resp
1848a5bdd64Swangkaifan      paddr_reg := io.dcache.req.bits.addr
1858a5bdd64Swangkaifan      data_reg := io.dcache.req.bits.data
1868a5bdd64Swangkaifan      mask_reg := io.dcache.req.bits.mask
187*f97664b3Swangkaifan      fuop_reg := in.uop.ctrl.fuOpType
188024ee227SWilliam Wang    }
189024ee227SWilliam Wang  }
190024ee227SWilliam Wang
191024ee227SWilliam Wang  when (state === s_cache_resp) {
192024ee227SWilliam Wang    io.dcache.resp.ready := true.B
193024ee227SWilliam Wang    when(io.dcache.resp.fire()) {
194024ee227SWilliam Wang      is_lrsc_valid := io.dcache.resp.bits.meta.id
195024ee227SWilliam Wang      val rdata = io.dcache.resp.bits.data
196024ee227SWilliam Wang      val rdataSel = LookupTree(paddr(2, 0), List(
197024ee227SWilliam Wang        "b000".U -> rdata(63, 0),
198024ee227SWilliam Wang        "b001".U -> rdata(63, 8),
199024ee227SWilliam Wang        "b010".U -> rdata(63, 16),
200024ee227SWilliam Wang        "b011".U -> rdata(63, 24),
201024ee227SWilliam Wang        "b100".U -> rdata(63, 32),
202024ee227SWilliam Wang        "b101".U -> rdata(63, 40),
203024ee227SWilliam Wang        "b110".U -> rdata(63, 48),
204024ee227SWilliam Wang        "b111".U -> rdata(63, 56)
205024ee227SWilliam Wang      ))
206024ee227SWilliam Wang
207*f97664b3Swangkaifan      resp_data_wire := LookupTree(in.uop.ctrl.fuOpType, List(
208024ee227SWilliam Wang        LSUOpType.lr_w      -> SignExt(rdataSel(31, 0), XLEN),
2097962cc88SWilliam Wang        LSUOpType.sc_w      -> rdata,
210024ee227SWilliam Wang        LSUOpType.amoswap_w -> SignExt(rdataSel(31, 0), XLEN),
211024ee227SWilliam Wang        LSUOpType.amoadd_w  -> SignExt(rdataSel(31, 0), XLEN),
212024ee227SWilliam Wang        LSUOpType.amoxor_w  -> SignExt(rdataSel(31, 0), XLEN),
213024ee227SWilliam Wang        LSUOpType.amoand_w  -> SignExt(rdataSel(31, 0), XLEN),
214024ee227SWilliam Wang        LSUOpType.amoor_w   -> SignExt(rdataSel(31, 0), XLEN),
215024ee227SWilliam Wang        LSUOpType.amomin_w  -> SignExt(rdataSel(31, 0), XLEN),
216024ee227SWilliam Wang        LSUOpType.amomax_w  -> SignExt(rdataSel(31, 0), XLEN),
217024ee227SWilliam Wang        LSUOpType.amominu_w -> SignExt(rdataSel(31, 0), XLEN),
218024ee227SWilliam Wang        LSUOpType.amomaxu_w -> SignExt(rdataSel(31, 0), XLEN),
219024ee227SWilliam Wang
220024ee227SWilliam Wang        LSUOpType.lr_d      -> SignExt(rdataSel(63, 0), XLEN),
2217962cc88SWilliam Wang        LSUOpType.sc_d      -> rdata,
222024ee227SWilliam Wang        LSUOpType.amoswap_d -> SignExt(rdataSel(63, 0), XLEN),
223024ee227SWilliam Wang        LSUOpType.amoadd_d  -> SignExt(rdataSel(63, 0), XLEN),
224024ee227SWilliam Wang        LSUOpType.amoxor_d  -> SignExt(rdataSel(63, 0), XLEN),
225024ee227SWilliam Wang        LSUOpType.amoand_d  -> SignExt(rdataSel(63, 0), XLEN),
226024ee227SWilliam Wang        LSUOpType.amoor_d   -> SignExt(rdataSel(63, 0), XLEN),
227024ee227SWilliam Wang        LSUOpType.amomin_d  -> SignExt(rdataSel(63, 0), XLEN),
228024ee227SWilliam Wang        LSUOpType.amomax_d  -> SignExt(rdataSel(63, 0), XLEN),
229024ee227SWilliam Wang        LSUOpType.amominu_d -> SignExt(rdataSel(63, 0), XLEN),
230024ee227SWilliam Wang        LSUOpType.amomaxu_d -> SignExt(rdataSel(63, 0), XLEN)
231024ee227SWilliam Wang      ))
232024ee227SWilliam Wang
233*f97664b3Swangkaifan      resp_data := resp_data_wire
234024ee227SWilliam Wang      state := s_finish
235024ee227SWilliam Wang    }
236024ee227SWilliam Wang  }
237024ee227SWilliam Wang
238024ee227SWilliam Wang  when (state === s_finish) {
239024ee227SWilliam Wang    io.out.valid := true.B
240024ee227SWilliam Wang    io.out.bits.uop := in.uop
2410d045bd0SYinan Xu    io.out.bits.uop.cf.exceptionVec := exceptionVec
242024ee227SWilliam Wang    io.out.bits.uop.diffTestDebugLrScValid := is_lrsc_valid
243024ee227SWilliam Wang    io.out.bits.data := resp_data
244024ee227SWilliam Wang    io.out.bits.redirectValid := false.B
245024ee227SWilliam Wang    io.out.bits.redirect := DontCare
246024ee227SWilliam Wang    io.out.bits.brUpdate := DontCare
247cff68e26SWilliam Wang    io.out.bits.debug.isMMIO := is_mmio
24807635e87Swangkaifan    io.out.bits.debug.paddr := paddr
249024ee227SWilliam Wang    when (io.out.fire()) {
250024ee227SWilliam Wang      XSDebug("atomics writeback: pc %x data %x\n", io.out.bits.uop.cf.pc, io.dcache.resp.bits.data)
251024ee227SWilliam Wang      state := s_invalid
252024ee227SWilliam Wang    }
253024ee227SWilliam Wang  }
254024ee227SWilliam Wang
255024ee227SWilliam Wang  when(io.redirect.valid){
256024ee227SWilliam Wang    atom_override_xtval := false.B
257024ee227SWilliam Wang  }
2588a5bdd64Swangkaifan
2598a5bdd64Swangkaifan  if (env.DualCoreDifftest) {
2608a5bdd64Swangkaifan    difftestIO.atomicResp := WireInit(io.dcache.resp.fire())
2618a5bdd64Swangkaifan    difftestIO.atomicAddr := WireInit(paddr_reg)
2628a5bdd64Swangkaifan    difftestIO.atomicData := WireInit(data_reg)
2638a5bdd64Swangkaifan    difftestIO.atomicMask := WireInit(mask_reg)
264*f97664b3Swangkaifan    difftestIO.atomicFuop := WireInit(fuop_reg)
265*f97664b3Swangkaifan    difftestIO.atomicOut  := resp_data_wire
2668a5bdd64Swangkaifan  }
267024ee227SWilliam Wang}