1/*************************************************************************************** 2* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3* Copyright (c) 2020-2021 Peng Cheng Laboratory 4* 5* XiangShan is licensed under Mulan PSL v2. 6* You can use this software according to the terms and conditions of the Mulan PSL v2. 7* You may obtain a copy of Mulan PSL v2 at: 8* http://license.coscl.org.cn/MulanPSL2 9* 10* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13* 14* See the Mulan PSL v2 for more details. 15***************************************************************************************/ 16 17package xiangshan.mem 18 19import chipsalliance.rocketchip.config.Parameters 20import chisel3._ 21import chisel3.util._ 22import utils._ 23import utility._ 24import xiangshan.ExceptionNO._ 25import xiangshan._ 26import xiangshan.backend.fu.PMPRespBundle 27import xiangshan.cache.mmu.{TlbCmd, TlbReq, TlbRequestIO, TlbResp} 28 29// Store Pipeline Stage 0 30// Generate addr, use addr to query DCache and DTLB 31class StoreUnit_S0(implicit p: Parameters) extends XSModule { 32 val io = IO(new Bundle() { 33 val in = Flipped(Decoupled(new ExuInput)) 34 val rsIdx = Input(UInt(log2Up(IssQueSize).W)) 35 val isFirstIssue = Input(Bool()) 36 val out = Decoupled(new LsPipelineBundle) 37 val dtlbReq = DecoupledIO(new TlbReq) 38 }) 39 40 // send req to dtlb 41 // val saddr = io.in.bits.src(0) + SignExt(io.in.bits.uop.ctrl.imm(11,0), VAddrBits) 42 val imm12 = WireInit(io.in.bits.uop.ctrl.imm(11,0)) 43 val saddr_lo = io.in.bits.src(0)(11,0) + Cat(0.U(1.W), imm12) 44 val saddr_hi = Mux(saddr_lo(12), 45 Mux(imm12(11), io.in.bits.src(0)(VAddrBits-1, 12), io.in.bits.src(0)(VAddrBits-1, 12)+1.U), 46 Mux(imm12(11), io.in.bits.src(0)(VAddrBits-1, 12)+SignExt(1.U, VAddrBits-12), io.in.bits.src(0)(VAddrBits-1, 12)), 47 ) 48 val saddr = Cat(saddr_hi, saddr_lo(11,0)) 49 50 io.dtlbReq.bits.vaddr := saddr 51 io.dtlbReq.valid := io.in.valid 52 io.dtlbReq.bits.cmd := TlbCmd.write 53 io.dtlbReq.bits.size := LSUOpType.size(io.in.bits.uop.ctrl.fuOpType) 54 io.dtlbReq.bits.kill := DontCare 55 io.dtlbReq.bits.debug.robIdx := io.in.bits.uop.robIdx 56 io.dtlbReq.bits.debug.pc := io.in.bits.uop.cf.pc 57 io.dtlbReq.bits.debug.isFirstIssue := io.isFirstIssue 58 59 io.out.bits := DontCare 60 io.out.bits.vaddr := saddr 61 62 // Now data use its own io 63 // io.out.bits.data := genWdata(io.in.bits.src(1), io.in.bits.uop.ctrl.fuOpType(1,0)) 64 io.out.bits.data := io.in.bits.src(1) // FIXME: remove data from pipeline 65 io.out.bits.uop := io.in.bits.uop 66 io.out.bits.miss := DontCare 67 io.out.bits.rsIdx := io.rsIdx 68 io.out.bits.mask := genWmask(io.out.bits.vaddr, io.in.bits.uop.ctrl.fuOpType(1,0)) 69 io.out.bits.isFirstIssue := io.isFirstIssue 70 io.out.bits.wlineflag := io.in.bits.uop.ctrl.fuOpType === LSUOpType.cbo_zero 71 io.out.valid := io.in.valid 72 io.in.ready := io.out.ready 73 74 // exception check 75 val addrAligned = LookupTree(io.in.bits.uop.ctrl.fuOpType(1,0), List( 76 "b00".U -> true.B, //b 77 "b01".U -> (io.out.bits.vaddr(0) === 0.U), //h 78 "b10".U -> (io.out.bits.vaddr(1,0) === 0.U), //w 79 "b11".U -> (io.out.bits.vaddr(2,0) === 0.U) //d 80 )) 81 82 io.out.bits.uop.cf.exceptionVec(storeAddrMisaligned) := !addrAligned 83 84 XSPerfAccumulate("in_valid", io.in.valid) 85 XSPerfAccumulate("in_fire", io.in.fire) 86 XSPerfAccumulate("in_fire_first_issue", io.in.fire && io.isFirstIssue) 87 XSPerfAccumulate("addr_spec_success", io.out.fire() && saddr(VAddrBits-1, 12) === io.in.bits.src(0)(VAddrBits-1, 12)) 88 XSPerfAccumulate("addr_spec_failed", io.out.fire() && saddr(VAddrBits-1, 12) =/= io.in.bits.src(0)(VAddrBits-1, 12)) 89 XSPerfAccumulate("addr_spec_success_once", io.out.fire() && saddr(VAddrBits-1, 12) === io.in.bits.src(0)(VAddrBits-1, 12) && io.isFirstIssue) 90 XSPerfAccumulate("addr_spec_failed_once", io.out.fire() && saddr(VAddrBits-1, 12) =/= io.in.bits.src(0)(VAddrBits-1, 12) && io.isFirstIssue) 91} 92 93// Store Pipeline Stage 1 94// TLB resp (send paddr to dcache) 95class StoreUnit_S1(implicit p: Parameters) extends XSModule { 96 val io = IO(new Bundle() { 97 val in = Flipped(Decoupled(new LsPipelineBundle)) 98 val out = Decoupled(new LsPipelineBundle) 99 val lsq = ValidIO(new LsPipelineBundle()) 100 val dtlbResp = Flipped(DecoupledIO(new TlbResp())) 101 val rsFeedback = ValidIO(new RSFeedback) 102 val reExecuteQuery = Valid(new LoadReExecuteQueryIO) 103 }) 104 105 // mmio cbo decoder 106 val is_mmio_cbo = io.in.bits.uop.ctrl.fuOpType === LSUOpType.cbo_clean || 107 io.in.bits.uop.ctrl.fuOpType === LSUOpType.cbo_flush || 108 io.in.bits.uop.ctrl.fuOpType === LSUOpType.cbo_inval 109 110 val s1_paddr = io.dtlbResp.bits.paddr(0) 111 val s1_tlb_miss = io.dtlbResp.bits.miss 112 val s1_mmio = is_mmio_cbo 113 val s1_exception = ExceptionNO.selectByFu(io.out.bits.uop.cf.exceptionVec, staCfg).asUInt.orR 114 115 io.in.ready := true.B 116 117 io.dtlbResp.ready := true.B // TODO: why dtlbResp needs a ready? 118 119 // st-ld violation dectect request. 120 io.reExecuteQuery.valid := io.in.valid && !s1_tlb_miss 121 io.reExecuteQuery.bits.robIdx := io.in.bits.uop.robIdx 122 io.reExecuteQuery.bits.paddr := s1_paddr 123 io.reExecuteQuery.bits.mask := io.in.bits.mask 124 125 // Send TLB feedback to store issue queue 126 // Store feedback is generated in store_s1, sent to RS in store_s2 127 io.rsFeedback.valid := io.in.valid 128 io.rsFeedback.bits.hit := !s1_tlb_miss 129 io.rsFeedback.bits.flushState := io.dtlbResp.bits.ptwBack 130 io.rsFeedback.bits.rsIdx := io.in.bits.rsIdx 131 io.rsFeedback.bits.sourceType := RSFeedbackType.tlbMiss 132 XSDebug(io.rsFeedback.valid, 133 "S1 Store: tlbHit: %d robIdx: %d\n", 134 io.rsFeedback.bits.hit, 135 io.rsFeedback.bits.rsIdx 136 ) 137 io.rsFeedback.bits.dataInvalidSqIdx := DontCare 138 139 // get paddr from dtlb, check if rollback is needed 140 // writeback store inst to lsq 141 io.out.valid := io.in.valid && !s1_tlb_miss 142 io.out.bits := io.in.bits 143 io.out.bits.paddr := s1_paddr 144 io.out.bits.miss := false.B 145 io.out.bits.mmio := s1_mmio 146 io.out.bits.atomic := s1_mmio 147 io.out.bits.uop.cf.exceptionVec(storePageFault) := io.dtlbResp.bits.excp(0).pf.st 148 io.out.bits.uop.cf.exceptionVec(storeAccessFault) := io.dtlbResp.bits.excp(0).af.st 149 150 io.lsq.valid := io.in.valid 151 io.lsq.bits := io.out.bits 152 io.lsq.bits.miss := s1_tlb_miss 153 154 // mmio inst with exception will be writebacked immediately 155 // io.out.valid := io.in.valid && (!io.out.bits.mmio || s1_exception) && !s1_tlb_miss 156 157 XSPerfAccumulate("in_valid", io.in.valid) 158 XSPerfAccumulate("in_fire", io.in.fire) 159 XSPerfAccumulate("in_fire_first_issue", io.in.fire && io.in.bits.isFirstIssue) 160 XSPerfAccumulate("tlb_miss", io.in.fire && s1_tlb_miss) 161 XSPerfAccumulate("tlb_miss_first_issue", io.in.fire && s1_tlb_miss && io.in.bits.isFirstIssue) 162} 163 164class StoreUnit_S2(implicit p: Parameters) extends XSModule { 165 val io = IO(new Bundle() { 166 val in = Flipped(Decoupled(new LsPipelineBundle)) 167 val pmpResp = Flipped(new PMPRespBundle) 168 val static_pm = Input(Valid(Bool())) 169 val out = Decoupled(new LsPipelineBundle) 170 }) 171 val pmp = WireInit(io.pmpResp) 172 when (io.static_pm.valid) { 173 pmp.ld := false.B 174 pmp.st := false.B 175 pmp.instr := false.B 176 pmp.mmio := io.static_pm.bits 177 } 178 179 val s2_exception = ExceptionNO.selectByFu(io.out.bits.uop.cf.exceptionVec, staCfg).asUInt.orR 180 val is_mmio = io.in.bits.mmio || pmp.mmio 181 182 io.in.ready := true.B 183 io.out.bits := io.in.bits 184 io.out.bits.mmio := is_mmio && !s2_exception 185 io.out.bits.atomic := io.in.bits.atomic || pmp.atomic 186 io.out.bits.uop.cf.exceptionVec(storeAccessFault) := io.in.bits.uop.cf.exceptionVec(storeAccessFault) || pmp.st 187 io.out.valid := io.in.valid && (!is_mmio || s2_exception) 188} 189 190class StoreUnit_S3(implicit p: Parameters) extends XSModule { 191 val io = IO(new Bundle() { 192 val in = Flipped(Decoupled(new LsPipelineBundle)) 193 val stout = DecoupledIO(new ExuOutput) // writeback store 194 }) 195 196 io.in.ready := true.B 197 198 io.stout.valid := io.in.valid 199 io.stout.bits.uop := io.in.bits.uop 200 io.stout.bits.data := DontCare 201 io.stout.bits.redirectValid := false.B 202 io.stout.bits.redirect := DontCare 203 io.stout.bits.debug.isMMIO := io.in.bits.mmio 204 io.stout.bits.debug.paddr := io.in.bits.paddr 205 io.stout.bits.debug.vaddr := io.in.bits.vaddr 206 io.stout.bits.debug.isPerfCnt := false.B 207 io.stout.bits.fflags := DontCare 208 209} 210 211class StoreUnit(implicit p: Parameters) extends XSModule { 212 val io = IO(new Bundle() { 213 val stin = Flipped(Decoupled(new ExuInput)) 214 val redirect = Flipped(ValidIO(new Redirect)) 215 val feedbackSlow = ValidIO(new RSFeedback) 216 val tlb = new TlbRequestIO() 217 val pmp = Flipped(new PMPRespBundle()) 218 val rsIdx = Input(UInt(log2Up(IssQueSize).W)) 219 val isFirstIssue = Input(Bool()) 220 val lsq = ValidIO(new LsPipelineBundle) 221 val lsq_replenish = Output(new LsPipelineBundle()) 222 val stout = DecoupledIO(new ExuOutput) // writeback store 223 // store mask, send to sq in store_s0 224 val storeMaskOut = Valid(new StoreMaskBundle) 225 val reExecuteQuery = Valid(new LoadReExecuteQueryIO) 226 val issue = Valid(new ExuInput) 227 }) 228 229 val store_s0 = Module(new StoreUnit_S0) 230 val store_s1 = Module(new StoreUnit_S1) 231 val store_s2 = Module(new StoreUnit_S2) 232 val store_s3 = Module(new StoreUnit_S3) 233 234 store_s0.io.in <> io.stin 235 store_s0.io.dtlbReq <> io.tlb.req 236 io.tlb.req_kill := false.B 237 store_s0.io.rsIdx := io.rsIdx 238 store_s0.io.isFirstIssue := io.isFirstIssue 239 240 io.storeMaskOut.valid := store_s0.io.in.valid 241 io.storeMaskOut.bits.mask := store_s0.io.out.bits.mask 242 io.storeMaskOut.bits.sqIdx := store_s0.io.out.bits.uop.sqIdx 243 244 PipelineConnect(store_s0.io.out, store_s1.io.in, true.B, store_s0.io.out.bits.uop.robIdx.needFlush(io.redirect)) 245 io.issue.valid := store_s1.io.in.valid && !store_s1.io.dtlbResp.bits.miss 246 io.issue.bits := RegEnable(store_s0.io.in.bits, store_s0.io.in.valid) 247 248 store_s1.io.dtlbResp <> io.tlb.resp 249 io.lsq <> store_s1.io.lsq 250 io.reExecuteQuery := store_s1.io.reExecuteQuery 251 252 PipelineConnect(store_s1.io.out, store_s2.io.in, true.B, store_s1.io.out.bits.uop.robIdx.needFlush(io.redirect)) 253 254 // feedback tlb miss to RS in store_s2 255 io.feedbackSlow.bits := RegNext(store_s1.io.rsFeedback.bits) 256 io.feedbackSlow.valid := RegNext(store_s1.io.rsFeedback.valid && !store_s1.io.out.bits.uop.robIdx.needFlush(io.redirect)) 257 258 store_s2.io.pmpResp <> io.pmp 259 store_s2.io.static_pm := RegNext(io.tlb.resp.bits.static_pm) 260 io.lsq_replenish := store_s2.io.out.bits // mmio and exception 261 PipelineConnect(store_s2.io.out, store_s3.io.in, true.B, store_s2.io.out.bits.uop.robIdx.needFlush(io.redirect)) 262 263 store_s3.io.stout <> io.stout 264 265 private def printPipeLine(pipeline: LsPipelineBundle, cond: Bool, name: String): Unit = { 266 XSDebug(cond, 267 p"$name" + p" pc ${Hexadecimal(pipeline.uop.cf.pc)} " + 268 p"addr ${Hexadecimal(pipeline.vaddr)} -> ${Hexadecimal(pipeline.paddr)} " + 269 p"op ${Binary(pipeline.uop.ctrl.fuOpType)} " + 270 p"data ${Hexadecimal(pipeline.data)} " + 271 p"mask ${Hexadecimal(pipeline.mask)}\n" 272 ) 273 } 274 275 printPipeLine(store_s0.io.out.bits, store_s0.io.out.valid, "S0") 276 printPipeLine(store_s1.io.out.bits, store_s1.io.out.valid, "S1") 277} 278