1/*************************************************************************************** 2* Copyright (c) 2020-2021 Institute of Computing Technology, Chinese Academy of Sciences 3* Copyright (c) 2020-2021 Peng Cheng Laboratory 4* 5* XiangShan is licensed under Mulan PSL v2. 6* You can use this software according to the terms and conditions of the Mulan PSL v2. 7* You may obtain a copy of Mulan PSL v2 at: 8* http://license.coscl.org.cn/MulanPSL2 9 10* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, 11* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, 12* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE. 13* 14* See the Mulan PSL v2 for more details. 15***************************************************************************************/ 16 17package xiangshan.cache.mmu 18 19import org.chipsalliance.cde.config.Parameters 20import chisel3._ 21import chisel3.util._ 22import difftest._ 23import freechips.rocketchip.util.SRAMAnnotation 24import xiangshan._ 25import utils._ 26import utility._ 27import xiangshan.backend.fu.{PMPChecker, PMPReqBundle, PMPConfig => XSPMPConfig} 28import xiangshan.backend.rob.RobPtr 29import xiangshan.backend.fu.util.HasCSRConst 30import freechips.rocketchip.rocket.PMPConfig 31 32/** TLB module 33 * support block request and non-block request io at the same time 34 * return paddr at next cycle, then go for pmp/pma check 35 * @param Width: The number of requestors 36 * @param Block: Blocked or not for each requestor ports 37 * @param q: TLB Parameters, like entry number, each TLB has its own parameters 38 * @param p: XiangShan Paramemters, like XLEN 39 */ 40 41class TLB(Width: Int, nRespDups: Int = 1, Block: Seq[Boolean], q: TLBParameters)(implicit p: Parameters) extends TlbModule 42 with HasCSRConst 43 with HasPerfEvents 44{ 45 val io = IO(new TlbIO(Width, nRespDups, q)) 46 47 val req = io.requestor.map(_.req) 48 val resp = io.requestor.map(_.resp) 49 val ptw = io.ptw 50 val pmp = io.pmp 51 val refill_to_mem = io.refill_to_mem 52 53 /** Sfence.vma & Svinval 54 * Sfence.vma will 1. flush old entries 2. flush inflight 3. flush pipe 55 * Svinval will 1. flush old entries 2. flush inflight 56 * So, Svinval will not flush pipe, which means 57 * it should not drop reqs from pipe and should return right resp 58 */ 59 val sfence = DelayN(io.sfence, q.fenceDelay) 60 val csr = io.csr 61 val satp = DelayN(io.csr.satp, q.fenceDelay) 62 val vsatp = DelayN(io.csr.vsatp, q.fenceDelay) 63 val hgatp = DelayN(io.csr.hgatp, q.fenceDelay) 64 65 val flush_mmu = DelayN(sfence.valid || csr.satp.changed || csr.vsatp.changed || csr.hgatp.changed, q.fenceDelay) 66 val mmu_flush_pipe = DelayN(sfence.valid && sfence.bits.flushPipe, q.fenceDelay) // for svinval, won't flush pipe 67 val flush_pipe = io.flushPipe 68 val redirect = io.redirect 69 val req_in = req 70 val req_out = req.map(a => RegEnable(a.bits, a.fire)) 71 val req_out_v = (0 until Width).map(i => ValidHold(req_in(i).fire && !req_in(i).bits.kill, resp(i).fire, flush_pipe(i))) 72 73 val isHyperInst = (0 until Width).map(i => req_out_v(i) && req_out(i).hyperinst) 74 75 // ATTENTION: csr and flush from backend are delayed. csr should not be later than flush. 76 // because, csr will influence tlb behavior. 77 val ifecth = if (q.fetchi) true.B else false.B 78 val mode_tmp = if (q.useDmode) csr.priv.dmode else csr.priv.imode 79 val mode = (0 until Width).map(i => Mux(isHyperInst(i), csr.priv.spvp, mode_tmp)) 80 val virt_in = csr.priv.virt 81 val virt_out = req.map(a => RegEnable(csr.priv.virt, a.fire)) 82 val sum = (0 until Width).map(i => Mux(virt_out(i) || isHyperInst(i), io.csr.priv.vsum, io.csr.priv.sum)) 83 val mxr = (0 until Width).map(i => Mux(virt_out(i) || isHyperInst(i), io.csr.priv.vmxr || io.csr.priv.mxr, io.csr.priv.mxr)) 84 val req_in_s2xlate = (0 until Width).map(i => MuxCase(noS2xlate, Seq( 85 (!(virt_in || req_in(i).bits.hyperinst)) -> noS2xlate, 86 (csr.vsatp.mode =/= 0.U && csr.hgatp.mode =/= 0.U) -> allStage, 87 (csr.vsatp.mode === 0.U) -> onlyStage2, 88 (csr.hgatp.mode === 0.U) -> onlyStage1 89 ))) 90 val req_out_s2xlate = (0 until Width).map(i => MuxCase(noS2xlate, Seq( 91 (!(virt_out(i) || isHyperInst(i))) -> noS2xlate, 92 (csr.vsatp.mode =/= 0.U && csr.hgatp.mode =/= 0.U) -> allStage, 93 (csr.vsatp.mode === 0.U) -> onlyStage2, 94 (csr.hgatp.mode === 0.U) -> onlyStage1 95 ))) 96 val need_gpa = RegInit(false.B) 97 val need_gpa_robidx = Reg(new RobPtr) 98 val need_gpa_vpn = Reg(UInt(vpnLen.W)) 99 val need_gpa_gvpn = Reg(UInt(vpnLen.W)) 100 val resp_gpa_refill = RegInit(false.B) 101 val hasGpf = Wire(Vec(Width, Bool())) 102 103 val vmEnable = (0 until Width).map(i => !(isHyperInst(i) || virt_out(i)) && (if (EnbaleTlbDebug) (satp.mode === 8.U) 104 else (satp.mode === 8.U) && (mode(i) < ModeM))) 105 val s2xlateEnable = (0 until Width).map(i => (isHyperInst(i) || virt_out(i)) && (vsatp.mode === 8.U || hgatp.mode === 8.U) && (mode(i) < ModeM)) 106 val portTranslateEnable = (0 until Width).map(i => (vmEnable(i) || s2xlateEnable(i)) && RegEnable(!req(i).bits.no_translate, req(i).valid)) 107 108 109 val refill = ptw.resp.fire && !(ptw.resp.bits.getGpa) && !flush_mmu 110 refill_to_mem := DontCare 111 val entries = Module(new TlbStorageWrapper(Width, q, nRespDups)) 112 entries.io.base_connect(sfence, csr, satp) 113 if (q.outReplace) { io.replace <> entries.io.replace } 114 for (i <- 0 until Width) { 115 entries.io.r_req_apply(io.requestor(i).req.valid, get_pn(req_in(i).bits.vaddr), i, req_in_s2xlate(i)) 116 entries.io.w_apply(refill, ptw.resp.bits) 117 // TODO: RegNext enable:req.valid 118 resp(i).bits.debug.isFirstIssue := RegEnable(req(i).bits.debug.isFirstIssue, req(i).valid) 119 resp(i).bits.debug.robIdx := RegEnable(req(i).bits.debug.robIdx, req(i).valid) 120 } 121 122 // read TLB, get hit/miss, paddr, perm bits 123 val readResult = (0 until Width).map(TLBRead(_)) 124 val hitVec = readResult.map(_._1) 125 val missVec = readResult.map(_._2) 126 val pmp_addr = readResult.map(_._3) 127 val perm = readResult.map(_._4) 128 val g_perm = readResult.map(_._5) 129 // check pmp use paddr (for timing optization, use pmp_addr here) 130 // check permisson 131 (0 until Width).foreach{i => 132 pmp_check(pmp_addr(i), req_out(i).size, req_out(i).cmd, i) 133 for (d <- 0 until nRespDups) { 134 perm_check(perm(i)(d), req_out(i).cmd, i, d, g_perm(i)(d), req_out(i).hlvx, req_out_s2xlate(i)) 135 } 136 hasGpf(i) := resp(i).bits.excp(0).gpf.ld || resp(i).bits.excp(0).gpf.st || resp(i).bits.excp(0).gpf.instr 137 } 138 139 // handle block or non-block io 140 // for non-block io, just return the above result, send miss to ptw 141 // for block io, hold the request, send miss to ptw, 142 // when ptw back, return the result 143 (0 until Width) foreach {i => 144 if (Block(i)) handle_block(i) 145 else handle_nonblock(i) 146 } 147 io.ptw.resp.ready := true.B 148 149 /************************ main body above | method/log/perf below ****************************/ 150 def TLBRead(i: Int) = { 151 val (e_hit, e_ppn, e_perm, e_g_perm, e_s2xlate) = entries.io.r_resp_apply(i) 152 val (p_hit, p_ppn, p_perm, p_gvpn, p_g_perm, p_s2xlate) = ptw_resp_bypass(get_pn(req_in(i).bits.vaddr), req_in_s2xlate(i)) 153 val enable = portTranslateEnable(i) 154 val isOnlys2xlate = req_out_s2xlate(i) === onlyStage2 155 val need_gpa_vpn_hit = need_gpa_vpn === get_pn(req_out(i).vaddr) 156 val isitlb = TlbCmd.isExec(req_out(i).cmd) 157 158 when (!isitlb && need_gpa_robidx.needFlush(redirect) || isitlb && flush_pipe(i)){ 159 need_gpa := false.B 160 resp_gpa_refill := false.B 161 need_gpa_vpn := 0.U 162 }.elsewhen (req_out_v(i) && !p_hit && !(resp_gpa_refill && need_gpa_vpn_hit) && !isOnlys2xlate && hasGpf(i) && need_gpa === false.B && !io.requestor(i).req_kill) { 163 need_gpa := true.B 164 need_gpa_vpn := get_pn(req_out(i).vaddr) 165 resp_gpa_refill := false.B 166 need_gpa_robidx := req_out(i).debug.robIdx 167 }.elsewhen (ptw.resp.fire && need_gpa && need_gpa_vpn === ptw.resp.bits.getVpn(need_gpa_vpn)) { 168 need_gpa_gvpn := ptw.resp.bits.s2.entry.tag 169 resp_gpa_refill := true.B 170 } 171 172 when (req_out_v(i) && hasGpf(i) && resp_gpa_refill && need_gpa_vpn_hit ){ 173 need_gpa := false.B 174 } 175 176 TimeOutAssert(need_gpa && !resp_gpa_refill, timeOutThreshold, s"port{i} need gpa long time not refill.") 177 178 val hit = e_hit || p_hit 179 val miss = (!hit && enable) || hasGpf(i) && !p_hit && !(resp_gpa_refill && need_gpa_vpn_hit) && !isOnlys2xlate 180 hit.suggestName(s"hit_read_${i}") 181 miss.suggestName(s"miss_read_${i}") 182 183 val vaddr = SignExt(req_out(i).vaddr, PAddrBits) 184 resp(i).bits.miss := miss 185 resp(i).bits.ptwBack := ptw.resp.fire 186 resp(i).bits.memidx := RegEnable(req_in(i).bits.memidx, req_in(i).valid) 187 188 val ppn = WireInit(VecInit(Seq.fill(nRespDups)(0.U(ppnLen.W)))) 189 val perm = WireInit(VecInit(Seq.fill(nRespDups)(0.U.asTypeOf(new TlbPermBundle)))) 190 val gvpn = WireInit(VecInit(Seq.fill(nRespDups)(0.U(vpnLen.W)))) 191 val g_perm = WireInit(VecInit(Seq.fill(nRespDups)(0.U.asTypeOf(new TlbPermBundle)))) 192 val r_s2xlate = WireInit(VecInit(Seq.fill(nRespDups)(0.U(2.W)))) 193 for (d <- 0 until nRespDups) { 194 ppn(d) := Mux(p_hit, p_ppn, e_ppn(d)) 195 perm(d) := Mux(p_hit, p_perm, e_perm(d)) 196 gvpn(d) := Mux(hasGpf(i), Mux(p_hit, p_gvpn, need_gpa_gvpn), 0.U) 197 g_perm(d) := Mux(p_hit, p_g_perm, e_g_perm(d)) 198 r_s2xlate(d) := Mux(p_hit, p_s2xlate, e_s2xlate(d)) 199 val paddr = Cat(ppn(d), get_off(req_out(i).vaddr)) 200 val gpaddr = Cat(gvpn(d), get_off(req_out(i).vaddr)) 201 resp(i).bits.paddr(d) := Mux(enable, paddr, vaddr) 202 resp(i).bits.gpaddr(d) := Mux(r_s2xlate(d) === onlyStage2, vaddr, gpaddr) 203 } 204 205 XSDebug(req_out_v(i), p"(${i.U}) hit:${hit} miss:${miss} ppn:${Hexadecimal(ppn(0))} perm:${perm(0)}\n") 206 207 val pmp_paddr = resp(i).bits.paddr(0) 208 209 (hit, miss, pmp_paddr, perm, g_perm) 210 } 211 212 def pmp_check(addr: UInt, size: UInt, cmd: UInt, idx: Int): Unit = { 213 pmp(idx).valid := resp(idx).valid 214 pmp(idx).bits.addr := addr 215 pmp(idx).bits.size := size 216 pmp(idx).bits.cmd := cmd 217 } 218 219 def perm_check(perm: TlbPermBundle, cmd: UInt, idx: Int, nDups: Int, g_perm: TlbPermBundle, hlvx: Bool, s2xlate: UInt) = { 220 // for timing optimization, pmp check is divided into dynamic and static 221 // dynamic: superpage (or full-connected reg entries) -> check pmp when translation done 222 // static: 4K pages (or sram entries) -> check pmp with pre-checked results 223 val hasS2xlate = s2xlate =/= noS2xlate 224 val onlyS2 = s2xlate === onlyStage2 225 val af = perm.af || (hasS2xlate && g_perm.af) 226 227 // Stage 1 perm check 228 val pf = perm.pf 229 val ldUpdate = !perm.a && TlbCmd.isRead(cmd) && !TlbCmd.isAmo(cmd) // update A/D through exception 230 val stUpdate = (!perm.a || !perm.d) && (TlbCmd.isWrite(cmd) || TlbCmd.isAmo(cmd)) // update A/D through exception 231 val instrUpdate = !perm.a && TlbCmd.isExec(cmd) // update A/D through exception 232 val modeCheck = !(mode(idx) === ModeU && !perm.u || mode(idx) === ModeS && perm.u && (!sum(idx) || ifecth)) 233 val ldPermFail = !(modeCheck && Mux(hlvx, perm.x, perm.r || mxr(idx) && perm.x)) 234 val stPermFail = !(modeCheck && perm.w) 235 val instrPermFail = !(modeCheck && perm.x) 236 val ldPf = (ldPermFail || pf) && (TlbCmd.isRead(cmd) && !TlbCmd.isAmo(cmd)) 237 val stPf = (stPermFail || pf) && (TlbCmd.isWrite(cmd) || TlbCmd.isAmo(cmd)) 238 val instrPf = (instrPermFail || pf) && TlbCmd.isExec(cmd) 239 val s1_valid = portTranslateEnable(idx) && !onlyS2 240 241 // Stage 2 perm check 242 val gpf = g_perm.pf 243 val g_ldUpdate = !g_perm.a && TlbCmd.isRead(cmd) && !TlbCmd.isAmo(cmd) 244 val g_stUpdate = (!g_perm.a || !g_perm.d) && (TlbCmd.isWrite(cmd) || TlbCmd.isAmo(cmd)) 245 val g_instrUpdate = !g_perm.a && TlbCmd.isExec(cmd) 246 val g_ldPermFail = !Mux(hlvx, g_perm.x, (g_perm.r || io.csr.priv.mxr && g_perm.x)) 247 val g_stPermFail = !g_perm.w 248 val g_instrPermFail = !g_perm.x 249 val ldGpf = (g_ldPermFail || gpf) && (TlbCmd.isRead(cmd) && !TlbCmd.isAmo(cmd)) 250 val stGpf = (g_stPermFail || gpf) && (TlbCmd.isWrite(cmd) || TlbCmd.isAmo(cmd)) 251 val instrGpf = (g_instrPermFail || gpf) && TlbCmd.isExec(cmd) 252 val s2_valid = hasS2xlate && portTranslateEnable(idx) 253 254 val fault_valid = s1_valid || s2_valid 255 256 // when pf and gpf can't happens simultaneously 257 val hasPf = (ldPf || ldUpdate || stPf || stUpdate || instrPf || instrUpdate) && s1_valid && !af 258 resp(idx).bits.excp(nDups).pf.ld := (ldPf || ldUpdate) && s1_valid && !af 259 resp(idx).bits.excp(nDups).pf.st := (stPf || stUpdate) && s1_valid && !af 260 resp(idx).bits.excp(nDups).pf.instr := (instrPf || instrUpdate) && s1_valid && !af 261 // NOTE: pf need && with !af, page fault has higher priority than access fault 262 // but ptw may also have access fault, then af happens, the translation is wrong. 263 // In this case, pf has lower priority than af 264 265 resp(idx).bits.excp(nDups).gpf.ld := (ldGpf || g_ldUpdate) && s2_valid && !af && !hasPf 266 resp(idx).bits.excp(nDups).gpf.st := (stGpf || g_stUpdate) && s2_valid && !af && !hasPf 267 resp(idx).bits.excp(nDups).gpf.instr := (instrGpf || g_instrUpdate) && s2_valid && !af && !hasPf 268 269 resp(idx).bits.excp(nDups).af.ld := af && TlbCmd.isRead(cmd) && fault_valid 270 resp(idx).bits.excp(nDups).af.st := af && TlbCmd.isWrite(cmd) && fault_valid 271 resp(idx).bits.excp(nDups).af.instr := af && TlbCmd.isExec(cmd) && fault_valid 272 273 274 } 275 276 def handle_nonblock(idx: Int): Unit = { 277 io.requestor(idx).resp.valid := req_out_v(idx) 278 io.requestor(idx).req.ready := io.requestor(idx).resp.ready // should always be true 279 XSError(!io.requestor(idx).resp.ready, s"${q.name} port ${idx} is non-block, resp.ready must be true.B") 280 281 val req_need_gpa = hasGpf(idx) 282 val req_s2xlate = Wire(UInt(2.W)) 283 req_s2xlate := MuxCase(noS2xlate, Seq( 284 (!(virt_out(idx) || req_out(idx).hyperinst)) -> noS2xlate, 285 (csr.vsatp.mode =/= 0.U && csr.hgatp.mode =/= 0.U) -> allStage, 286 (csr.vsatp.mode === 0.U) -> onlyStage2, 287 (csr.hgatp.mode === 0.U || req_need_gpa) -> onlyStage1 288 )) 289 290 val ptw_just_back = ptw.resp.fire && req_s2xlate === ptw.resp.bits.s2xlate && ptw.resp.bits.hit(get_pn(req_out(idx).vaddr), io.csr.satp.asid, io.csr.vsatp.asid, io.csr.hgatp.asid, true, false) 291 // TODO: RegNext enable: ptw.resp.valid ? req.valid 292 val ptw_resp_bits_reg = RegEnable(ptw.resp.bits, ptw.resp.valid) 293 val ptw_already_back = GatedValidRegNext(ptw.resp.fire) && req_s2xlate === ptw_resp_bits_reg.s2xlate && ptw_resp_bits_reg.hit(get_pn(req_out(idx).vaddr), io.csr.satp.asid, io.csr.vsatp.asid, io.csr.hgatp.asid, allType = true) 294 io.ptw.req(idx).valid := req_out_v(idx) && missVec(idx) && !(ptw_just_back || ptw_already_back) // TODO: remove the regnext, timing 295 io.tlbreplay(idx) := req_out_v(idx) && missVec(idx) && (ptw_just_back || ptw_already_back) 296 when (io.requestor(idx).req_kill && GatedValidRegNext(io.requestor(idx).req.fire)) { 297 io.ptw.req(idx).valid := false.B 298 io.tlbreplay(idx) := true.B 299 } 300 io.ptw.req(idx).bits.vpn := get_pn(req_out(idx).vaddr) 301 io.ptw.req(idx).bits.s2xlate := req_s2xlate 302 io.ptw.req(idx).bits.getGpa := req_need_gpa && hitVec(idx) 303 io.ptw.req(idx).bits.memidx := req_out(idx).memidx 304 } 305 306 def handle_block(idx: Int): Unit = { 307 // three valid: 1.if exist a entry; 2.if sent to ptw; 3.unset resp.valid 308 io.requestor(idx).req.ready := !req_out_v(idx) || io.requestor(idx).resp.fire 309 // req_out_v for if there is a request, may long latency, fixme 310 311 // miss request entries 312 val req_need_gpa = hasGpf(idx) 313 val miss_req_vpn = get_pn(req_out(idx).vaddr) 314 val miss_req_memidx = req_out(idx).memidx 315 val miss_req_s2xlate = Wire(UInt(2.W)) 316 miss_req_s2xlate := MuxCase(noS2xlate, Seq( 317 (!(virt_out(idx) || req_out(idx).hyperinst)) -> noS2xlate, 318 (csr.vsatp.mode =/= 0.U && csr.hgatp.mode =/= 0.U) -> allStage, 319 (csr.vsatp.mode === 0.U) -> onlyStage2, 320 (csr.hgatp.mode === 0.U || req_need_gpa) -> onlyStage1 321 )) 322 val miss_req_s2xlate_reg = RegEnable(miss_req_s2xlate, io.ptw.req(idx).fire) 323 val hasS2xlate = miss_req_s2xlate_reg =/= noS2xlate 324 val onlyS2 = miss_req_s2xlate_reg === onlyStage2 325 val hit_s1 = io.ptw.resp.bits.s1.hit(miss_req_vpn, Mux(hasS2xlate, io.csr.vsatp.asid, io.csr.satp.asid), io.csr.hgatp.asid, allType = true, false, hasS2xlate) 326 val hit_s2 = io.ptw.resp.bits.s2.hit(miss_req_vpn, io.csr.hgatp.asid) 327 val hit = Mux(onlyS2, hit_s2, hit_s1) && io.ptw.resp.valid && miss_req_s2xlate_reg === io.ptw.resp.bits.s2xlate 328 329 val new_coming_valid = WireInit(false.B) 330 new_coming_valid := req_in(idx).fire && !req_in(idx).bits.kill && !flush_pipe(idx) 331 val new_coming = GatedValidRegNext(new_coming_valid) 332 val miss_wire = new_coming && missVec(idx) 333 val miss_v = ValidHoldBypass(miss_wire, resp(idx).fire, flush_pipe(idx)) 334 val miss_req_v = ValidHoldBypass(miss_wire || (miss_v && flush_mmu && !mmu_flush_pipe), 335 io.ptw.req(idx).fire || resp(idx).fire, flush_pipe(idx)) 336 337 // when ptw resp, check if hit, reset miss_v, resp to lsu/ifu 338 resp(idx).valid := req_out_v(idx) && !(miss_v && portTranslateEnable(idx)) 339 when (io.ptw.resp.fire && hit && req_out_v(idx) && portTranslateEnable(idx)) { 340 val stage1 = io.ptw.resp.bits.s1 341 val stage2 = io.ptw.resp.bits.s2 342 val s2xlate = io.ptw.resp.bits.s2xlate 343 resp(idx).valid := true.B 344 resp(idx).bits.miss := false.B 345 val s1_paddr = Cat(stage1.genPPN(get_pn(req_out(idx).vaddr)), get_off(req_out(idx).vaddr)) 346 val s2_paddr = Cat(stage2.genPPNS2(get_pn(req_out(idx).vaddr)), get_off(req_out(idx).vaddr)) 347 for (d <- 0 until nRespDups) { 348 resp(idx).bits.paddr(d) := Mux(s2xlate =/= noS2xlate, s2_paddr, s1_paddr) 349 resp(idx).bits.gpaddr(d) := s1_paddr 350 perm_check(stage1, req_out(idx).cmd, idx, d, stage2, req_out(idx).hlvx, s2xlate) 351 } 352 pmp_check(resp(idx).bits.paddr(0), req_out(idx).size, req_out(idx).cmd, idx) 353 354 // NOTE: the unfiltered req would be handled by Repeater 355 } 356 assert(RegNext(!resp(idx).valid || resp(idx).ready, true.B), "when tlb resp valid, ready should be true, must") 357 assert(RegNext(req_out_v(idx) || !(miss_v || miss_req_v), true.B), "when not req_out_v, should not set miss_v/miss_req_v") 358 359 val ptw_req = io.ptw.req(idx) 360 ptw_req.valid := miss_req_v 361 ptw_req.bits.vpn := miss_req_vpn 362 ptw_req.bits.s2xlate := miss_req_s2xlate 363 ptw_req.bits.getGpa := req_need_gpa && hitVec(idx) 364 ptw_req.bits.memidx := miss_req_memidx 365 366 io.tlbreplay(idx) := false.B 367 368 // NOTE: when flush pipe, tlb should abandon last req 369 // however, some outside modules like icache, dont care flushPipe, and still waiting for tlb resp 370 // just resp valid and raise page fault to go through. The pipe(ifu) will abandon it. 371 if (!q.outsideRecvFlush) { 372 when (req_out_v(idx) && flush_pipe(idx) && portTranslateEnable(idx)) { 373 resp(idx).valid := true.B 374 for (d <- 0 until nRespDups) { 375 resp(idx).bits.excp(d).pf.ld := true.B // sfence happened, pf for not to use this addr 376 resp(idx).bits.excp(d).pf.st := true.B 377 resp(idx).bits.excp(d).pf.instr := true.B 378 } 379 } 380 } 381 } 382 383 // when ptw resp, tlb at refill_idx maybe set to miss by force. 384 // Bypass ptw resp to check. 385 def ptw_resp_bypass(vpn: UInt, s2xlate: UInt) = { 386 // TODO: RegNext enable: ptw.resp.valid 387 val hasS2xlate = s2xlate =/= noS2xlate 388 val onlyS2 = s2xlate === onlyStage2 389 val onlyS1 = s2xlate === onlyStage1 390 val s2xlate_hit = s2xlate === ptw.resp.bits.s2xlate 391 val resp_hit = ptw.resp.bits.hit(vpn, io.csr.satp.asid, io.csr.vsatp.asid, io.csr.hgatp.asid, true, false) 392 val p_hit = GatedValidRegNext(resp_hit && io.ptw.resp.fire && s2xlate_hit) 393 val ppn_s1 = ptw.resp.bits.s1.genPPN(vpn) 394 val gvpn = Mux(onlyS2, vpn, ppn_s1) 395 val ppn_s2 = ptw.resp.bits.s2.genPPNS2(gvpn) 396 val p_ppn = RegEnable(Mux(hasS2xlate, ppn_s2, ppn_s1), io.ptw.resp.fire) 397 val p_perm = RegEnable(ptwresp_to_tlbperm(ptw.resp.bits.s1), io.ptw.resp.fire) 398 val p_gvpn = RegEnable(Mux(onlyS2, ptw.resp.bits.s2.entry.tag, ppn_s1), io.ptw.resp.fire) 399 val p_g_perm = RegEnable(hptwresp_to_tlbperm(ptw.resp.bits.s2), io.ptw.resp.fire) 400 val p_s2xlate = RegEnable(ptw.resp.bits.s2xlate, io.ptw.resp.fire) 401 (p_hit, p_ppn, p_perm, p_gvpn, p_g_perm, p_s2xlate) 402 } 403 404 // assert 405 for(i <- 0 until Width) { 406 TimeOutAssert(req_out_v(i) && !resp(i).valid, timeOutThreshold, s"{q.name} port{i} long time no resp valid.") 407 } 408 409 // perf event 410 val result_ok = req_in.map(a => GatedValidRegNext(a.fire)) 411 val perfEvents = 412 Seq( 413 ("access", PopCount((0 until Width).map{i => if (Block(i)) io.requestor(i).req.fire else portTranslateEnable(i) && result_ok(i) })), 414 ("miss ", PopCount((0 until Width).map{i => if (Block(i)) portTranslateEnable(i) && result_ok(i) && missVec(i) else ptw.req(i).fire })), 415 ) 416 generatePerfEvent() 417 418 // perf log 419 for (i <- 0 until Width) { 420 if (Block(i)) { 421 XSPerfAccumulate(s"access${i}",result_ok(i) && portTranslateEnable(i)) 422 XSPerfAccumulate(s"miss${i}", result_ok(i) && missVec(i)) 423 } else { 424 XSPerfAccumulate("first_access" + Integer.toString(i, 10), result_ok(i) && portTranslateEnable(i) && RegEnable(req(i).bits.debug.isFirstIssue, req(i).valid)) 425 XSPerfAccumulate("access" + Integer.toString(i, 10), result_ok(i) && portTranslateEnable(i)) 426 XSPerfAccumulate("first_miss" + Integer.toString(i, 10), result_ok(i) && portTranslateEnable(i) && missVec(i) && RegEnable(req(i).bits.debug.isFirstIssue, req(i).valid)) 427 XSPerfAccumulate("miss" + Integer.toString(i, 10), result_ok(i) && portTranslateEnable(i) && missVec(i)) 428 } 429 } 430 XSPerfAccumulate("ptw_resp_count", ptw.resp.fire) 431 XSPerfAccumulate("ptw_resp_pf_count", ptw.resp.fire && ptw.resp.bits.s1.pf) 432 433 // Log 434 for(i <- 0 until Width) { 435 XSDebug(req(i).valid, p"req(${i.U}): (${req(i).valid} ${req(i).ready}) ${req(i).bits}\n") 436 XSDebug(resp(i).valid, p"resp(${i.U}): (${resp(i).valid} ${resp(i).ready}) ${resp(i).bits}\n") 437 } 438 439 XSDebug(io.sfence.valid, p"Sfence: ${io.sfence}\n") 440 XSDebug(ParallelOR(req_out_v) || ptw.resp.valid, p"vmEnable:${vmEnable} hit:${Binary(VecInit(hitVec).asUInt)} miss:${Binary(VecInit(missVec).asUInt)}\n") 441 for (i <- ptw.req.indices) { 442 XSDebug(ptw.req(i).fire, p"L2TLB req:${ptw.req(i).bits}\n") 443 } 444 XSDebug(ptw.resp.valid, p"L2TLB resp:${ptw.resp.bits} (v:${ptw.resp.valid}r:${ptw.resp.ready}) \n") 445 446 println(s"${q.name}: page: ${q.NWays} ${q.Associative} ${q.Replacer.get}") 447 448 if (env.EnableDifftest) { 449 for (i <- 0 until Width) { 450 val pf = io.requestor(i).resp.bits.excp(0).pf.instr || io.requestor(i).resp.bits.excp(0).pf.st || io.requestor(i).resp.bits.excp(0).pf.ld 451 val gpf = io.requestor(i).resp.bits.excp(0).gpf.instr || io.requestor(i).resp.bits.excp(0).gpf.st || io.requestor(i).resp.bits.excp(0).gpf.ld 452 val af = io.requestor(i).resp.bits.excp(0).af.instr || io.requestor(i).resp.bits.excp(0).af.st || io.requestor(i).resp.bits.excp(0).af.ld 453 val difftest = DifftestModule(new DiffL1TLBEvent) 454 difftest.coreid := io.hartId 455 difftest.valid := RegNext(io.requestor(i).req.fire) && !io.requestor(i).req_kill && io.requestor(i).resp.fire && !io.requestor(i).resp.bits.miss && !pf && !af && !gpf && portTranslateEnable(i) 456 if (!Seq("itlb", "ldtlb", "sttlb").contains(q.name)) { 457 difftest.valid := false.B 458 } 459 difftest.index := TLBDiffId(p(XSCoreParamsKey).HartId).U 460 difftest.vpn := RegEnable(get_pn(req_in(i).bits.vaddr), req_in(i).valid) 461 difftest.ppn := get_pn(io.requestor(i).resp.bits.paddr(0)) 462 difftest.satp := Cat(io.csr.satp.mode, io.csr.satp.asid, io.csr.satp.ppn) 463 difftest.vsatp := Cat(io.csr.vsatp.mode, io.csr.vsatp.asid, io.csr.vsatp.ppn) 464 difftest.hgatp := Cat(io.csr.hgatp.mode, io.csr.hgatp.asid, io.csr.hgatp.ppn) 465 val req_need_gpa = gpf 466 val req_s2xlate = Wire(UInt(2.W)) 467 req_s2xlate := MuxCase(noS2xlate, Seq( 468 (!RegNext(virt_in || req_in(i).bits.hyperinst)) -> noS2xlate, 469 (vsatp.mode =/= 0.U && hgatp.mode =/= 0.U) -> allStage, 470 (vsatp.mode === 0.U) -> onlyStage2, 471 (hgatp.mode === 0.U || req_need_gpa) -> onlyStage1 472 )) 473 difftest.s2xlate := req_s2xlate 474 } 475 } 476} 477 478object TLBDiffId { 479 var i: Int = 0 480 var lastHartId: Int = -1 481 def apply(hartId: Int): Int = { 482 if (lastHartId != hartId) { 483 i = 0 484 lastHartId = hartId 485 } 486 i += 1 487 i - 1 488 } 489} 490 491class TLBNonBlock(Width: Int, nRespDups: Int = 1, q: TLBParameters)(implicit p: Parameters) extends TLB(Width, nRespDups, Seq.fill(Width)(false), q) 492class TLBBLock(Width: Int, nRespDups: Int = 1, q: TLBParameters)(implicit p: Parameters) extends TLB(Width, nRespDups, Seq.fill(Width)(true), q) 493 494class TlbReplace(Width: Int, q: TLBParameters)(implicit p: Parameters) extends TlbModule { 495 val io = IO(new TlbReplaceIO(Width, q)) 496 497 if (q.Associative == "fa") { 498 val re = ReplacementPolicy.fromString(q.Replacer, q.NWays) 499 re.access(io.page.access.map(_.touch_ways)) 500 io.page.refillIdx := re.way 501 } else { // set-acco && plru 502 val re = ReplacementPolicy.fromString(q.Replacer, q.NSets, q.NWays) 503 re.access(io.page.access.map(_.sets), io.page.access.map(_.touch_ways)) 504 io.page.refillIdx := { if (q.NWays == 1) 0.U else re.way(io.page.chosen_set) } 505 } 506} 507