| 1 | // SPDX-License-Identifier: GPL-2.0-only |
| 2 | /* |
| 3 | * Copyright (C) 2015 - ARM Ltd |
| 4 | * Author: Marc Zyngier <marc.zyngier@arm.com> |
| 5 | */ |
| 6 | |
| 7 | #include <linux/irqflags.h> |
| 8 | |
| 9 | #include <asm/kvm_hyp.h> |
| 10 | #include <asm/kvm_mmu.h> |
| 11 | #include <asm/tlbflush.h> |
| 12 | |
| 13 | struct tlb_inv_context { |
| 14 | struct kvm_s2_mmu *mmu; |
| 15 | unsigned long flags; |
| 16 | u64 tcr; |
| 17 | u64 sctlr; |
| 18 | }; |
| 19 | |
| 20 | static void enter_vmid_context(struct kvm_s2_mmu *mmu, |
| 21 | struct tlb_inv_context *cxt) |
| 22 | { |
| 23 | struct kvm_vcpu *vcpu = kvm_get_running_vcpu(); |
| 24 | u64 val; |
| 25 | |
| 26 | local_irq_save(cxt->flags); |
| 27 | |
| 28 | if (vcpu && mmu != vcpu->arch.hw_mmu) |
| 29 | cxt->mmu = vcpu->arch.hw_mmu; |
| 30 | else |
| 31 | cxt->mmu = NULL; |
| 32 | |
| 33 | if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) { |
| 34 | /* |
| 35 | * For CPUs that are affected by ARM errata 1165522 or 1530923, |
| 36 | * we cannot trust stage-1 to be in a correct state at that |
| 37 | * point. Since we do not want to force a full load of the |
| 38 | * vcpu state, we prevent the EL1 page-table walker to |
| 39 | * allocate new TLBs. This is done by setting the EPD bits |
| 40 | * in the TCR_EL1 register. We also need to prevent it to |
| 41 | * allocate IPA->PA walks, so we enable the S1 MMU... |
| 42 | */ |
| 43 | val = cxt->tcr = read_sysreg_el1(SYS_TCR); |
| 44 | val |= TCR_EPD1_MASK | TCR_EPD0_MASK; |
| 45 | write_sysreg_el1(val, SYS_TCR); |
| 46 | val = cxt->sctlr = read_sysreg_el1(SYS_SCTLR); |
| 47 | val |= SCTLR_ELx_M; |
| 48 | write_sysreg_el1(val, SYS_SCTLR); |
| 49 | } |
| 50 | |
| 51 | /* |
| 52 | * With VHE enabled, we have HCR_EL2.{E2H,TGE} = {1,1}, and |
| 53 | * most TLB operations target EL2/EL0. In order to affect the |
| 54 | * guest TLBs (EL1/EL0), we need to change one of these two |
| 55 | * bits. Changing E2H is impossible (goodbye TTBR1_EL2), so |
| 56 | * let's flip TGE before executing the TLB operation. |
| 57 | * |
| 58 | * ARM erratum 1165522 requires some special handling (again), |
| 59 | * as we need to make sure both stages of translation are in |
| 60 | * place before clearing TGE. __load_stage2() already |
| 61 | * has an ISB in order to deal with this. |
| 62 | */ |
| 63 | __load_stage2(mmu, mmu->arch); |
| 64 | val = read_sysreg(hcr_el2); |
| 65 | val &= ~HCR_TGE; |
| 66 | write_sysreg_hcr(val); |
| 67 | isb(); |
| 68 | } |
| 69 | |
| 70 | static void exit_vmid_context(struct tlb_inv_context *cxt) |
| 71 | { |
| 72 | /* |
| 73 | * We're done with the TLB operation, let's restore the host's |
| 74 | * view of HCR_EL2. |
| 75 | */ |
| 76 | write_sysreg_hcr(HCR_HOST_VHE_FLAGS); |
| 77 | isb(); |
| 78 | |
| 79 | /* ... and the stage-2 MMU context that we switched away from */ |
| 80 | if (cxt->mmu) |
| 81 | __load_stage2(cxt->mmu, cxt->mmu->arch); |
| 82 | |
| 83 | if (cpus_have_final_cap(ARM64_WORKAROUND_SPECULATIVE_AT)) { |
| 84 | /* Restore the registers to what they were */ |
| 85 | write_sysreg_el1(cxt->tcr, SYS_TCR); |
| 86 | write_sysreg_el1(cxt->sctlr, SYS_SCTLR); |
| 87 | } |
| 88 | |
| 89 | local_irq_restore(cxt->flags); |
| 90 | } |
| 91 | |
| 92 | void __kvm_tlb_flush_vmid_ipa(struct kvm_s2_mmu *mmu, |
| 93 | phys_addr_t ipa, int level) |
| 94 | { |
| 95 | struct tlb_inv_context cxt; |
| 96 | |
| 97 | dsb(ishst); |
| 98 | |
| 99 | /* Switch to requested VMID */ |
| 100 | enter_vmid_context(mmu, cxt: &cxt); |
| 101 | |
| 102 | /* |
| 103 | * We could do so much better if we had the VA as well. |
| 104 | * Instead, we invalidate Stage-2 for this IPA, and the |
| 105 | * whole of Stage-1. Weep... |
| 106 | */ |
| 107 | ipa >>= 12; |
| 108 | __tlbi_level(ipas2e1is, ipa, level); |
| 109 | |
| 110 | /* |
| 111 | * We have to ensure completion of the invalidation at Stage-2, |
| 112 | * since a table walk on another CPU could refill a TLB with a |
| 113 | * complete (S1 + S2) walk based on the old Stage-2 mapping if |
| 114 | * the Stage-1 invalidation happened first. |
| 115 | */ |
| 116 | dsb(ish); |
| 117 | __tlbi(vmalle1is); |
| 118 | dsb(ish); |
| 119 | isb(); |
| 120 | |
| 121 | exit_vmid_context(cxt: &cxt); |
| 122 | } |
| 123 | |
| 124 | void __kvm_tlb_flush_vmid_ipa_nsh(struct kvm_s2_mmu *mmu, |
| 125 | phys_addr_t ipa, int level) |
| 126 | { |
| 127 | struct tlb_inv_context cxt; |
| 128 | |
| 129 | dsb(nshst); |
| 130 | |
| 131 | /* Switch to requested VMID */ |
| 132 | enter_vmid_context(mmu, cxt: &cxt); |
| 133 | |
| 134 | /* |
| 135 | * We could do so much better if we had the VA as well. |
| 136 | * Instead, we invalidate Stage-2 for this IPA, and the |
| 137 | * whole of Stage-1. Weep... |
| 138 | */ |
| 139 | ipa >>= 12; |
| 140 | __tlbi_level(ipas2e1, ipa, level); |
| 141 | |
| 142 | /* |
| 143 | * We have to ensure completion of the invalidation at Stage-2, |
| 144 | * since a table walk on another CPU could refill a TLB with a |
| 145 | * complete (S1 + S2) walk based on the old Stage-2 mapping if |
| 146 | * the Stage-1 invalidation happened first. |
| 147 | */ |
| 148 | dsb(nsh); |
| 149 | __tlbi(vmalle1); |
| 150 | dsb(nsh); |
| 151 | isb(); |
| 152 | |
| 153 | exit_vmid_context(cxt: &cxt); |
| 154 | } |
| 155 | |
| 156 | void __kvm_tlb_flush_vmid_range(struct kvm_s2_mmu *mmu, |
| 157 | phys_addr_t start, unsigned long pages) |
| 158 | { |
| 159 | struct tlb_inv_context cxt; |
| 160 | unsigned long stride; |
| 161 | |
| 162 | /* |
| 163 | * Since the range of addresses may not be mapped at |
| 164 | * the same level, assume the worst case as PAGE_SIZE |
| 165 | */ |
| 166 | stride = PAGE_SIZE; |
| 167 | start = round_down(start, stride); |
| 168 | |
| 169 | dsb(ishst); |
| 170 | |
| 171 | /* Switch to requested VMID */ |
| 172 | enter_vmid_context(mmu, cxt: &cxt); |
| 173 | |
| 174 | __flush_s2_tlb_range_op(ipas2e1is, start, pages, stride, |
| 175 | TLBI_TTL_UNKNOWN); |
| 176 | |
| 177 | dsb(ish); |
| 178 | __tlbi(vmalle1is); |
| 179 | dsb(ish); |
| 180 | isb(); |
| 181 | |
| 182 | exit_vmid_context(cxt: &cxt); |
| 183 | } |
| 184 | |
| 185 | void __kvm_tlb_flush_vmid(struct kvm_s2_mmu *mmu) |
| 186 | { |
| 187 | struct tlb_inv_context cxt; |
| 188 | |
| 189 | dsb(ishst); |
| 190 | |
| 191 | /* Switch to requested VMID */ |
| 192 | enter_vmid_context(mmu, cxt: &cxt); |
| 193 | |
| 194 | __tlbi(vmalls12e1is); |
| 195 | dsb(ish); |
| 196 | isb(); |
| 197 | |
| 198 | exit_vmid_context(cxt: &cxt); |
| 199 | } |
| 200 | |
| 201 | void __kvm_flush_cpu_context(struct kvm_s2_mmu *mmu) |
| 202 | { |
| 203 | struct tlb_inv_context cxt; |
| 204 | |
| 205 | /* Switch to requested VMID */ |
| 206 | enter_vmid_context(mmu, cxt: &cxt); |
| 207 | |
| 208 | __tlbi(vmalle1); |
| 209 | asm volatile("ic iallu" ); |
| 210 | dsb(nsh); |
| 211 | isb(); |
| 212 | |
| 213 | exit_vmid_context(cxt: &cxt); |
| 214 | } |
| 215 | |
| 216 | void __kvm_flush_vm_context(void) |
| 217 | { |
| 218 | dsb(ishst); |
| 219 | __tlbi(alle1is); |
| 220 | dsb(ish); |
| 221 | } |
| 222 | |
| 223 | /* |
| 224 | * TLB invalidation emulation for NV. For any given instruction, we |
| 225 | * perform the following transformtions: |
| 226 | * |
| 227 | * - a TLBI targeting EL2 S1 is remapped to EL1 S1 |
| 228 | * - a non-shareable TLBI is upgraded to being inner-shareable |
| 229 | * - an outer-shareable TLBI is also mapped to inner-shareable |
| 230 | * - an nXS TLBI is upgraded to XS |
| 231 | */ |
| 232 | int __kvm_tlbi_s1e2(struct kvm_s2_mmu *mmu, u64 va, u64 sys_encoding) |
| 233 | { |
| 234 | struct tlb_inv_context cxt; |
| 235 | int ret = 0; |
| 236 | |
| 237 | /* |
| 238 | * The guest will have provided its own DSB ISHST before trapping. |
| 239 | * If it hasn't, that's its own problem, and we won't paper over it |
| 240 | * (plus, there is plenty of extra synchronisation before we even |
| 241 | * get here...). |
| 242 | */ |
| 243 | |
| 244 | if (mmu) |
| 245 | enter_vmid_context(mmu, cxt: &cxt); |
| 246 | |
| 247 | switch (sys_encoding) { |
| 248 | case OP_TLBI_ALLE2: |
| 249 | case OP_TLBI_ALLE2IS: |
| 250 | case OP_TLBI_ALLE2OS: |
| 251 | case OP_TLBI_VMALLE1: |
| 252 | case OP_TLBI_VMALLE1IS: |
| 253 | case OP_TLBI_VMALLE1OS: |
| 254 | case OP_TLBI_ALLE2NXS: |
| 255 | case OP_TLBI_ALLE2ISNXS: |
| 256 | case OP_TLBI_ALLE2OSNXS: |
| 257 | case OP_TLBI_VMALLE1NXS: |
| 258 | case OP_TLBI_VMALLE1ISNXS: |
| 259 | case OP_TLBI_VMALLE1OSNXS: |
| 260 | __tlbi(vmalle1is); |
| 261 | break; |
| 262 | case OP_TLBI_VAE2: |
| 263 | case OP_TLBI_VAE2IS: |
| 264 | case OP_TLBI_VAE2OS: |
| 265 | case OP_TLBI_VAE1: |
| 266 | case OP_TLBI_VAE1IS: |
| 267 | case OP_TLBI_VAE1OS: |
| 268 | case OP_TLBI_VAE2NXS: |
| 269 | case OP_TLBI_VAE2ISNXS: |
| 270 | case OP_TLBI_VAE2OSNXS: |
| 271 | case OP_TLBI_VAE1NXS: |
| 272 | case OP_TLBI_VAE1ISNXS: |
| 273 | case OP_TLBI_VAE1OSNXS: |
| 274 | __tlbi(vae1is, va); |
| 275 | break; |
| 276 | case OP_TLBI_VALE2: |
| 277 | case OP_TLBI_VALE2IS: |
| 278 | case OP_TLBI_VALE2OS: |
| 279 | case OP_TLBI_VALE1: |
| 280 | case OP_TLBI_VALE1IS: |
| 281 | case OP_TLBI_VALE1OS: |
| 282 | case OP_TLBI_VALE2NXS: |
| 283 | case OP_TLBI_VALE2ISNXS: |
| 284 | case OP_TLBI_VALE2OSNXS: |
| 285 | case OP_TLBI_VALE1NXS: |
| 286 | case OP_TLBI_VALE1ISNXS: |
| 287 | case OP_TLBI_VALE1OSNXS: |
| 288 | __tlbi(vale1is, va); |
| 289 | break; |
| 290 | case OP_TLBI_ASIDE1: |
| 291 | case OP_TLBI_ASIDE1IS: |
| 292 | case OP_TLBI_ASIDE1OS: |
| 293 | case OP_TLBI_ASIDE1NXS: |
| 294 | case OP_TLBI_ASIDE1ISNXS: |
| 295 | case OP_TLBI_ASIDE1OSNXS: |
| 296 | __tlbi(aside1is, va); |
| 297 | break; |
| 298 | case OP_TLBI_VAAE1: |
| 299 | case OP_TLBI_VAAE1IS: |
| 300 | case OP_TLBI_VAAE1OS: |
| 301 | case OP_TLBI_VAAE1NXS: |
| 302 | case OP_TLBI_VAAE1ISNXS: |
| 303 | case OP_TLBI_VAAE1OSNXS: |
| 304 | __tlbi(vaae1is, va); |
| 305 | break; |
| 306 | case OP_TLBI_VAALE1: |
| 307 | case OP_TLBI_VAALE1IS: |
| 308 | case OP_TLBI_VAALE1OS: |
| 309 | case OP_TLBI_VAALE1NXS: |
| 310 | case OP_TLBI_VAALE1ISNXS: |
| 311 | case OP_TLBI_VAALE1OSNXS: |
| 312 | __tlbi(vaale1is, va); |
| 313 | break; |
| 314 | case OP_TLBI_RVAE2: |
| 315 | case OP_TLBI_RVAE2IS: |
| 316 | case OP_TLBI_RVAE2OS: |
| 317 | case OP_TLBI_RVAE1: |
| 318 | case OP_TLBI_RVAE1IS: |
| 319 | case OP_TLBI_RVAE1OS: |
| 320 | case OP_TLBI_RVAE2NXS: |
| 321 | case OP_TLBI_RVAE2ISNXS: |
| 322 | case OP_TLBI_RVAE2OSNXS: |
| 323 | case OP_TLBI_RVAE1NXS: |
| 324 | case OP_TLBI_RVAE1ISNXS: |
| 325 | case OP_TLBI_RVAE1OSNXS: |
| 326 | __tlbi(rvae1is, va); |
| 327 | break; |
| 328 | case OP_TLBI_RVALE2: |
| 329 | case OP_TLBI_RVALE2IS: |
| 330 | case OP_TLBI_RVALE2OS: |
| 331 | case OP_TLBI_RVALE1: |
| 332 | case OP_TLBI_RVALE1IS: |
| 333 | case OP_TLBI_RVALE1OS: |
| 334 | case OP_TLBI_RVALE2NXS: |
| 335 | case OP_TLBI_RVALE2ISNXS: |
| 336 | case OP_TLBI_RVALE2OSNXS: |
| 337 | case OP_TLBI_RVALE1NXS: |
| 338 | case OP_TLBI_RVALE1ISNXS: |
| 339 | case OP_TLBI_RVALE1OSNXS: |
| 340 | __tlbi(rvale1is, va); |
| 341 | break; |
| 342 | case OP_TLBI_RVAAE1: |
| 343 | case OP_TLBI_RVAAE1IS: |
| 344 | case OP_TLBI_RVAAE1OS: |
| 345 | case OP_TLBI_RVAAE1NXS: |
| 346 | case OP_TLBI_RVAAE1ISNXS: |
| 347 | case OP_TLBI_RVAAE1OSNXS: |
| 348 | __tlbi(rvaae1is, va); |
| 349 | break; |
| 350 | case OP_TLBI_RVAALE1: |
| 351 | case OP_TLBI_RVAALE1IS: |
| 352 | case OP_TLBI_RVAALE1OS: |
| 353 | case OP_TLBI_RVAALE1NXS: |
| 354 | case OP_TLBI_RVAALE1ISNXS: |
| 355 | case OP_TLBI_RVAALE1OSNXS: |
| 356 | __tlbi(rvaale1is, va); |
| 357 | break; |
| 358 | default: |
| 359 | ret = -EINVAL; |
| 360 | } |
| 361 | dsb(ish); |
| 362 | isb(); |
| 363 | |
| 364 | if (mmu) |
| 365 | exit_vmid_context(cxt: &cxt); |
| 366 | |
| 367 | return ret; |
| 368 | } |
| 369 | |