1 // SPDX-License-Identifier: GPL-2.0
5 * Copyright (C) 2021 Western Digital Corporation or its affiliates.
8 #include <linux/compiler.h>
12 #include "processor.h"
/*
 * Address handed to __vm_vaddr_alloc() when vm_arch_vcpu_add() allocates a
 * vCPU stack (presumably the lowest guest virtual address to search from -
 * confirm against __vm_vaddr_alloc()).
 */
14 #define DEFAULT_RISCV_GUEST_STACK_VADDR_MIN 0xac0000
16 static uint64_t page_align(struct kvm_vm *vm, uint64_t v)
18 return (v + vm->page_size) & ~(vm->page_size - 1);
21 static uint64_t pte_addr(struct kvm_vm *vm, uint64_t entry)
23 return ((entry & PGTBL_PTE_ADDR_MASK) >> PGTBL_PTE_ADDR_SHIFT) <<
24 PGTBL_PAGE_SIZE_SHIFT;
27 static uint64_t ptrs_per_pte(struct kvm_vm *vm)
29 return PGTBL_PAGE_SIZE / sizeof(uint64_t);
/*
 * Per-level index masks: pte_index() ANDs a guest virtual address with the
 * entry selected by the page table level.
 */
32 static uint64_t pte_index_mask[] = {
/*
 * Per-level index shifts: pte_index() shifts the masked guest virtual address
 * right by the entry selected by the page table level.
 */
39 static uint32_t pte_index_shift[] = {
46 static uint64_t pte_index(struct kvm_vm *vm, vm_vaddr_t gva, int level)
48 TEST_ASSERT(level > -1,
49 "Negative page table level (%d) not possible", level);
50 TEST_ASSERT(level < vm->pgtable_levels,
51 "Invalid page table level (%d)", level);
53 return (gva & pte_index_mask[level]) >> pte_index_shift[level];
/*
 * Allocate the VM's top-level page table and record it in @vm.
 *
 * The table's guest physical address is stored in vm->pgd and
 * vm->pgd_created is set once the allocation has been made.
 */
56 void virt_arch_pgd_alloc(struct kvm_vm *vm)
/* Pages needed for ptrs_per_pte() entries of 8 bytes each. */
58 size_t nr_pages = page_align(vm, ptrs_per_pte(vm) * 8) / vm->page_size;
/*
 * Physical pages come from the memslot registered for page tables
 * (MEM_REGION_PT); KVM_GUEST_PAGE_TABLE_MIN_PADDR is presumably the lowest
 * physical address the allocator may return - confirm.
 */
63 vm->pgd = vm_phy_pages_alloc(vm, nr_pages,
64 KVM_GUEST_PAGE_TABLE_MIN_PADDR,
65 vm->memslots[MEM_REGION_PT]);
66 vm->pgd_created = true;
/*
 * Map guest virtual address @vaddr to guest physical address @paddr in the
 * VM's page tables.
 *
 * Both addresses must be page aligned, @vaddr must be marked valid in
 * vm->vpages_valid and the page number of @paddr must not exceed vm->max_gfn;
 * each condition is enforced with TEST_ASSERT.  Table entries are pointed at
 * freshly allocated page tables (and marked valid) where needed, and the
 * final entry is written with the page number of @paddr plus the permission
 * and valid bits.
 */
69 void virt_arch_pg_map(struct kvm_vm *vm, uint64_t vaddr, uint64_t paddr)
71 uint64_t *ptep, next_ppn;
/* The walk starts at the highest page table level. */
72 int level = vm->pgtable_levels - 1;
74 TEST_ASSERT((vaddr % vm->page_size) == 0,
75 "Virtual address not on page boundary,\n"
76 " vaddr: 0x%lx vm->page_size: 0x%x", vaddr, vm->page_size);
77 TEST_ASSERT(sparsebit_is_set(vm->vpages_valid,
78 (vaddr >> vm->page_shift)),
79 "Invalid virtual address, vaddr: 0x%lx", vaddr);
80 TEST_ASSERT((paddr % vm->page_size) == 0,
81 "Physical address not on page boundary,\n"
82 " paddr: 0x%lx vm->page_size: 0x%x", paddr, vm->page_size);
83 TEST_ASSERT((paddr >> vm->page_shift) <= vm->max_gfn,
84 "Physical address beyond maximum supported,\n"
85 " paddr: 0x%lx vm->max_gfn: 0x%lx vm->page_size: 0x%x",
86 paddr, vm->max_gfn, vm->page_size);
/*
 * Host pointer to the top-level entry covering vaddr.  The "* 8" turns the
 * entry index into a byte offset for 8-byte entries (assumes addr_gpa2hva()
 * returns a byte-granular pointer - confirm).
 */
88 ptep = addr_gpa2hva(vm, vm->pgd) + pte_index(vm, vaddr, level) * 8;
/* Allocate a next-level table and store its page number in the entry. */
90 next_ppn = vm_alloc_page_table(vm) >> PGTBL_PAGE_SIZE_SHIFT;
91 *ptep = (next_ppn << PGTBL_PTE_ADDR_SHIFT) |
97 ptep = addr_gpa2hva(vm, pte_addr(vm, *ptep)) +
98 pte_index(vm, vaddr, level) * 8;
99 if (!*ptep && level > 0) {
100 next_ppn = vm_alloc_page_table(vm) >>
101 PGTBL_PAGE_SIZE_SHIFT;
102 *ptep = (next_ppn << PGTBL_PTE_ADDR_SHIFT) |
103 PGTBL_PTE_VALID_MASK;
/* Final entry: page number of paddr with permission and valid bits set. */
108 paddr = paddr >> PGTBL_PAGE_SIZE_SHIFT;
109 *ptep = (paddr << PGTBL_PTE_ADDR_SHIFT) |
110 PGTBL_PTE_PERM_MASK | PGTBL_PTE_VALID_MASK;
/*
 * Translate guest virtual address @gva into a guest physical address by
 * walking the VM's page tables, starting at the highest level.
 *
 * On success the result is the address held in the last entry reached plus
 * the offset of @gva within its page.  A missing mapping is reported with
 * TEST_FAIL.
 */
113 vm_paddr_t addr_arch_gva2gpa(struct kvm_vm *vm, vm_vaddr_t gva)
116 int level = vm->pgtable_levels - 1;
/*
 * NOTE(review): a VM without a top-level table presumably goes straight to
 * the TEST_FAIL path below - confirm.
 */
118 if (!vm->pgd_created)
121 ptep = addr_gpa2hva(vm, vm->pgd) + pte_index(vm, gva, level) * 8;
127 ptep = addr_gpa2hva(vm, pte_addr(vm, *ptep)) +
128 pte_index(vm, gva, level) * 8;
/* Address from the entry plus the in-page offset of gva. */
134 return pte_addr(vm, *ptep) + (gva & (vm->page_size - 1));
137 TEST_FAIL("No mapping for vm virtual address gva: 0x%lx level: %d",
/*
 * Recursively print the page table located at guest physical address @page
 * to @stream.
 *
 * The loop steps through the table in 8-byte entries.  A printed line shows
 * the name for @level, the entry's guest physical address, the entry value
 * and the entry's host address, prefixed by @indent columns of padding; the
 * table the entry points to is then dumped at @level - 1 with one more column
 * of indentation.
 * NOTE(review): entries are presumably skipped when empty and the recursion
 * presumably stops at the lowest level - confirm.
 */
142 static void pte_dump(FILE *stream, struct kvm_vm *vm, uint8_t indent,
143 uint64_t page, int level)
/* Label printed for each level; indexed by level. */
146 static const char *const type[] = { "pte", "pmd", "pud", "p4d"};
152 for (pte = page; pte < page + ptrs_per_pte(vm) * 8; pte += 8) {
153 ptep = addr_gpa2hva(vm, pte);
156 fprintf(stream, "%*s%s: %lx: %lx at %p\n", indent, "",
157 type[level], pte, *ptep, ptep);
158 pte_dump(stream, vm, indent + 1,
159 pte_addr(vm, *ptep), level - 1);
/*
 * Print the VM's page tables to @stream, starting from the top-level table
 * at vm->pgd.
 *
 * The loop steps through the top-level table in 8-byte entries; a printed
 * line is prefixed by @indent columns of padding, and the table an entry
 * points to is handed to pte_dump() one level down with one more column of
 * indentation.
 * NOTE(review): the check on vm->pgd_created presumably returns early when no
 * top-level table exists, and empty entries are presumably skipped - confirm.
 */
164 void virt_arch_dump(FILE *stream, struct kvm_vm *vm, uint8_t indent)
166 int level = vm->pgtable_levels - 1;
169 if (!vm->pgd_created)
172 for (pgd = vm->pgd; pgd < vm->pgd + ptrs_per_pte(vm) * 8; pgd += 8) {
173 ptep = addr_gpa2hva(vm, pgd);
176 fprintf(stream, "%*spgd: %lx: %lx at %p\n", indent, "",
178 pte_dump(stream, vm, indent + 1,
179 pte_addr(vm, *ptep), level - 1);
/*
 * Program the vCPU's satp CSR from the VM's top-level page table.
 *
 * The guest mode check names three 48-bit-virtual-address, 4K-page modes;
 * TEST_FAIL reports an unknown guest mode.  satp is built from the page
 * number of vm->pgd (masked with SATP_PPN) ORed with SATP_MODE_48 and is
 * written with vcpu_set_reg().
 */
183 void riscv_vcpu_mmu_setup(struct kvm_vcpu *vcpu)
185 struct kvm_vm *vm = vcpu->vm;
189 * The RISC-V Sv48 MMU mode supports 56-bit physical address
190 * for 48-bit virtual address with 4KB last level page size.
193 case VM_MODE_P52V48_4K:
194 case VM_MODE_P48V48_4K:
195 case VM_MODE_P40V48_4K:
198 TEST_FAIL("Unknown guest mode, mode: 0x%x", vm->mode);
/* Root table page number in the PPN field, then select the 48-bit mode. */
201 satp = (vm->pgd >> PGTBL_PAGE_SIZE_SHIFT) & SATP_PPN;
202 satp |= SATP_MODE_48;
204 vcpu_set_reg(vcpu, RISCV_GENERAL_CSR_REG(satp), satp);
/*
 * Dump the vCPU's core register state.
 *
 * The mode and every core register (pc, ra, sp, gp, tp, t0-t6, s0-s11,
 * a0-a7) are fetched one at a time with vcpu_get_reg() into a local
 * struct kvm_riscv_core, then formatted as hexadecimal values, four
 * registers per output line after the mode line.
 */
207 void vcpu_arch_dump(FILE *stream, struct kvm_vcpu *vcpu, uint8_t indent)
209 struct kvm_riscv_core core;
/* Fetch each register individually into the local snapshot. */
211 vcpu_get_reg(vcpu, RISCV_CORE_REG(mode), &core.mode);
212 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.pc), &core.regs.pc);
213 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.ra), &core.regs.ra);
214 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.sp), &core.regs.sp);
215 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.gp), &core.regs.gp);
216 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.tp), &core.regs.tp);
217 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t0), &core.regs.t0);
218 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t1), &core.regs.t1);
219 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t2), &core.regs.t2);
220 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s0), &core.regs.s0);
221 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s1), &core.regs.s1);
222 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a0), &core.regs.a0);
223 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a1), &core.regs.a1);
224 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a2), &core.regs.a2);
225 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a3), &core.regs.a3);
226 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a4), &core.regs.a4);
227 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a5), &core.regs.a5);
228 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a6), &core.regs.a6);
229 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.a7), &core.regs.a7);
230 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s2), &core.regs.s2);
231 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s3), &core.regs.s3);
232 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s4), &core.regs.s4);
233 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s5), &core.regs.s5);
234 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s6), &core.regs.s6);
235 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s7), &core.regs.s7);
236 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s8), &core.regs.s8);
237 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s9), &core.regs.s9);
238 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s10), &core.regs.s10);
239 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.s11), &core.regs.s11);
240 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t3), &core.regs.t3);
241 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t4), &core.regs.t4);
242 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t5), &core.regs.t5);
243 vcpu_get_reg(vcpu, RISCV_CORE_REG(regs.t6), &core.regs.t6);
/* Format the snapshot: mode first, then four registers per line. */
246 " MODE: 0x%lx\n", core.mode);
248 " PC: 0x%016lx RA: 0x%016lx SP: 0x%016lx GP: 0x%016lx\n",
249 core.regs.pc, core.regs.ra, core.regs.sp, core.regs.gp);
251 " TP: 0x%016lx T0: 0x%016lx T1: 0x%016lx T2: 0x%016lx\n",
252 core.regs.tp, core.regs.t0, core.regs.t1, core.regs.t2);
254 " S0: 0x%016lx S1: 0x%016lx A0: 0x%016lx A1: 0x%016lx\n",
255 core.regs.s0, core.regs.s1, core.regs.a0, core.regs.a1);
257 " A2: 0x%016lx A3: 0x%016lx A4: 0x%016lx A5: 0x%016lx\n",
258 core.regs.a2, core.regs.a3, core.regs.a4, core.regs.a5);
260 " A6: 0x%016lx A7: 0x%016lx S2: 0x%016lx S3: 0x%016lx\n",
261 core.regs.a6, core.regs.a7, core.regs.s2, core.regs.s3);
263 " S4: 0x%016lx S5: 0x%016lx S6: 0x%016lx S7: 0x%016lx\n",
264 core.regs.s4, core.regs.s5, core.regs.s6, core.regs.s7);
266 " S8: 0x%016lx S9: 0x%016lx S10: 0x%016lx S11: 0x%016lx\n",
267 core.regs.s8, core.regs.s9, core.regs.s10, core.regs.s11);
269 " T3: 0x%016lx T4: 0x%016lx T5: 0x%016lx T6: 0x%016lx\n",
270 core.regs.t3, core.regs.t4, core.regs.t5, core.regs.t6);
/*
 * Guest-side trap handler that vm_arch_vcpu_add() installs in stvec as the
 * default exception vector.  It issues an SBI call with the selftests
 * extension id and the KVM_RISCV_SELFTESTS_SBI_UNEXP function id (presumably
 * so the host side can notice a trap the test did not expect - confirm).
 * The function is declared with 16-byte alignment.
 */
273 static void __aligned(16) guest_unexp_trap(void)
275 sbi_ecall(KVM_RISCV_SELFTESTS_SBI_EXT,
276 KVM_RISCV_SELFTESTS_SBI_UNEXP,
280 void vcpu_arch_set_entry_point(struct kvm_vcpu *vcpu, void *guest_code)
282 vcpu_set_reg(vcpu, RISCV_CORE_REG(regs.pc), (unsigned long)guest_code);
/*
 * Create vCPU @vcpu_id in @vm and give it its initial RISC-V state.
 *
 * A guest stack is allocated, the vCPU is created with __vm_vcpu_add(), its
 * MMU is configured with riscv_vcpu_mmu_setup(), it is put into the runnable
 * MP state, and its gp, sp and stvec registers are initialised.
 */
285 struct kvm_vcpu *vm_arch_vcpu_add(struct kvm_vm *vm, uint32_t vcpu_id)
289 unsigned long stack_vaddr;
290 unsigned long current_gp = 0;
291 struct kvm_mp_state mps;
292 struct kvm_vcpu *vcpu;
/* With 4096-byte pages the stack spans DEFAULT_STACK_PGS pages. */
294 stack_size = vm->page_size == 4096 ? DEFAULT_STACK_PGS * vm->page_size :
296 stack_vaddr = __vm_vaddr_alloc(vm, stack_size,
297 DEFAULT_RISCV_GUEST_STACK_VADDR_MIN,
300 vcpu = __vm_vcpu_add(vm, vcpu_id);
301 riscv_vcpu_mmu_setup(vcpu);
304 * With SBI HSM support in KVM RISC-V, all secondary VCPUs are
305 * powered-off by default so we ensure that all secondary VCPUs
306 * are powered-on using KVM_SET_MP_STATE ioctl().
308 mps.mp_state = KVM_MP_STATE_RUNNABLE;
309 r = __vcpu_ioctl(vcpu, KVM_SET_MP_STATE, &mps);
310 TEST_ASSERT(!r, "IOCTL KVM_SET_MP_STATE failed (error %d)", r);
312 /* Setup global pointer of guest to be same as the host */
314 "add %0, gp, zero" : "=r" (current_gp) : : "memory");
315 vcpu_set_reg(vcpu, RISCV_CORE_REG(regs.gp), current_gp);
317 /* Setup stack pointer and program counter of guest */
318 vcpu_set_reg(vcpu, RISCV_CORE_REG(regs.sp), stack_vaddr + stack_size);
/*
 * sp is set to the end of the stack allocation (stack_vaddr + stack_size).
 * NOTE(review): only the sp write is visible here; the pc register is
 * written by vcpu_arch_set_entry_point().
 */
320 /* Setup default exception vector of guest */
321 vcpu_set_reg(vcpu, RISCV_GENERAL_CSR_REG(stvec), (unsigned long)guest_unexp_trap);
/*
 * Store @num variadic arguments into the vCPU's argument registers.
 *
 * @num must be between 1 and 8 inclusive, enforced with TEST_ASSERT.  For
 * each argument a register id from a0 through a7 is selected (presumably by
 * argument position - confirm) and the next uint64_t vararg is written to it
 * with vcpu_set_reg().
 */
326 void vcpu_args_set(struct kvm_vcpu *vcpu, unsigned int num, ...)
329 uint64_t id = RISCV_CORE_REG(regs.a0);
332 TEST_ASSERT(num >= 1 && num <= 8, "Unsupported number of args,\n"
337 for (i = 0; i < num; i++) {
340 id = RISCV_CORE_REG(regs.a0);
343 id = RISCV_CORE_REG(regs.a1);
346 id = RISCV_CORE_REG(regs.a2);
349 id = RISCV_CORE_REG(regs.a3);
352 id = RISCV_CORE_REG(regs.a4);
355 id = RISCV_CORE_REG(regs.a5);
358 id = RISCV_CORE_REG(regs.a6);
361 id = RISCV_CORE_REG(regs.a7);
/* Every argument is read from the va_list as a uint64_t. */
364 vcpu_set_reg(vcpu, id, va_arg(ap, uint64_t));
/*
 * Hook taking the vCPU to check for an unhandled guest exception.
 * NOTE(review): no statements of the body are visible here; presumably a
 * no-op on RISC-V - confirm.
 */
370 void assert_on_unhandled_exception(struct kvm_vcpu *vcpu)
/*
 * Issue an SBI call with extension id @ext and function id @fid.
 *
 * The six call arguments are bound to registers a0-a5, @fid to a6 and @ext
 * to a7.  a0 and a1 are read-write asm operands, so they also carry values
 * back out of the call; a2-a7 are input-only operands.
 * NOTE(review): the returned struct sbiret is presumably filled from a0
 * (error) and a1 (value) - confirm against the SBI calling convention.
 */
374 struct sbiret sbi_ecall(int ext, int fid, unsigned long arg0,
375 unsigned long arg1, unsigned long arg2,
376 unsigned long arg3, unsigned long arg4,
/* Pin each value to the register the call expects it in. */
379 register uintptr_t a0 asm ("a0") = (uintptr_t)(arg0);
380 register uintptr_t a1 asm ("a1") = (uintptr_t)(arg1);
381 register uintptr_t a2 asm ("a2") = (uintptr_t)(arg2);
382 register uintptr_t a3 asm ("a3") = (uintptr_t)(arg3);
383 register uintptr_t a4 asm ("a4") = (uintptr_t)(arg4);
384 register uintptr_t a5 asm ("a5") = (uintptr_t)(arg5);
385 register uintptr_t a6 asm ("a6") = (uintptr_t)(fid);
386 register uintptr_t a7 asm ("a7") = (uintptr_t)(ext);
391 : "+r" (a0), "+r" (a1)
392 : "r" (a2), "r" (a3), "r" (a4), "r" (a5), "r" (a6), "r" (a7)
/*
 * Probe, from guest code, whether SBI extension @extid is available, using
 * the probe function of the SBI base extension.
 *
 * The call must either succeed or fail with SBI_ERR_NOT_SUPPORTED; any other
 * error trips __GUEST_ASSERT.  The value returned by the call is stored
 * through @out_val.
 * NOTE(review): presumably returns false on SBI_ERR_NOT_SUPPORTED and true
 * otherwise, and the store to @out_val may be guarded by a NULL check -
 * confirm.
 */
400 bool guest_sbi_probe_extension(int extid, long *out_val)
404 ret = sbi_ecall(SBI_EXT_BASE, SBI_EXT_BASE_PROBE_EXT, extid,
407 __GUEST_ASSERT(!ret.error || ret.error == SBI_ERR_NOT_SUPPORTED,
408 "ret.error=%ld, ret.value=%ld\n", ret.error, ret.value);
410 if (ret.error == SBI_ERR_NOT_SUPPORTED)
414 *out_val = ret.value;