diff --git a/arch/riscv/include/asm/kvm_cove.h b/arch/riscv/include/asm/kvm_cove.h index 38c280509c51..f9ce258dfab8 100644 --- a/arch/riscv/include/asm/kvm_cove.h +++ b/arch/riscv/include/asm/kvm_cove.h @@ -138,7 +138,10 @@ int kvm_riscv_cove_init(void); /* TVM related functions */ void kvm_riscv_cove_vm_destroy(struct kvm *kvm); -int kvm_riscv_cove_vm_init(struct kvm *kvm); +int kvm_riscv_cove_vm_single_step_init(struct kvm_vcpu *vcpu, + unsigned long fdt_address, + unsigned long tap_addr); +int kvm_riscv_cove_vm_multi_step_init(struct kvm *kvm); /* TVM VCPU related functions */ void kvm_riscv_cove_vcpu_destroy(struct kvm_vcpu *vcpu); @@ -173,7 +176,13 @@ static inline int kvm_riscv_cove_hardware_enable(void) {return 0; } /* TVM related functions */ static inline void kvm_riscv_cove_vm_destroy(struct kvm *kvm) {} -static inline int kvm_riscv_cove_vm_init(struct kvm *kvm) {return -1; } +static inline int kvm_riscv_cove_vm_single_step_init(struct kvm_vcpu *vcpu, + unsigned long fdt_address, + unsigned long tap_addr) +{ + return -1; +} +static inline int kvm_riscv_cove_vm_multi_step_init(struct kvm *kvm) {return -1; } /* TVM VCPU related functions */ static inline void kvm_riscv_cove_vcpu_destroy(struct kvm_vcpu *vcpu) {} diff --git a/arch/riscv/include/asm/kvm_cove_sbi.h b/arch/riscv/include/asm/kvm_cove_sbi.h index c9302650adc8..1314227adfad 100644 --- a/arch/riscv/include/asm/kvm_cove_sbi.h +++ b/arch/riscv/include/asm/kvm_cove_sbi.h @@ -78,6 +78,10 @@ int sbi_covh_tvm_demote_page(unsigned long tvmid, int sbi_covh_tvm_remove_pages(unsigned long tvmid, unsigned long tvm_base_page_addr, unsigned long len); +int sbi_covh_tsm_promote_to_tvm(unsigned long fdt_address, + unsigned long tap_addr, + unsigned long sepc, + unsigned long *tvmid); /* Functions related to CoVE Interrupt Management(COVI) Extension */ int sbi_covi_tvm_aia_init(unsigned long tvm_gid, struct sbi_cove_tvm_aia_params *tvm_aia_params); diff --git a/arch/riscv/include/asm/sbi.h b/arch/riscv/include/asm/sbi.h index 57c3579ae652..01e9e5b1d7a2 100644 --- a/arch/riscv/include/asm/sbi.h +++ b/arch/riscv/include/asm/sbi.h @@ -374,6 +374,7 @@ enum sbi_ext_covh_fid { SBI_EXT_COVH_TVM_PROMOTE_PAGE, SBI_EXT_COVH_TVM_DEMOTE_PAGE, SBI_EXT_COVH_TVM_REMOVE_PAGES, + SBI_EXT_COVH_PROMOTE_TO_TVM, }; enum sbi_ext_covi_fid { diff --git a/arch/riscv/kvm/Makefile b/arch/riscv/kvm/Makefile index 31f4dbd97b03..fba7ebd0cd72 100644 --- a/arch/riscv/kvm/Makefile +++ b/arch/riscv/kvm/Makefile @@ -31,4 +31,4 @@ kvm-y += aia.o kvm-y += aia_device.o kvm-y += aia_aplic.o kvm-y += aia_imsic.o -kvm-$(CONFIG_RISCV_COVE_HOST) += cove_sbi.o cove.o vcpu_sbi_covg.o +kvm-$(CONFIG_RISCV_COVE_HOST) += cove_sbi.o cove.o vcpu_sbi_covg.o vcpu_sbi_covh.o diff --git a/arch/riscv/kvm/cove.c b/arch/riscv/kvm/cove.c index a9f3b67bfeae..ed7dc0fbf08b 100644 --- a/arch/riscv/kvm/cove.c +++ b/arch/riscv/kvm/cove.c @@ -633,12 +633,12 @@ void kvm_riscv_cove_vcpu_destroy(struct kvm_vcpu *vcpu) int kvm_riscv_cove_vcpu_init(struct kvm_vcpu *vcpu) { - int rc; - struct kvm *kvm; struct kvm_cove_tvm_vcpu_context *tvcpuc; struct kvm_cove_tvm_context *tvmc; - struct page *vcpus_page; unsigned long vcpus_phys_addr; + struct page *vcpus_page; + struct kvm *kvm; + int rc; if (!vcpu) return -EINVAL; @@ -659,15 +659,20 @@ int kvm_riscv_cove_vcpu_init(struct kvm_vcpu *vcpu) if (!tvcpuc) return -ENOMEM; - vcpus_page = alloc_pages(GFP_KERNEL | __GFP_ZERO, + tvcpuc->vcpu = vcpu; + tvcpuc->vcpu_state.npages = tinfo.tvcpu_pages_needed; + vcpu->arch.tc = tvcpuc; + + if (!kvm_riscv_cove_capability(KVM_COVE_TSM_CAP_MEMORY_ALLOCATION)) { + return 0; + } + + vcpus_page = alloc_pages(GFP_KERNEL | __GFP_ZERO, get_order_num_pages(tinfo.tvcpu_pages_needed)); if (!vcpus_page) { rc = -ENOMEM; goto alloc_page_failed; } - - tvcpuc->vcpu = vcpu; - tvcpuc->vcpu_state.npages = tinfo.tvcpu_pages_needed; tvcpuc->vcpu_state.page = vcpus_page; vcpus_phys_addr = page_to_phys(vcpus_page); @@ -679,8 +684,6 @@ int kvm_riscv_cove_vcpu_init(struct kvm_vcpu *vcpu) if (rc) goto vcpu_create_failed; - vcpu->arch.tc = tvcpuc; - return 0; vcpu_create_failed: @@ -691,6 +694,7 @@ int kvm_riscv_cove_vcpu_init(struct kvm_vcpu *vcpu) __free_pages(vcpus_page, get_order_num_pages(tinfo.tvcpu_pages_needed)); alloc_page_failed: + vcpu->arch.tc = NULL; kfree(tvcpuc); return rc; } @@ -882,7 +886,7 @@ void kvm_riscv_cove_vm_destroy(struct kvm *kvm) kvm_err("Memory reclaim failed with rc %d\n", rc); } -int kvm_riscv_cove_vm_init(struct kvm *kvm) +int kvm_riscv_cove_vm_multi_step_init(struct kvm *kvm) { struct kvm_cove_tvm_context *tvmc; struct page *tvms_page, *pgt_page; @@ -890,6 +894,10 @@ int kvm_riscv_cove_vm_init(struct kvm *kvm) unsigned long gstage_pgd_size = kvm_riscv_gstage_pgd_size(); int rc = 0; + // Multi-step TVM creation requires TSM that supports dynamic page conversion + if (!kvm_riscv_cove_capability(KVM_COVE_TSM_CAP_MEMORY_ALLOCATION)) + return -EOPNOTSUPP; + tvmc = kzalloc(sizeof(*tvmc), GFP_KERNEL); if (!tvmc) return -ENOMEM; @@ -985,6 +993,65 @@ int kvm_riscv_cove_vm_init(struct kvm *kvm) return rc; } +int kvm_riscv_cove_vm_single_step_init(struct kvm_vcpu *vcpu, unsigned long fdt_address, + unsigned long tap_addr) +{ + struct kvm_cpu_context *cp = &vcpu->arch.guest_context; + unsigned long tvm_gid, target_vcpuid; + struct kvm_cove_tvm_context *tvmc; + struct kvm_vcpu *target_vcpu; + struct kvm *kvm = vcpu->kvm; + void *nshmem = nacl_shmem(); + int rc = 0, gpr_id, offset; + + if (!kvm_riscv_cove_capability(KVM_COVE_TSM_CAP_PROMOTE_TVM)) + return -EOPNOTSUPP; + + tvmc = kzalloc(sizeof(*tvmc), GFP_KERNEL); + if (!tvmc) + return -ENOMEM; + + for (gpr_id = 1; gpr_id < 32; gpr_id++) { + offset = KVM_ARCH_GUEST_ZERO + gpr_id * sizeof(unsigned long); + nacl_shmem_gpr_write_cove(nshmem, offset, + ((unsigned long *)cp)[gpr_id]); + } + kvm_arch_vcpu_load(vcpu, smp_processor_id()); + rc = sbi_covh_tsm_promote_to_tvm(fdt_address, tap_addr, cp->sepc, &tvm_gid); + if (rc) + goto done; + + INIT_LIST_HEAD(&tvmc->measured_pages); + INIT_LIST_HEAD(&tvmc->zero_pages); + INIT_LIST_HEAD(&tvmc->shared_pages); + INIT_LIST_HEAD(&tvmc->reclaim_pending_pages); + + tvmc->tvm_guest_id = tvm_gid; + tvmc->kvm = kvm; + kvm->arch.tvmc = tvmc; + + kvm_for_each_vcpu(target_vcpuid, target_vcpu, kvm) { + rc = kvm_riscv_cove_vcpu_init(target_vcpu); + if (rc) + goto vcpus_allocated; + + target_vcpu->requests = 0; + } + + tvmc->finalized_done = true; + kvm_info("Guest VM creation successful with guest id %lx\n", tvm_gid); + return 0; + +vcpus_allocated: + kvm_for_each_vcpu(target_vcpuid, target_vcpu, kvm) + if (target_vcpu->arch.tc) + kfree(target_vcpu->arch.tc); + +done: + kfree(tvmc); + return rc; +} + int kvm_riscv_cove_init(void) { int rc; diff --git a/arch/riscv/kvm/cove_sbi.c b/arch/riscv/kvm/cove_sbi.c index 4759b4920226..2325ee0f2a15 100644 --- a/arch/riscv/kvm/cove_sbi.c +++ b/arch/riscv/kvm/cove_sbi.c @@ -488,3 +488,23 @@ int sbi_covh_tvm_remove_pages(unsigned long tvmid, return 0; } + +int sbi_covh_tsm_promote_to_tvm(unsigned long fdt_address, + unsigned long tap_addr, + unsigned long sepc, + unsigned long *tvmid) +{ + struct sbiret ret; + int rc = 0; + + ret = sbi_ecall(SBI_EXT_COVH, SBI_EXT_COVH_PROMOTE_TO_TVM, fdt_address, + tap_addr, sepc, 0, 0, 0); + if (ret.error) { + rc = sbi_err_map_linux_errno(ret.error); + goto done; + } + + *tvmid = ret.value; +done: + return rc; +} diff --git a/arch/riscv/kvm/main.c b/arch/riscv/kvm/main.c index 9a9625f9c7a9..bb5562ecc97c 100644 --- a/arch/riscv/kvm/main.c +++ b/arch/riscv/kvm/main.c @@ -32,8 +32,8 @@ int kvm_arch_hardware_enable(void) /* * We just need to invoke aia enable for CoVE if host is in VS mode and TSM - * supports AIA (COVI extension). However, if the host is running in HS mode, - * we need to initialize other CSRs as well for legacy VMs. + * supports AIA (COVI extension). However, if the host is running in HS + * mode, we need to initialize other CSRs as well for legacy VMs. */ if (unlikely(kvm_riscv_cove_enabled()) && kvm_riscv_cove_capability(KVM_COVE_TSM_CAP_AIA)) goto enable_aia; diff --git a/arch/riscv/kvm/vcpu_sbi.c b/arch/riscv/kvm/vcpu_sbi.c index 8bc7d7398349..9399cf5a3062 100644 --- a/arch/riscv/kvm/vcpu_sbi.c +++ b/arch/riscv/kvm/vcpu_sbi.c @@ -40,6 +40,11 @@ static const struct kvm_vcpu_sbi_extension vcpu_sbi_ext_covg = { .extid_end = -1UL, .handler = NULL, }; +static const struct kvm_vcpu_sbi_extension vcpu_sbi_ext_covh = { + .extid_start = -1UL, + .extid_end = -1UL, + .handler = NULL, +}; #endif struct kvm_riscv_sbi_extension_entry { @@ -96,6 +101,10 @@ static const struct kvm_riscv_sbi_extension_entry sbi_ext[] = { .dis_idx = KVM_RISCV_SBI_EXT_COVG, .ext_ptr = &vcpu_sbi_ext_covg, }, + { + .dis_idx = KVM_RISCV_SBI_EXT_COVH, + .ext_ptr = &vcpu_sbi_ext_covh, + }, }; void kvm_riscv_vcpu_sbi_forward(struct kvm_vcpu *vcpu, struct kvm_run *run) diff --git a/arch/riscv/kvm/vcpu_sbi_covh.c b/arch/riscv/kvm/vcpu_sbi_covh.c new file mode 100644 index 000000000000..ef3e255732b4 --- /dev/null +++ b/arch/riscv/kvm/vcpu_sbi_covh.c @@ -0,0 +1,84 @@ +// SPDX-License-Identifier: GPL-2.0 +/* + * Copyright (c) 2024 IBM. + * + * Authors: + * Wojciech Ozga + */ + +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include + +static int preload_pages(struct kvm_vcpu *vcpu) { + unsigned long hva, fault_addr, page; + struct kvm_memory_slot *memslot; + bool writable; + int bkt; + + kvm_for_each_memslot(memslot, bkt, kvm_memslots(vcpu->kvm)) { + for (page = 0; page < memslot->npages; page++) { + fault_addr = gfn_to_gpa(memslot->base_gfn) + + page * PAGE_SIZE; + hva = gfn_to_hva_memslot_prot(memslot, + gpa_to_gfn(fault_addr), + &writable); + if (!kvm_is_error_hva(hva)) + kvm_riscv_gstage_map(vcpu, memslot, fault_addr, + hva, NULL); + } + } + + return 0; +} + +static int kvm_riscv_cove_promote_to_tvm(struct kvm_vcpu *vcpu, + unsigned long fdt_address, + unsigned long tap_addr) { + int rc; + + preload_pages(vcpu); + rc = kvm_riscv_cove_vm_single_step_init(vcpu, fdt_address, tap_addr); + if (rc) + goto done; + + vcpu->kvm->arch.vm_type = KVM_VM_TYPE_RISCV_COVE; +done: + return rc; +} + +static int kvm_sbi_ext_covh_handler(struct kvm_vcpu *vcpu, struct kvm_run *run, + struct kvm_vcpu_sbi_return *retdata) +{ + struct kvm_cpu_context *cp = &vcpu->arch.guest_context; + unsigned long funcid = cp->a6; + int ret; + + switch (funcid) { + case SBI_EXT_COVH_PROMOTE_TO_TVM: + ret = kvm_riscv_cove_promote_to_tvm(vcpu, cp->a0, cp->a1); + return 0; + + default: + kvm_err("%s: Unsupported guest SBI %ld.\n", __func__, funcid); + retdata->err_val = SBI_ERR_NOT_SUPPORTED; + return -EOPNOTSUPP; + } +} + +const struct kvm_vcpu_sbi_extension vcpu_sbi_ext_covh = { + .extid_start = SBI_EXT_COVH, + .extid_end = SBI_EXT_COVH, + .handler = kvm_sbi_ext_covh_handler, +}; diff --git a/arch/riscv/kvm/vm.c b/arch/riscv/kvm/vm.c index 8a1460dba76c..6df73ea8e16f 100644 --- a/arch/riscv/kvm/vm.c +++ b/arch/riscv/kvm/vm.c @@ -44,15 +44,15 @@ int kvm_arch_init_vm(struct kvm *kvm, unsigned long type) if (unlikely(type == KVM_VM_TYPE_RISCV_COVE)) { if (!kvm_riscv_cove_enabled()) { - kvm_err("Unable to init CoVE VM because cove is not enabled\n"); + kvm_err("Unable to init CoVE VM because CoVE extension is not enabled\n"); return -EPERM; } - r = kvm_riscv_cove_vm_init(kvm); + r = kvm_riscv_cove_vm_multi_step_init(kvm); if (r) return r; kvm->arch.vm_type = type; - kvm_info("Trusted VM instance init successful\n"); + kvm_info("CoVE VM instance init successful\n"); } kvm_riscv_aia_init_vm(kvm);