[PATCH Part2 RFC v3 35/37] KVM: SVM: Provide support for SNP_GUEST_REQUEST NAE event

From: Brijesh Singh
Date: Wed Jun 02 2021 - 10:16:50 EST


Version 2 of the GHCB specification added support for the SNP Guest Request
Message NAE event. The event allows an SEV-SNP guest to make requests to the
SEV-SNP firmware through the hypervisor using the SNP_GUEST_REQUEST API
defined in the SEV-SNP firmware specification.

The SNP_GUEST_REQUEST requires two unique pages, one page for the request
and one page for the response. The response page needs to be in the firmware
state. The GHCB specification says that both pages need to be in the
hypervisor state, but before executing the SEV-SNP command the response page
needs to be in the firmware state.

In order to minimize the page state transitions during command handling,
pre-allocate a firmware page on guest creation. Use the pre-allocated
firmware page to complete the command execution and copy the result into the
guest response page.

Ratelimit the handling of the SNP_GUEST_REQUEST NAE event to avoid the
possibility of a guest mounting a denial-of-service attack against the SNP
firmware.

Now that KVM supports all the VMGEXIT NAEs required for the base SEV-SNP
feature, set the hypervisor feature to advertise it.

Signed-off-by: Brijesh Singh <brijesh.singh@xxxxxxx>
---
arch/x86/kvm/svm/sev.c | 101 +++++++++++++++++++++++++++++++++++++++--
arch/x86/kvm/svm/svm.h | 5 +-
2 files changed, 102 insertions(+), 4 deletions(-)

diff --git a/arch/x86/kvm/svm/sev.c b/arch/x86/kvm/svm/sev.c
index 5b033d4c3b92..5718e2e07788 100644
--- a/arch/x86/kvm/svm/sev.c
+++ b/arch/x86/kvm/svm/sev.c
@@ -18,6 +18,7 @@
#include <linux/processor.h>
#include <linux/trace_events.h>
#include <linux/sev.h>
+#include <linux/kvm_host.h>
#include <asm/fpu/internal.h>

#include <asm/trapnr.h>
@@ -1515,6 +1516,7 @@ static int sev_receive_finish(struct kvm *kvm, struct kvm_sev_cmd *argp)

static void *snp_context_create(struct kvm *kvm, struct kvm_sev_cmd *argp)
{
+ struct kvm_sev_info *sev = &to_kvm_svm(kvm)->sev_info;
struct sev_data_snp_gctx_create data = {};
void *context;
int rc;
@@ -1524,14 +1526,24 @@ static void *snp_context_create(struct kvm *kvm, struct kvm_sev_cmd *argp)
if (!context)
return NULL;

- data.gctx_paddr = __psp_pa(context);
- rc = __sev_issue_cmd(argp->sev_fd, SEV_CMD_SNP_GCTX_CREATE, &data, &argp->error);
- if (rc) {
+ /* Allocate a firmware buffer used during the guest command handling. */
+ sev->snp_resp_page = snp_alloc_firmware_page(GFP_KERNEL_ACCOUNT);
+ if (!sev->snp_resp_page) {
snp_free_firmware_page(context);
return NULL;
}

+ data.gctx_paddr = __psp_pa(context);
+ rc = __sev_issue_cmd(argp->sev_fd, SEV_CMD_SNP_GCTX_CREATE, &data, &argp->error);
+ if (rc)
+ goto e_free;
+
return context;
+
+e_free:
+ snp_free_firmware_page(context);
+ snp_free_firmware_page(sev->snp_resp_page);
+ return NULL;
}

static int snp_bind_asid(struct kvm *kvm, int *error)
@@ -1599,6 +1611,9 @@ static int snp_launch_start(struct kvm *kvm, struct kvm_sev_cmd *argp)
if (rc)
goto e_free_context;

+ /* Used for rate limiting SNP guest message request, use the default settings */
+ ratelimit_default_init(&sev->snp_guest_msg_rs);
+
return 0;

e_free_context:
@@ -2196,6 +2211,9 @@ static int snp_decommission_context(struct kvm *kvm)
snp_free_firmware_page(sev->snp_context);
sev->snp_context = NULL;

+ /* Free the response page. */
+ snp_free_firmware_page(sev->snp_resp_page);
+
return 0;
}

@@ -2641,6 +2659,7 @@ static int sev_es_validate_vmgexit(struct vcpu_svm *svm)
case SVM_VMGEXIT_UNSUPPORTED_EVENT:
case SVM_VMGEXIT_HV_FT:
case SVM_VMGEXIT_PSC:
+ case SVM_VMGEXIT_GUEST_REQUEST:
break;
default:
goto vmgexit_err;
@@ -3031,6 +3050,76 @@ static unsigned long snp_handle_page_state_change(struct vcpu_svm *svm, struct g
return rc ? map_to_psc_vmgexit_code(rc) : 0;
}

+static void snp_handle_guest_request(struct vcpu_svm *svm, struct ghcb *ghcb,
+ gpa_t req_gpa, gpa_t resp_gpa)
+{
+ struct sev_data_snp_guest_request data = {};
+ struct kvm_vcpu *vcpu = &svm->vcpu;
+ struct kvm *kvm = vcpu->kvm;
+ kvm_pfn_t req_pfn, resp_pfn;
+ struct kvm_sev_info *sev;
+ int rc, err = 0;
+
+ if (!sev_snp_guest(vcpu->kvm)) {
+ rc = -ENODEV;
+ goto e_fail;
+ }
+
+ sev = &to_kvm_svm(kvm)->sev_info;
+
+ if (!__ratelimit(&sev->snp_guest_msg_rs)) {
+ pr_info_ratelimited("svm: too many guest message requests\n");
+ rc = -EAGAIN;
+ goto e_fail;
+ }
+
+ if (!IS_ALIGNED(req_gpa, PAGE_SIZE) || !IS_ALIGNED(resp_gpa, PAGE_SIZE)) {
+ pr_err_ratelimited("svm: guest request (%#llx) or response (%#llx) is not page aligned\n",
+ req_gpa, resp_gpa);
+ rc = -EINVAL;
+ goto e_fail;
+ }
+
+ req_pfn = gfn_to_pfn(kvm, gpa_to_gfn(req_gpa));
+ if (is_error_noslot_pfn(req_pfn)) {
+ pr_err_ratelimited("svm: guest request invalid gpa=%#llx\n", req_gpa);
+ rc = -EINVAL;
+ goto e_fail;
+ }
+
+ resp_pfn = gfn_to_pfn(kvm, gpa_to_gfn(resp_gpa));
+ if (is_error_noslot_pfn(resp_pfn)) {
+ pr_err_ratelimited("svm: guest response invalid gpa=%#llx\n", resp_gpa);
+ rc = -EINVAL;
+ goto e_fail;
+ }
+
+ data.gctx_paddr = __psp_pa(sev->snp_context);
+ data.req_paddr = __sme_set(req_pfn << PAGE_SHIFT);
+ data.res_paddr = __psp_pa(sev->snp_resp_page);
+
+ mutex_lock(&kvm->lock);
+
+ rc = sev_issue_cmd(kvm, SEV_CMD_SNP_GUEST_REQUEST, &data, &err);
+ if (rc) {
+ mutex_unlock(&kvm->lock);
+
+ /* If we have a firmware error code then use it. */
+ if (err)
+ rc = err;
+
+ goto e_fail;
+ }
+
+ /* Copy the response after the firmware returns success. */
+ rc = kvm_write_guest(kvm, resp_gpa, sev->snp_resp_page, PAGE_SIZE);
+
+ mutex_unlock(&kvm->lock);
+
+e_fail:
+ ghcb_set_sw_exit_info_2(ghcb, rc);
+}
+
static int sev_handle_vmgexit_msr_protocol(struct vcpu_svm *svm)
{
struct vmcb_control_area *control = &svm->vmcb->control;
@@ -3284,6 +3373,12 @@ int sev_handle_vmgexit(struct kvm_vcpu *vcpu)
ghcb_set_sw_exit_info_2(ghcb, rc);
break;
}
+ case SVM_VMGEXIT_GUEST_REQUEST: {
+ snp_handle_guest_request(svm, ghcb, control->exit_info_1, control->exit_info_2);
+
+ ret = 1;
+ break;
+ }
case SVM_VMGEXIT_UNSUPPORTED_EVENT:
vcpu_unimpl(vcpu,
"vmgexit: unsupported event - exit_info_1=%#llx, exit_info_2=%#llx\n",
diff --git a/arch/x86/kvm/svm/svm.h b/arch/x86/kvm/svm/svm.h
index ccdaaa4e1fb1..d4efcda3070d 100644
--- a/arch/x86/kvm/svm/svm.h
+++ b/arch/x86/kvm/svm/svm.h
@@ -18,6 +18,7 @@
#include <linux/kvm_types.h>
#include <linux/kvm_host.h>
#include <linux/bits.h>
+#include <linux/ratelimit.h>

#include <asm/svm.h>
#include <asm/sev-common.h>
@@ -68,6 +69,8 @@ struct kvm_sev_info {
struct kvm *enc_context_owner; /* Owner of copied encryption context */
struct misc_cg *misc_cg; /* For misc cgroup accounting */
void *snp_context; /* SNP guest context page */
+ void *snp_resp_page; /* SNP guest response page */
+ struct ratelimit_state snp_guest_msg_rs; /* Rate limit the SNP guest message */
};

struct kvm_svm {
@@ -550,7 +553,7 @@ void svm_vcpu_unblocking(struct kvm_vcpu *vcpu);
#define GHCB_VERSION_MAX 2ULL
#define GHCB_VERSION_MIN 1ULL

-#define GHCB_HV_FT_SUPPORTED 0
+#define GHCB_HV_FT_SUPPORTED GHCB_HV_FT_SNP

extern unsigned int max_sev_asid;

--
2.17.1