[RFC PATCH 06/13] KVM: TDX: Pass size to reclaim_page()

From: isaku . yamahata
Date: Sun Aug 07 2022 - 18:32:23 EST


From: Xiaoyao Li <xiaoyao.li@xxxxxxxxx>

A 2MB large page can be tdh_mem_page_aug()'ed to TD directly. In this case,
it needs to reclaim and clear the page as 2MB size.

Signed-off-by: Xiaoyao Li <xiaoyao.li@xxxxxxxxx>
Signed-off-by: Isaku Yamahata <isaku.yamahata@xxxxxxxxx>
---
arch/x86/kvm/vmx/tdx.c | 28 ++++++++++++++++++----------
1 file changed, 18 insertions(+), 10 deletions(-)

diff --git a/arch/x86/kvm/vmx/tdx.c b/arch/x86/kvm/vmx/tdx.c
index b7a75c0adbfa..0b9f9075e1ea 100644
--- a/arch/x86/kvm/vmx/tdx.c
+++ b/arch/x86/kvm/vmx/tdx.c
@@ -189,11 +189,13 @@ void tdx_hardware_disable(void)
tdx_disassociate_vp(&tdx->vcpu);
}

-static void tdx_clear_page(unsigned long page)
+static void tdx_clear_page(unsigned long page, int size)
{
const void *zero_page = (const void *) __va(page_to_phys(ZERO_PAGE(0)));
unsigned long i;

+ WARN_ON_ONCE(size % 64);
+
/*
* Zeroing the page is only necessary for systems with MKTME-i:
* when re-assign one page from old keyid to a new keyid, MOVDIR64B is
@@ -203,13 +205,14 @@ static void tdx_clear_page(unsigned long page)
if (!static_cpu_has(X86_FEATURE_MOVDIR64B))
return;

- for (i = 0; i < 4096; i += 64)
+ for (i = 0; i < size; i += 64)
/* MOVDIR64B [rdx], es:rdi */
asm (".byte 0x66, 0x0f, 0x38, 0xf8, 0x3a"
: : "d" (zero_page), "D" (page + i) : "memory");
}

-static int tdx_reclaim_page(unsigned long va, hpa_t pa, bool do_wb, u16 hkid)
+static int tdx_reclaim_page(unsigned long va, hpa_t pa, enum pg_level level,
+ bool do_wb, u16 hkid)
{
struct tdx_module_output out;
u64 err;
@@ -219,8 +222,11 @@ static int tdx_reclaim_page(unsigned long va, hpa_t pa, bool do_wb, u16 hkid)
pr_tdx_error(TDH_PHYMEM_PAGE_RECLAIM, err, &out);
return -EIO;
}
+ /* out.r8 == tdx sept page level */
+ WARN_ON_ONCE(out.r8 != pg_level_to_tdx_sept_level(level));

- if (do_wb) {
+ /* only TDR page gets into this path */
+ if (do_wb && level == PG_LEVEL_4K) {
err = tdh_phymem_page_wbinvd(set_hkid_to_hpa(pa, hkid));
if (WARN_ON_ONCE(err)) {
pr_tdx_error(TDH_PHYMEM_PAGE_WBINVD, err, NULL);
@@ -228,7 +234,7 @@ static int tdx_reclaim_page(unsigned long va, hpa_t pa, bool do_wb, u16 hkid)
}
}

- tdx_clear_page(va);
+ tdx_clear_page(va, KVM_HPAGE_SIZE(level));
return 0;
}

@@ -257,7 +263,7 @@ static void tdx_reclaim_td_page(struct tdx_td_page *page)
* was already flushed by TDH.PHYMEM.CACHE.WB before here, So
* cache doesn't need to be flushed again.
*/
- if (tdx_reclaim_page(page->va, page->pa, false, 0))
+ if (tdx_reclaim_page(page->va, page->pa, PG_LEVEL_4K, false, 0))
return;

page->added = false;
@@ -404,8 +410,8 @@ void tdx_vm_free(struct kvm *kvm)
* TDX global HKID is needed.
*/
if (kvm_tdx->tdr.added &&
- tdx_reclaim_page(kvm_tdx->tdr.va, kvm_tdx->tdr.pa, true,
- tdx_global_keyid))
+ tdx_reclaim_page(kvm_tdx->tdr.va, kvm_tdx->tdr.pa, PG_LEVEL_4K,
+ true, tdx_global_keyid))
return;

free_page(kvm_tdx->tdr.va);
@@ -1548,7 +1554,8 @@ static void tdx_sept_drop_private_spte(
* The HKID assigned to this TD was already freed and cache
* was already flushed. We don't have to flush again.
*/
- err = tdx_reclaim_page((unsigned long)__va(hpa), hpa, false, 0);
+ err = tdx_reclaim_page((unsigned long)__va(hpa), hpa, level,
+ false, 0);

unlock:
spin_unlock(&kvm_tdx->seamcall_lock);
@@ -1667,7 +1674,8 @@ static int tdx_sept_free_private_sp(struct kvm *kvm, gfn_t gfn, enum pg_level le
* already flushed. We don't have to flush again.
*/
spin_lock(&kvm_tdx->seamcall_lock);
- ret = tdx_reclaim_page((unsigned long)sept_page, __pa(sept_page), false, 0);
+ ret = tdx_reclaim_page((unsigned long)sept_page, __pa(sept_page),
+ PG_LEVEL_4K, false, 0);
spin_unlock(&kvm_tdx->seamcall_lock);

return ret;
--
2.25.1