KVM: PPC: Book3S HV: MMU notifier callbacks for radix guests
authorPaul Mackerras <paulus@ozlabs.org>
Mon, 30 Jan 2017 10:21:47 +0000 (21:21 +1100)
committerMichael Ellerman <mpe@ellerman.id.au>
Tue, 31 Jan 2017 08:11:49 +0000 (19:11 +1100)
This adapts our implementations of the MMU notifier callbacks
(unmap_hva, unmap_hva_range, age_hva, test_age_hva, set_spte_hva)
to call radix functions when the guest is using radix.  These
implementations are much simpler than for HPT guests because we
have only one PTE to deal with, so we don't need to traverse
rmap chains.

Signed-off-by: Paul Mackerras <paulus@ozlabs.org>
Signed-off-by: Michael Ellerman <mpe@ellerman.id.au>
arch/powerpc/include/asm/kvm_book3s.h
arch/powerpc/kvm/book3s_64_mmu_hv.c
arch/powerpc/kvm/book3s_64_mmu_radix.c

index ff5cd5c5ce8d9e32f2fe303d844828cb89da53ab..952cc4b954a1b9e5eed0bbd3a7b205eb4e0312a1 100644 (file)
@@ -192,6 +192,12 @@ extern int kvmppc_mmu_radix_xlate(struct kvm_vcpu *vcpu, gva_t eaddr,
 extern void kvmppc_free_radix(struct kvm *kvm);
 extern int kvmppc_radix_init(void);
 extern void kvmppc_radix_exit(void);
+extern int kvm_unmap_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                       unsigned long gfn);
+extern int kvm_age_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                       unsigned long gfn);
+extern int kvm_test_age_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                       unsigned long gfn);
 
 /* XXX remove this export when load_last_inst() is generic */
 extern int kvmppc_ld(struct kvm_vcpu *vcpu, ulong *eaddr, int size, void *ptr, bool data);
index 57690c22716d5bd15c334f764e62c0fe9d1104aa..088c82bb7ba4ba09b5fd5cc787538064b578195c 100644 (file)
@@ -701,12 +701,13 @@ static void kvmppc_rmap_reset(struct kvm *kvm)
        srcu_read_unlock(&kvm->srcu, srcu_idx);
 }
 
+typedef int (*hva_handler_fn)(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                             unsigned long gfn);
+
 static int kvm_handle_hva_range(struct kvm *kvm,
                                unsigned long start,
                                unsigned long end,
-                               int (*handler)(struct kvm *kvm,
-                                              unsigned long *rmapp,
-                                              unsigned long gfn))
+                               hva_handler_fn handler)
 {
        int ret;
        int retval = 0;
@@ -731,9 +732,7 @@ static int kvm_handle_hva_range(struct kvm *kvm,
                gfn_end = hva_to_gfn_memslot(hva_end + PAGE_SIZE - 1, memslot);
 
                for (; gfn < gfn_end; ++gfn) {
-                       gfn_t gfn_offset = gfn - memslot->base_gfn;
-
-                       ret = handler(kvm, &memslot->arch.rmap[gfn_offset], gfn);
+                       ret = handler(kvm, memslot, gfn);
                        retval |= ret;
                }
        }
@@ -742,20 +741,21 @@ static int kvm_handle_hva_range(struct kvm *kvm,
 }
 
 static int kvm_handle_hva(struct kvm *kvm, unsigned long hva,
-                         int (*handler)(struct kvm *kvm, unsigned long *rmapp,
-                                        unsigned long gfn))
+                         hva_handler_fn handler)
 {
        return kvm_handle_hva_range(kvm, hva, hva + 1, handler);
 }
 
-static int kvm_unmap_rmapp(struct kvm *kvm, unsigned long *rmapp,
+static int kvm_unmap_rmapp(struct kvm *kvm, struct kvm_memory_slot *memslot,
                           unsigned long gfn)
 {
        struct revmap_entry *rev = kvm->arch.revmap;
        unsigned long h, i, j;
        __be64 *hptep;
        unsigned long ptel, psize, rcbits;
+       unsigned long *rmapp;
 
+       rmapp = &memslot->arch.rmap[gfn - memslot->base_gfn];
        for (;;) {
                lock_rmap(rmapp);
                if (!(*rmapp & KVMPPC_RMAP_PRESENT)) {
@@ -816,26 +816,36 @@ static int kvm_unmap_rmapp(struct kvm *kvm, unsigned long *rmapp,
 
 int kvm_unmap_hva_hv(struct kvm *kvm, unsigned long hva)
 {
-       kvm_handle_hva(kvm, hva, kvm_unmap_rmapp);
+       hva_handler_fn handler;
+
+       handler = kvm_is_radix(kvm) ? kvm_unmap_radix : kvm_unmap_rmapp;
+       kvm_handle_hva(kvm, hva, handler);
        return 0;
 }
 
 int kvm_unmap_hva_range_hv(struct kvm *kvm, unsigned long start, unsigned long end)
 {
-       kvm_handle_hva_range(kvm, start, end, kvm_unmap_rmapp);
+       hva_handler_fn handler;
+
+       handler = kvm_is_radix(kvm) ? kvm_unmap_radix : kvm_unmap_rmapp;
+       kvm_handle_hva_range(kvm, start, end, handler);
        return 0;
 }
 
 void kvmppc_core_flush_memslot_hv(struct kvm *kvm,
                                  struct kvm_memory_slot *memslot)
 {
-       unsigned long *rmapp;
        unsigned long gfn;
        unsigned long n;
+       unsigned long *rmapp;
 
-       rmapp = memslot->arch.rmap;
        gfn = memslot->base_gfn;
-       for (n = memslot->npages; n; --n) {
+       rmapp = memslot->arch.rmap;
+       for (n = memslot->npages; n; --n, ++gfn) {
+               if (kvm_is_radix(kvm)) {
+                       kvm_unmap_radix(kvm, memslot, gfn);
+                       continue;
+               }
                /*
                 * Testing the present bit without locking is OK because
                 * the memslot has been marked invalid already, and hence
@@ -843,20 +853,21 @@ void kvmppc_core_flush_memslot_hv(struct kvm *kvm,
                 * thus the present bit can't go from 0 to 1.
                 */
                if (*rmapp & KVMPPC_RMAP_PRESENT)
-                       kvm_unmap_rmapp(kvm, rmapp, gfn);
+                       kvm_unmap_rmapp(kvm, memslot, gfn);
                ++rmapp;
-               ++gfn;
        }
 }
 
-static int kvm_age_rmapp(struct kvm *kvm, unsigned long *rmapp,
+static int kvm_age_rmapp(struct kvm *kvm, struct kvm_memory_slot *memslot,
                         unsigned long gfn)
 {
        struct revmap_entry *rev = kvm->arch.revmap;
        unsigned long head, i, j;
        __be64 *hptep;
        int ret = 0;
+       unsigned long *rmapp;
 
+       rmapp = &memslot->arch.rmap[gfn - memslot->base_gfn];
  retry:
        lock_rmap(rmapp);
        if (*rmapp & KVMPPC_RMAP_REFERENCED) {
@@ -904,17 +915,22 @@ static int kvm_age_rmapp(struct kvm *kvm, unsigned long *rmapp,
 
 int kvm_age_hva_hv(struct kvm *kvm, unsigned long start, unsigned long end)
 {
-       return kvm_handle_hva_range(kvm, start, end, kvm_age_rmapp);
+       hva_handler_fn handler;
+
+       handler = kvm_is_radix(kvm) ? kvm_age_radix : kvm_age_rmapp;
+       return kvm_handle_hva_range(kvm, start, end, handler);
 }
 
-static int kvm_test_age_rmapp(struct kvm *kvm, unsigned long *rmapp,
+static int kvm_test_age_rmapp(struct kvm *kvm, struct kvm_memory_slot *memslot,
                              unsigned long gfn)
 {
        struct revmap_entry *rev = kvm->arch.revmap;
        unsigned long head, i, j;
        unsigned long *hp;
        int ret = 1;
+       unsigned long *rmapp;
 
+       rmapp = &memslot->arch.rmap[gfn - memslot->base_gfn];
        if (*rmapp & KVMPPC_RMAP_REFERENCED)
                return 1;
 
@@ -940,12 +956,18 @@ static int kvm_test_age_rmapp(struct kvm *kvm, unsigned long *rmapp,
 
 int kvm_test_age_hva_hv(struct kvm *kvm, unsigned long hva)
 {
-       return kvm_handle_hva(kvm, hva, kvm_test_age_rmapp);
+       hva_handler_fn handler;
+
+       handler = kvm_is_radix(kvm) ? kvm_test_age_radix : kvm_test_age_rmapp;
+       return kvm_handle_hva(kvm, hva, handler);
 }
 
 void kvm_set_spte_hva_hv(struct kvm *kvm, unsigned long hva, pte_t pte)
 {
-       kvm_handle_hva(kvm, hva, kvm_unmap_rmapp);
+       hva_handler_fn handler;
+
+       handler = kvm_is_radix(kvm) ? kvm_unmap_radix : kvm_unmap_rmapp;
+       kvm_handle_hva(kvm, hva, handler);
 }
 
 static int vcpus_running(struct kvm *kvm)
index 865ea9bca36416e1fb4b273e98fcd9661ddaf286..69cabadc121a53ce26da2a51284ab3df1a29d1bb 100644 (file)
@@ -463,6 +463,60 @@ int kvmppc_book3s_radix_page_fault(struct kvm_run *run, struct kvm_vcpu *vcpu,
        return ret;
 }
 
+/* Called with kvm->lock held */
+int kvm_unmap_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                   unsigned long gfn)
+{
+       pte_t *ptep;
+       unsigned long gpa = gfn << PAGE_SHIFT;
+       unsigned int shift;
+
+       ptep = __find_linux_pte_or_hugepte(kvm->arch.pgtable, gpa,
+                                          NULL, &shift);
+       if (ptep && pte_present(*ptep)) {
+               kvmppc_radix_update_pte(kvm, ptep, _PAGE_PRESENT, 0,
+                                       gpa, shift);
+               kvmppc_radix_tlbie_page(kvm, gpa, shift);
+       }
+       return 0;                               
+}
+
+/* Called with kvm->lock held */
+int kvm_age_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                 unsigned long gfn)
+{
+       pte_t *ptep;
+       unsigned long gpa = gfn << PAGE_SHIFT;
+       unsigned int shift;
+       int ref = 0;
+
+       ptep = __find_linux_pte_or_hugepte(kvm->arch.pgtable, gpa,
+                                          NULL, &shift);
+       if (ptep && pte_present(*ptep) && pte_young(*ptep)) {
+               kvmppc_radix_update_pte(kvm, ptep, _PAGE_ACCESSED, 0,
+                                       gpa, shift);
+               /* XXX need to flush tlb here? */
+               ref = 1;
+       }
+       return ref;
+}
+
+/* Called with kvm->lock held */
+int kvm_test_age_radix(struct kvm *kvm, struct kvm_memory_slot *memslot,
+                      unsigned long gfn)
+{
+       pte_t *ptep;
+       unsigned long gpa = gfn << PAGE_SHIFT;
+       unsigned int shift;
+       int ref = 0;
+
+       ptep = __find_linux_pte_or_hugepte(kvm->arch.pgtable, gpa,
+                                          NULL, &shift);
+       if (ptep && pte_present(*ptep) && pte_young(*ptep))
+               ref = 1;
+       return ref;
+}
+
 void kvmppc_free_radix(struct kvm *kvm)
 {
        unsigned long ig, iu, im;