KVM: x86: Fix wall clock writes in Xen shared_info not to mark page dirty

author David Woodhouse <dwmw@amazon.co.uk>

Fri, 10 Dec 2021 16:36:24 +0000 (16:36 +0000)

committer Paolo Bonzini <pbonzini@redhat.com>

Fri, 7 Jan 2022 15:44:45 +0000 (10:44 -0500)
author David Woodhouse <dwmw@amazon.co.uk>
Fri, 10 Dec 2021 16:36:24 +0000 (16:36 +0000)
committer Paolo Bonzini <pbonzini@redhat.com>
Fri, 7 Jan 2022 15:44:45 +0000 (10:44 -0500)
diff --git a/arch/x86/kvm/x86.c b/arch/x86/kvm/x86.c

index 3050601..6492329 100644 (file)
--- a/arch/x86/kvm/x86.c
+++ b/arch/x86/kvm/x86.c
@@ -2135,7 +2135,7 @@ static s64 get_kvmclock_base_ns(void)
  }
  #endif
  
-void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs)
+static void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs)
  {
         int version;
         int r;
diff --git a/arch/x86/kvm/x86.h b/arch/x86/kvm/x86.h

index 4abcd8d..da7031e 100644 (file)
--- a/arch/x86/kvm/x86.h
+++ b/arch/x86/kvm/x86.h
@@ -301,7 +301,6 @@ static inline bool kvm_vcpu_latch_init(struct kvm_vcpu *vcpu)
         return is_smm(vcpu) || static_call(kvm_x86_apic_init_signal_blocked)(vcpu);
  }
  
-void kvm_write_wall_clock(struct kvm *kvm, gpa_t wall_clock, int sec_hi_ofs);
  void kvm_inject_realmode_interrupt(struct kvm_vcpu *vcpu, int irq, int inc_eip);
  
  u64 get_kvmclock_ns(struct kvm *kvm);
diff --git a/arch/x86/kvm/xen.c b/arch/x86/kvm/xen.c

index ceddabd..0e3f7d6 100644 (file)
--- a/arch/x86/kvm/xen.c
+++ b/arch/x86/kvm/xen.c
@@ -25,8 +25,11 @@ DEFINE_STATIC_KEY_DEFERRED_FALSE(kvm_xen_enabled, HZ);
  static int kvm_xen_shared_info_init(struct kvm *kvm, gfn_t gfn)
  {
         struct gfn_to_pfn_cache *gpc = &kvm->arch.xen.shinfo_cache;
+       struct pvclock_wall_clock *wc;
         gpa_t gpa = gfn_to_gpa(gfn);
-       int wc_ofs, sec_hi_ofs;
+       u32 *wc_sec_hi;
+       u32 wc_version;
+       u64 wall_nsec;
         int ret = 0;
         int idx = srcu_read_lock(&kvm->srcu);
  
@@ -35,32 +38,63 @@ static int kvm_xen_shared_info_init(struct kvm *kvm, gfn_t gfn)
                 goto out;
         }
  
-       ret = kvm_gfn_to_pfn_cache_init(kvm, gpc, NULL, false, true, gpa,
-                                       PAGE_SIZE, false);
-       if (ret)
-               goto out;
+       do {
+               ret = kvm_gfn_to_pfn_cache_init(kvm, gpc, NULL, false, true,
+                                               gpa, PAGE_SIZE, false);
+               if (ret)
+                       goto out;
+
+               /*
+                * This code mirrors kvm_write_wall_clock() except that it writes
+                * directly through the pfn cache and doesn't mark the page dirty.
+                */
+               wall_nsec = ktime_get_real_ns() - get_kvmclock_ns(kvm);
+
+               /* It could be invalid again already, so we need to check */
+               read_lock_irq(&gpc->lock);
+
+               if (gpc->valid)
+                       break;
+
+               read_unlock_irq(&gpc->lock);
+       } while (1);
  
         /* Paranoia checks on the 32-bit struct layout */
         BUILD_BUG_ON(offsetof(struct compat_shared_info, wc) != 0x900);
         BUILD_BUG_ON(offsetof(struct compat_shared_info, arch.wc_sec_hi) != 0x924);
         BUILD_BUG_ON(offsetof(struct pvclock_vcpu_time_info, version) != 0);
  
-       /* 32-bit location by default */
-       wc_ofs = offsetof(struct compat_shared_info, wc);
-       sec_hi_ofs = offsetof(struct compat_shared_info, arch.wc_sec_hi);
-
  #ifdef CONFIG_X86_64
         /* Paranoia checks on the 64-bit struct layout */
         BUILD_BUG_ON(offsetof(struct shared_info, wc) != 0xc00);
         BUILD_BUG_ON(offsetof(struct shared_info, wc_sec_hi) != 0xc0c);
  
-       if (kvm->arch.xen.long_mode) {
-               wc_ofs = offsetof(struct shared_info, wc);
-               sec_hi_ofs = offsetof(struct shared_info, wc_sec_hi);
-       }
+       if (IS_ENABLED(CONFIG_64BIT) && kvm->arch.xen.long_mode) {
+               struct shared_info *shinfo = gpc->khva;
+
+               wc_sec_hi = &shinfo->wc_sec_hi;
+               wc = &shinfo->wc;
+       } else
  #endif
+       {
+               struct compat_shared_info *shinfo = gpc->khva;
+
+               wc_sec_hi = &shinfo->arch.wc_sec_hi;
+               wc = &shinfo->wc;
+       }
+
+       /* Increment and ensure an odd value */
+       wc_version = wc->version = (wc->version + 1) | 1;
+       smp_wmb();
+
+       wc->nsec = do_div(wall_nsec,  1000000000);
+       wc->sec = (u32)wall_nsec;
+       *wc_sec_hi = wall_nsec >> 32;
+       smp_wmb();
+
+       wc->version = wc_version + 1;
+       read_unlock_irq(&gpc->lock);
  
-       kvm_write_wall_clock(kvm, gpa + wc_ofs, sec_hi_ofs - wc_ofs);
         kvm_make_all_cpus_request(kvm, KVM_REQ_MASTERCLOCK_UPDATE);
  
  out:
author	David Woodhouse <dwmw@amazon.co.uk>
	Fri, 10 Dec 2021 16:36:24 +0000 (16:36 +0000)
committer	Paolo Bonzini <pbonzini@redhat.com>
	Fri, 7 Jan 2022 15:44:45 +0000 (10:44 -0500)
arch/x86/kvm/x86.c		patch \| blob \| history
arch/x86/kvm/x86.h		patch \| blob \| history
arch/x86/kvm/xen.c		patch \| blob \| history