KVM: VMX: remove yield_on_hlt
diff --git a/arch/x86/kvm/vmx.c b/arch/x86/kvm/vmx.c
index 579a0b5..d2bd719 100644
--- a/arch/x86/kvm/vmx.c
+++ b/arch/x86/kvm/vmx.c
@@ -18,6 +18,7 @@
 
 #include "irq.h"
 #include "mmu.h"
+#include "cpuid.h"
 
 #include <linux/kvm_host.h>
 #include <linux/module.h>
 MODULE_AUTHOR("Qumranet");
 MODULE_LICENSE("GPL");
 
-static int __read_mostly enable_vpid = 1;
+static bool __read_mostly enable_vpid = 1;
 module_param_named(vpid, enable_vpid, bool, 0444);
 
-static int __read_mostly flexpriority_enabled = 1;
+static bool __read_mostly flexpriority_enabled = 1;
 module_param_named(flexpriority, flexpriority_enabled, bool, S_IRUGO);
 
-static int __read_mostly enable_ept = 1;
+static bool __read_mostly enable_ept = 1;
 module_param_named(ept, enable_ept, bool, S_IRUGO);
 
-static int __read_mostly enable_unrestricted_guest = 1;
+static bool __read_mostly enable_unrestricted_guest = 1;
 module_param_named(unrestricted_guest,
                        enable_unrestricted_guest, bool, S_IRUGO);
 
-static int __read_mostly emulate_invalid_guest_state = 0;
+static bool __read_mostly emulate_invalid_guest_state = 0;
 module_param(emulate_invalid_guest_state, bool, S_IRUGO);
 
-static int __read_mostly vmm_exclusive = 1;
+static bool __read_mostly vmm_exclusive = 1;
 module_param(vmm_exclusive, bool, S_IRUGO);
 
-static int __read_mostly yield_on_hlt = 1;
-module_param(yield_on_hlt, bool, S_IRUGO);
-
-static int __read_mostly fasteoi = 1;
+static bool __read_mostly fasteoi = 1;
 module_param(fasteoi, bool, S_IRUGO);
 
 /*
@@ -80,7 +78,7 @@ module_param(fasteoi, bool, S_IRUGO);
  * VMX and be a hypervisor for its own guests. If nested=0, guests may not
  * use VMX instructions.
  */
-static int __read_mostly nested = 0;
+static bool __read_mostly nested = 0;
 module_param(nested, bool, S_IRUGO);
 
 #define KVM_GUEST_CR0_MASK_UNRESTRICTED_GUEST                          \
@@ -1456,7 +1454,7 @@ static void __vmx_load_host_state(struct vcpu_vmx *vmx)
 #ifdef CONFIG_X86_64
        wrmsrl(MSR_KERNEL_GS_BASE, vmx->msr_host_kernel_gs_base);
 #endif
-       if (current_thread_info()->status & TS_USEDFPU)
+       if (__thread_has_fpu(current))
                clts();
        load_gdt(&__get_cpu_var(host_gdt));
 }
@@ -1654,17 +1652,6 @@ static void skip_emulated_instruction(struct kvm_vcpu *vcpu)
        vmx_set_interrupt_shadow(vcpu, 0);
 }
 
-static void vmx_clear_hlt(struct kvm_vcpu *vcpu)
-{
-       /* Ensure that we clear the HLT state in the VMCS.  We don't need to
-        * explicitly skip the instruction because if the HLT state is set, then
-        * the instruction is already executing and RIP has already been
-        * advanced. */
-       if (!yield_on_hlt &&
-           vmcs_read32(GUEST_ACTIVITY_STATE) == GUEST_ACTIVITY_HLT)
-               vmcs_write32(GUEST_ACTIVITY_STATE, GUEST_ACTIVITY_ACTIVE);
-}
-
 /*
  * KVM wants to inject page-faults which it got to the guest. This function
  * checks whether in a nested guest, we need to inject them to L1 or L2.
@@ -1717,7 +1704,6 @@ static void vmx_queue_exception(struct kvm_vcpu *vcpu, unsigned nr,
                intr_info |= INTR_TYPE_HARD_EXCEPTION;
 
        vmcs_write32(VM_ENTRY_INTR_INFO_FIELD, intr_info);
-       vmx_clear_hlt(vcpu);
 }
 
 static bool vmx_rdtscp_supported(void)
@@ -1747,7 +1733,6 @@ static void setup_msrs(struct vcpu_vmx *vmx)
        int save_nmsrs, index;
        unsigned long *msr_bitmap;
 
-       vmx_load_host_state(vmx);
        save_nmsrs = 0;
 #ifdef CONFIG_X86_64
        if (is_long_mode(&vmx->vcpu)) {
@@ -1817,13 +1802,19 @@ u64 vmx_read_l1_tsc(struct kvm_vcpu *vcpu)
 }
 
 /*
- * Empty call-back. Needs to be implemented when VMX enables the SET_TSC_KHZ
- * ioctl. In this case the call-back should update internal vmx state to make
- * the changes effective.
+ * Engage any workarounds for mis-matched TSC rates.  Currently limited to
+ * software catchup for faster rates on slower CPUs.
  */
-static void vmx_set_tsc_khz(struct kvm_vcpu *vcpu, u32 user_tsc_khz)
+static void vmx_set_tsc_khz(struct kvm_vcpu *vcpu, u32 user_tsc_khz, bool scale)
 {
-       /* Nothing to do here */
+       if (!scale)
+               return;
+
+       if (user_tsc_khz > tsc_khz) {
+               vcpu->arch.tsc_catchup = 1;
+               vcpu->arch.tsc_always_catchup = 1;
+       } else
+               WARN(1, "user requested TSC rate below hardware speed\n");
 }
 
 /*
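
vmx_set_tsc_khz() is no longer an empty stub: when userspace asks for a guest TSC frequency above the host's and the hardware cannot scale the TSC, the vcpu is flagged for software catch-up (a requested rate below the hardware speed cannot be compensated here, hence the WARN). A minimal sketch of what catch-up means, using a hypothetical helper rather than the generic x86 code that actually consumes these flags:

/*
 * Sketch only -- hypothetical helper, not the real consumer of
 * tsc_catchup.  The idea: compare how far the guest TSC should have
 * advanced at the requested (faster) rate with how far it actually
 * advanced at the host rate, and move TSC_OFFSET forward by the
 * shortfall before the next entry.
 */
static void example_tsc_catchup(struct kvm_vcpu *vcpu, u64 elapsed_ns,
                                u32 guest_khz)
{
        u64 want = div_u64(elapsed_ns * guest_khz, 1000000); /* cycles wanted */
        u64 have = div_u64(elapsed_ns * tsc_khz, 1000000);   /* cycles ticked */

        if (want > have)
                /* delta is in guest-TSC cycles, hence host == false */
                vmx_adjust_tsc_offset(vcpu, want - have, false);
}
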
@@ -1850,7 +1841,7 @@ static void vmx_write_tsc_offset(struct kvm_vcpu *vcpu, u64 offset)
        }
 }
 
-static void vmx_adjust_tsc_offset(struct kvm_vcpu *vcpu, s64 adjustment)
+static void vmx_adjust_tsc_offset(struct kvm_vcpu *vcpu, s64 adjustment, bool host)
 {
        u64 offset = vmcs_read64(TSC_OFFSET);
        vmcs_write64(TSC_OFFSET, offset + adjustment);
@@ -1956,6 +1947,7 @@ static __init void nested_vmx_setup_ctls_msrs(void)
 #endif
                CPU_BASED_MOV_DR_EXITING | CPU_BASED_UNCOND_IO_EXITING |
                CPU_BASED_USE_IO_BITMAPS | CPU_BASED_MONITOR_EXITING |
+               CPU_BASED_RDPMC_EXITING |
                CPU_BASED_ACTIVATE_SECONDARY_CONTROLS;
        /*
         * We can allow some features even when not supported by the
@@ -2142,12 +2134,10 @@ static int vmx_get_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 *pdata)
                        return 1;
                /* Otherwise falls through */
        default:
-               vmx_load_host_state(to_vmx(vcpu));
                if (vmx_get_vmx_msr(vcpu, msr_index, pdata))
                        return 0;
                msr = find_msr_entry(to_vmx(vcpu), msr_index);
                if (msr) {
-                       vmx_load_host_state(to_vmx(vcpu));
                        data = msr->data;
                        break;
                }
@@ -2171,7 +2161,6 @@ static int vmx_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data)
 
        switch (msr_index) {
        case MSR_EFER:
-               vmx_load_host_state(vmx);
                ret = kvm_set_msr_common(vcpu, msr_index, data);
                break;
 #ifdef CONFIG_X86_64
@@ -2220,7 +2209,6 @@ static int vmx_set_msr(struct kvm_vcpu *vcpu, u32 msr_index, u64 data)
                        break;
                msr = find_msr_entry(vmx, msr_index);
                if (msr) {
-                       vmx_load_host_state(vmx);
                        msr->data = data;
                        break;
                }
@@ -2402,7 +2390,7 @@ static __init int setup_vmcs_config(struct vmcs_config *vmcs_conf)
                                &_pin_based_exec_control) < 0)
                return -EIO;
 
-       min =
+       min = CPU_BASED_HLT_EXITING |
 #ifdef CONFIG_X86_64
              CPU_BASED_CR8_LOAD_EXITING |
              CPU_BASED_CR8_STORE_EXITING |
@@ -2414,10 +2402,8 @@ static __init int setup_vmcs_config(struct vmcs_config *vmcs_conf)
              CPU_BASED_USE_TSC_OFFSETING |
              CPU_BASED_MWAIT_EXITING |
              CPU_BASED_MONITOR_EXITING |
-             CPU_BASED_INVLPG_EXITING;
-
-       if (yield_on_hlt)
-               min |= CPU_BASED_HLT_EXITING;
+             CPU_BASED_INVLPG_EXITING |
+             CPU_BASED_RDPMC_EXITING;
 
        opt = CPU_BASED_TPR_SHADOW |
              CPU_BASED_USE_MSR_BITMAPS |
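
Moving CPU_BASED_HLT_EXITING (together with the new CPU_BASED_RDPMC_EXITING) from a conditional add into the min set makes those exits unconditional: setup_vmcs_config() treats min controls as hard requirements, while opt controls are simply dropped when the CPU lacks them. Roughly, per control MSR, the resolution works along these lines (a simplified sketch of adjust_vmx_controls(), not the verbatim function):

/* Simplified sketch of how required (min) vs. optional (opt) controls
 * are folded against a VMX capability MSR. */
static int example_adjust_controls(u32 min, u32 opt, u32 msr, u32 *result)
{
        u64 vmx_msr;
        u32 ctl = min | opt;

        rdmsrl(msr, vmx_msr);
        ctl &= (u32)(vmx_msr >> 32);    /* high word: bits allowed to be 1 */
        ctl |= (u32)vmx_msr;            /* low word: bits required to be 1 */

        if ((ctl & min) != min)         /* a required control is unsupported */
                return -EIO;
        *result = ctl;
        return 0;
}
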
@@ -2716,11 +2702,13 @@ static gva_t rmode_tss_base(struct kvm *kvm)
 {
        if (!kvm->arch.tss_addr) {
                struct kvm_memslots *slots;
+               struct kvm_memory_slot *slot;
                gfn_t base_gfn;
 
                slots = kvm_memslots(kvm);
-               base_gfn = slots->memslots[0].base_gfn +
-                                kvm->memslots->memslots[0].npages - 3;
+               slot = id_to_memslot(slots, 0);
+               base_gfn = slot->base_gfn + slot->npages - 3;
+
                return base_gfn << PAGE_SHIFT;
        }
        return kvm->arch.tss_addr;
@@ -3945,12 +3933,15 @@ static bool nested_exit_on_intr(struct kvm_vcpu *vcpu)
 static void enable_irq_window(struct kvm_vcpu *vcpu)
 {
        u32 cpu_based_vm_exec_control;
-       if (is_guest_mode(vcpu) && nested_exit_on_intr(vcpu))
-               /* We can get here when nested_run_pending caused
-                * vmx_interrupt_allowed() to return false. In this case, do
-                * nothing - the interrupt will be injected later.
+       if (is_guest_mode(vcpu) && nested_exit_on_intr(vcpu)) {
+               /*
+                * We get here if vmx_interrupt_allowed() said we can't
+                * inject to L1 now because L2 must run. Ask L2 to exit
+                * right after entry, so we can inject to L1 more promptly.
                 */
+               kvm_make_request(KVM_REQ_IMMEDIATE_EXIT, vcpu);
                return;
+       }
 
        cpu_based_vm_exec_control = vmcs_read32(CPU_BASED_VM_EXEC_CONTROL);
        cpu_based_vm_exec_control |= CPU_BASED_VIRTUAL_INTR_PENDING;
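
Rather than silently returning when an interrupt destined for L1 arrives while L2 still has to run, enable_irq_window() now raises KVM_REQ_IMMEDIATE_EXIT so the upcoming L2 entry exits again right away and the injection into L1 is not postponed until some unrelated exit. One plausible way the entry path can honour the request (hypothetical helper; the actual handling lives in the generic x86 run loop):

/*
 * Sketch only.  With interrupts already disabled for VM entry, leaving a
 * reschedule IPI pending makes the CPU take an external-interrupt exit
 * immediately after entering the (L2) guest, giving KVM a prompt
 * opportunity to inject the pending interrupt into L1.
 */
static void example_request_immediate_exit(struct kvm_vcpu *vcpu)
{
        if (kvm_check_request(KVM_REQ_IMMEDIATE_EXIT, vcpu))
                smp_send_reschedule(vcpu->cpu);
}
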
@@ -4000,7 +3991,6 @@ static void vmx_inject_irq(struct kvm_vcpu *vcpu)
        } else
                intr |= INTR_TYPE_EXT_INTR;
        vmcs_write32(VM_ENTRY_INTR_INFO_FIELD, intr);
-       vmx_clear_hlt(vcpu);
 }
 
 static void vmx_inject_nmi(struct kvm_vcpu *vcpu)
@@ -4032,7 +4022,6 @@ static void vmx_inject_nmi(struct kvm_vcpu *vcpu)
        }
        vmcs_write32(VM_ENTRY_INTR_INFO_FIELD,
                        INTR_TYPE_NMI_INTR | INTR_INFO_VALID_MASK | NMI_VECTOR);
-       vmx_clear_hlt(vcpu);
 }
 
 static int vmx_nmi_allowed(struct kvm_vcpu *vcpu)
@@ -4077,11 +4066,12 @@ static void vmx_set_nmi_mask(struct kvm_vcpu *vcpu, bool masked)
 static int vmx_interrupt_allowed(struct kvm_vcpu *vcpu)
 {
        if (is_guest_mode(vcpu) && nested_exit_on_intr(vcpu)) {
-               struct vmcs12 *vmcs12;
-               if (to_vmx(vcpu)->nested.nested_run_pending)
+               struct vmcs12 *vmcs12 = get_vmcs12(vcpu);
+               if (to_vmx(vcpu)->nested.nested_run_pending ||
+                   (vmcs12->idt_vectoring_info_field &
+                    VECTORING_INFO_VALID_MASK))
                        return 0;
                nested_vmx_vmexit(vcpu);
-               vmcs12 = get_vmcs12(vcpu);
                vmcs12->vm_exit_reason = EXIT_REASON_EXTERNAL_INTERRUPT;
                vmcs12->vm_exit_intr_info = 0;
                /* fall through to normal code, but now in L1, not L2 */
@@ -4611,6 +4601,16 @@ static int handle_invlpg(struct kvm_vcpu *vcpu)
        return 1;
 }
 
+static int handle_rdpmc(struct kvm_vcpu *vcpu)
+{
+       int err;
+
+       err = kvm_rdpmc(vcpu);
+       kvm_complete_insn_gp(vcpu, err);
+
+       return 1;
+}
+
 static int handle_wbinvd(struct kvm_vcpu *vcpu)
 {
        skip_emulated_instruction(vcpu);
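
handle_rdpmc() follows the usual exit-handler shape: call a generic helper, hand the result to kvm_complete_insn_gp() (which skips the guest instruction on success and injects #GP on failure), and return 1 to resume the guest. RDPMC takes the counter index in ECX and returns the 64-bit counter value in EDX:EAX; a rough sketch of that contract (hypothetical body, not the actual kvm_rdpmc()/PMU code):

/* Sketch only: illustrates the RDPMC register contract. */
static int example_rdpmc(struct kvm_vcpu *vcpu)
{
        unsigned int idx = kvm_register_read(vcpu, VCPU_REGS_RCX);
        u64 data;

        if (read_virtual_pmc(vcpu, idx, &data)) /* hypothetical PMU lookup */
                return 1;                       /* non-zero -> caller injects #GP */

        kvm_register_write(vcpu, VCPU_REGS_RAX, (u32)data);
        kvm_register_write(vcpu, VCPU_REGS_RDX, data >> 32);
        return 0;
}
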
@@ -5561,6 +5561,7 @@ static int (*kvm_vmx_exit_handlers[])(struct kvm_vcpu *vcpu) = {
        [EXIT_REASON_HLT]                     = handle_halt,
        [EXIT_REASON_INVD]                    = handle_invd,
        [EXIT_REASON_INVLPG]                  = handle_invlpg,
+       [EXIT_REASON_RDPMC]                   = handle_rdpmc,
        [EXIT_REASON_VMCALL]                  = handle_vmcall,
        [EXIT_REASON_VMCLEAR]                 = handle_vmclear,
        [EXIT_REASON_VMLAUNCH]                = handle_vmlaunch,