KVM: Use 'unsigned long' as kvm_for_each_vcpu()'s index
[sfrench/cifs-2.6.git] / arch / x86 / kvm / x86.c
index 5a403d92833f51e4f77d6fd67b38fd85efddb698..96bcf2035bdcd6c94a260ac969c41c1141c3d22c 100644 (file)
@@ -2816,7 +2816,7 @@ static void kvm_end_pvclock_update(struct kvm *kvm)
 {
        struct kvm_arch *ka = &kvm->arch;
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
 
        write_seqcount_end(&ka->pvclock_sc);
        raw_spin_unlock_irq(&ka->tsc_write_lock);
@@ -3065,7 +3065,7 @@ static int kvm_guest_time_update(struct kvm_vcpu *v)
 
 static void kvmclock_update_fn(struct work_struct *work)
 {
-       int i;
+       unsigned long i;
        struct delayed_work *dwork = to_delayed_work(work);
        struct kvm_arch *ka = container_of(dwork, struct kvm_arch,
                                           kvmclock_update_work);
@@ -3258,6 +3258,29 @@ static void kvm_vcpu_flush_tlb_guest(struct kvm_vcpu *vcpu)
        static_call(kvm_x86_tlb_flush_guest)(vcpu);
 }
 
+
+static inline void kvm_vcpu_flush_tlb_current(struct kvm_vcpu *vcpu)
+{
+       ++vcpu->stat.tlb_flush;
+       static_call(kvm_x86_tlb_flush_current)(vcpu);
+}
+
+/*
+ * Service "local" TLB flush requests, which are specific to the current MMU
+ * context.  In addition to the generic event handling in vcpu_enter_guest(),
+ * TLB flushes that are targeted at an MMU context also need to be serviced
+ * prior before nested VM-Enter/VM-Exit.
+ */
+void kvm_service_local_tlb_flush_requests(struct kvm_vcpu *vcpu)
+{
+       if (kvm_check_request(KVM_REQ_TLB_FLUSH_CURRENT, vcpu))
+               kvm_vcpu_flush_tlb_current(vcpu);
+
+       if (kvm_check_request(KVM_REQ_TLB_FLUSH_GUEST, vcpu))
+               kvm_vcpu_flush_tlb_guest(vcpu);
+}
+EXPORT_SYMBOL_GPL(kvm_service_local_tlb_flush_requests);
+
 static void record_steal_time(struct kvm_vcpu *vcpu)
 {
        struct gfn_to_hva_cache *ghc = &vcpu->arch.st.cache;
@@ -4133,6 +4156,7 @@ int kvm_vm_ioctl_check_extension(struct kvm *kvm, long ext)
        case KVM_CAP_SGX_ATTRIBUTE:
 #endif
        case KVM_CAP_VM_COPY_ENC_CONTEXT_FROM:
+       case KVM_CAP_VM_MOVE_ENC_CONTEXT_FROM:
        case KVM_CAP_SREGS2:
        case KVM_CAP_EXIT_ON_EMULATION_FAILURE:
        case KVM_CAP_VCPU_ATTRIBUTES:
@@ -4448,8 +4472,7 @@ void kvm_arch_vcpu_put(struct kvm_vcpu *vcpu)
 static int kvm_vcpu_ioctl_get_lapic(struct kvm_vcpu *vcpu,
                                    struct kvm_lapic_state *s)
 {
-       if (vcpu->arch.apicv_active)
-               static_call(kvm_x86_sync_pir_to_irr)(vcpu);
+       static_call_cond(kvm_x86_sync_pir_to_irr)(vcpu);
 
        return kvm_apic_get_state(vcpu, s);
 }
@@ -5124,6 +5147,17 @@ long kvm_arch_vcpu_ioctl(struct file *filp,
                struct kvm_cpuid __user *cpuid_arg = argp;
                struct kvm_cpuid cpuid;
 
+               /*
+                * KVM does not correctly handle changing guest CPUID after KVM_RUN, as
+                * MAXPHYADDR, GBPAGES support, AMD reserved bit behavior, etc. aren't
+                * tracked in kvm_mmu_page_role.  As a result, KVM may miss guest page
+                * faults due to reusing SPs/SPTEs.  In practice no sane VMM mucks with
+                * the core vCPU model on the fly, so fail.
+                */
+               r = -EINVAL;
+               if (vcpu->arch.last_vmentry_cpu != -1)
+                       goto out;
+
                r = -EFAULT;
                if (copy_from_user(&cpuid, cpuid_arg, sizeof(cpuid)))
                        goto out;
@@ -5134,6 +5168,14 @@ long kvm_arch_vcpu_ioctl(struct file *filp,
                struct kvm_cpuid2 __user *cpuid_arg = argp;
                struct kvm_cpuid2 cpuid;
 
+               /*
+                * KVM_SET_CPUID{,2} after KVM_RUN is forbidden, see the comment in
+                * KVM_SET_CPUID case above.
+                */
+               r = -EINVAL;
+               if (vcpu->arch.last_vmentry_cpu != -1)
+                       goto out;
+
                r = -EFAULT;
                if (copy_from_user(&cpuid, cpuid_arg, sizeof(cpuid)))
                        goto out;
@@ -5650,7 +5692,7 @@ void kvm_arch_sync_dirty_log(struct kvm *kvm, struct kvm_memory_slot *memslot)
         * VM-Exit.
         */
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
 
        kvm_for_each_vcpu(i, vcpu, kvm)
                kvm_vcpu_kick(vcpu);
@@ -5698,6 +5740,7 @@ int kvm_vm_ioctl_enable_cap(struct kvm *kvm,
                smp_wmb();
                kvm->arch.irqchip_mode = KVM_IRQCHIP_SPLIT;
                kvm->arch.nr_reserved_ioapic_pins = cap->args[0];
+               kvm_request_apicv_update(kvm, true, APICV_INHIBIT_REASON_ABSENT);
                r = 0;
 split_irqchip_unlock:
                mutex_unlock(&kvm->lock);
@@ -5918,7 +5961,8 @@ static int kvm_vm_ioctl_set_msr_filter(struct kvm *kvm, void __user *argp)
 static int kvm_arch_suspend_notifier(struct kvm *kvm)
 {
        struct kvm_vcpu *vcpu;
-       int i, ret = 0;
+       unsigned long i;
+       int ret = 0;
 
        mutex_lock(&kvm->lock);
        kvm_for_each_vcpu(i, vcpu, kvm) {
@@ -6078,6 +6122,7 @@ set_identity_unlock:
                /* Write kvm->irq_routing before enabling irqchip_in_kernel. */
                smp_wmb();
                kvm->arch.irqchip_mode = KVM_IRQCHIP_KERNEL;
+               kvm_request_apicv_update(kvm, true, APICV_INHIBIT_REASON_ABSENT);
        create_irqchip_unlock:
                mutex_unlock(&kvm->lock);
                break;
@@ -8344,7 +8389,8 @@ static void __kvmclock_cpufreq_notifier(struct cpufreq_freqs *freq, int cpu)
 {
        struct kvm *kvm;
        struct kvm_vcpu *vcpu;
-       int i, send_ipi = 0;
+       int send_ipi = 0;
+       unsigned long i;
 
        /*
         * We allow guests to temporarily run on slowing clocks,
@@ -8517,9 +8563,8 @@ static struct perf_guest_info_callbacks kvm_guest_cbs = {
 static void pvclock_gtod_update_fn(struct work_struct *work)
 {
        struct kvm *kvm;
-
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
 
        mutex_lock(&kvm_lock);
        list_for_each_entry(kvm, &vm_list, vm_list)
@@ -8776,10 +8821,9 @@ static void kvm_apicv_init(struct kvm *kvm)
 {
        init_rwsem(&kvm->arch.apicv_update_lock);
 
-       if (enable_apicv)
-               clear_bit(APICV_INHIBIT_REASON_DISABLE,
-                         &kvm->arch.apicv_inhibit_reasons);
-       else
+       set_bit(APICV_INHIBIT_REASON_ABSENT,
+               &kvm->arch.apicv_inhibit_reasons);
+       if (!enable_apicv)
                set_bit(APICV_INHIBIT_REASON_DISABLE,
                        &kvm->arch.apicv_inhibit_reasons);
 }
@@ -9528,8 +9572,7 @@ static void vcpu_scan_ioapic(struct kvm_vcpu *vcpu)
        if (irqchip_split(vcpu->kvm))
                kvm_scan_ioapic_routes(vcpu, vcpu->arch.ioapic_handled_vectors);
        else {
-               if (vcpu->arch.apicv_active)
-                       static_call(kvm_x86_sync_pir_to_irr)(vcpu);
+               static_call_cond(kvm_x86_sync_pir_to_irr)(vcpu);
                if (ioapic_in_kernel(vcpu->kvm))
                        kvm_ioapic_scan_entry(vcpu, vcpu->arch.ioapic_handled_vectors);
        }
@@ -9648,10 +9691,7 @@ static int vcpu_enter_guest(struct kvm_vcpu *vcpu)
                        /* Flushing all ASIDs flushes the current ASID... */
                        kvm_clear_request(KVM_REQ_TLB_FLUSH_CURRENT, vcpu);
                }
-               if (kvm_check_request(KVM_REQ_TLB_FLUSH_CURRENT, vcpu))
-                       kvm_vcpu_flush_tlb_current(vcpu);
-               if (kvm_check_request(KVM_REQ_TLB_FLUSH_GUEST, vcpu))
-                       kvm_vcpu_flush_tlb_guest(vcpu);
+               kvm_service_local_tlb_flush_requests(vcpu);
 
                if (kvm_check_request(KVM_REQ_REPORT_TPR_ACCESS, vcpu)) {
                        vcpu->run->exit_reason = KVM_EXIT_TPR_ACCESS;
@@ -9802,10 +9842,12 @@ static int vcpu_enter_guest(struct kvm_vcpu *vcpu)
 
        /*
         * This handles the case where a posted interrupt was
-        * notified with kvm_vcpu_kick.
+        * notified with kvm_vcpu_kick.  Assigned devices can
+        * use the POSTED_INTR_VECTOR even if APICv is disabled,
+        * so do it even if APICv is disabled on this vCPU.
         */
-       if (kvm_lapic_enabled(vcpu) && vcpu->arch.apicv_active)
-               static_call(kvm_x86_sync_pir_to_irr)(vcpu);
+       if (kvm_lapic_enabled(vcpu))
+               static_call_cond(kvm_x86_sync_pir_to_irr)(vcpu);
 
        if (kvm_vcpu_exit_request(vcpu)) {
                vcpu->mode = OUTSIDE_GUEST_MODE;
@@ -9849,8 +9891,8 @@ static int vcpu_enter_guest(struct kvm_vcpu *vcpu)
                if (likely(exit_fastpath != EXIT_FASTPATH_REENTER_GUEST))
                        break;
 
-               if (vcpu->arch.apicv_active)
-                       static_call(kvm_x86_sync_pir_to_irr)(vcpu);
+               if (kvm_lapic_enabled(vcpu))
+                       static_call_cond(kvm_x86_sync_pir_to_irr)(vcpu);
 
                if (unlikely(kvm_vcpu_exit_request(vcpu))) {
                        exit_fastpath = EXIT_FASTPATH_EXIT_HANDLED;
@@ -10631,7 +10673,7 @@ static void kvm_arch_vcpu_guestdbg_update_apicv_inhibit(struct kvm *kvm)
 {
        bool inhibit = false;
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
 
        down_write(&kvm->arch.apicv_update_lock);
 
@@ -11119,7 +11161,7 @@ int kvm_arch_hardware_enable(void)
 {
        struct kvm *kvm;
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
        int ret;
        u64 local_tsc;
        u64 max_tsc = 0;
@@ -11372,7 +11414,7 @@ static void kvm_unload_vcpu_mmu(struct kvm_vcpu *vcpu)
 
 static void kvm_free_vcpus(struct kvm *kvm)
 {
-       unsigned int i;
+       unsigned long i;
        struct kvm_vcpu *vcpu;
 
        /*
@@ -11382,15 +11424,8 @@ static void kvm_free_vcpus(struct kvm *kvm)
                kvm_clear_async_pf_completion_queue(vcpu);
                kvm_unload_vcpu_mmu(vcpu);
        }
-       kvm_for_each_vcpu(i, vcpu, kvm)
-               kvm_vcpu_destroy(vcpu);
 
-       mutex_lock(&kvm->lock);
-       for (i = 0; i < atomic_read(&kvm->online_vcpus); i++)
-               kvm->vcpus[i] = NULL;
-
-       atomic_set(&kvm->online_vcpus, 0);
-       mutex_unlock(&kvm->lock);
+       kvm_destroy_vcpus(kvm);
 }
 
 void kvm_arch_sync_events(struct kvm *kvm)
@@ -11625,7 +11660,7 @@ out_free:
 void kvm_arch_memslots_updated(struct kvm *kvm, u64 gen)
 {
        struct kvm_vcpu *vcpu;
-       int i;
+       unsigned long i;
 
        /*
         * memslots->generation has been incremented.