Merge commit 'origin/master' into for-linus/xen/master

author Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>

Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)

committer Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>

Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)
author Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)
committer Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)
diff --combined arch/x86/include/asm/paravirt.h

index dfdee0ca57d3a3328c6ac4dfe1dde729df5fde6b,7727aa8b7dda99087ca5ced1046a92046ab7c4d5..bc384be6aa44d404ca12ce7ec350bee248dd6df4
--- 1/arch/x86/include/asm/paravirt.h
--- 2/arch/x86/include/asm/paravirt.h
+++ b/arch/x86/include/asm/paravirt.h
@@@ -56,7 -56,6 +56,7 @@@ struct desc_ptr
   struct tss_struct;
   struct mm_struct;
   struct desc_struct;
+ +struct task_struct;
   
   /*
    * Wrapper type for pointers to code which uses the non-standard
@@@ -204,8 -203,7 +204,8 @@@ struct pv_cpu_ops 
   
         void (*swapgs)(void);
   
- -      struct pv_lazy_ops lazy_mode;
+ +      void (*start_context_switch)(struct task_struct *prev);
+ +      void (*end_context_switch)(struct task_struct *next);
   };
   
   struct pv_irq_ops {
@@@ -319,8 -317,6 +319,6 @@@ struct pv_mmu_ops 
   #if PAGETABLE_LEVELS >= 3
   #ifdef CONFIG_X86_PAE
         void (*set_pte_atomic)(pte_t *ptep, pte_t pteval);
-       void (*set_pte_present)(struct mm_struct *mm, unsigned long addr,
-                               pte_t *ptep, pte_t pte);
         void (*pte_clear)(struct mm_struct *mm, unsigned long addr,
                           pte_t *ptep);
         void (*pmd_clear)(pmd_t *pmdp);
@@@ -391,7 -387,7 +389,7 @@@ extern struct pv_lock_ops pv_lock_ops
   
   #define paravirt_type(op)                             \
         [paravirt_typenum] "i" (PARAVIRT_PATCH(op)),    \
-       [paravirt_opptr] "m" (op)
+       [paravirt_opptr] "i" (&(op))
   #define paravirt_clobber(clobber)             \
         [paravirt_clobber] "i" (clobber)
   
@@@ -445,7 -441,7 +443,7 @@@ int paravirt_disable_iospace(void)
    * offset into the paravirt_patch_template structure, and can therefore be
    * freely converted back into a structure offset.
    */
- #define PARAVIRT_CALL "call *%[paravirt_opptr];"
+ #define PARAVIRT_CALL "call *%c[paravirt_opptr];"
   
   /*
    * These macros are intended to wrap calls through one of the paravirt
@@@ -1367,13 -1363,6 +1365,6 @@@ static inline void set_pte_atomic(pte_
                     pte.pte, pte.pte >> 32);
   }
   
- static inline void set_pte_present(struct mm_struct *mm, unsigned long addr,
-                                  pte_t *ptep, pte_t pte)
- {
-       /* 5 arg words */
-       pv_mmu_ops.set_pte_present(mm, addr, ptep, pte);
- }
- 
   static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
                              pte_t *ptep)
   {
@@@ -1390,12 -1379,6 +1381,6 @@@ static inline void set_pte_atomic(pte_
         set_pte(ptep, pte);
   }
   
- static inline void set_pte_present(struct mm_struct *mm, unsigned long addr,
-                                  pte_t *ptep, pte_t pte)
- {
-       set_pte(ptep, pte);
- }
- 
   static inline void pte_clear(struct mm_struct *mm, unsigned long addr,
                              pte_t *ptep)
   {
@@@ -1416,23 -1399,25 +1401,23 @@@ enum paravirt_lazy_mode 
   };
   
   enum paravirt_lazy_mode paravirt_get_lazy_mode(void);
- -void paravirt_enter_lazy_cpu(void);
- -void paravirt_leave_lazy_cpu(void);
+ +void paravirt_start_context_switch(struct task_struct *prev);
+ +void paravirt_end_context_switch(struct task_struct *next);
+ +
   void paravirt_enter_lazy_mmu(void);
   void paravirt_leave_lazy_mmu(void);
- -void paravirt_leave_lazy(enum paravirt_lazy_mode mode);
   
- -#define  __HAVE_ARCH_ENTER_LAZY_CPU_MODE
- -static inline void arch_enter_lazy_cpu_mode(void)
+ +#define  __HAVE_ARCH_START_CONTEXT_SWITCH
+ +static inline void arch_start_context_switch(struct task_struct *prev)
   {
- -      PVOP_VCALL0(pv_cpu_ops.lazy_mode.enter);
+ +      PVOP_VCALL1(pv_cpu_ops.start_context_switch, prev);
   }
   
- -static inline void arch_leave_lazy_cpu_mode(void)
+ +static inline void arch_end_context_switch(struct task_struct *next)
   {
- -      PVOP_VCALL0(pv_cpu_ops.lazy_mode.leave);
+ +      PVOP_VCALL1(pv_cpu_ops.end_context_switch, next);
   }
   
- -void arch_flush_lazy_cpu_mode(void);
- -
   #define  __HAVE_ARCH_ENTER_LAZY_MMU_MODE
   static inline void arch_enter_lazy_mmu_mode(void)
   {
diff --combined arch/x86/include/asm/pgtable.h

index 24e42836e92142f339e068feea1a514f29d593d6,29d96d168bc097195e9cbe66ab723c90929e1116..b27c4f29b5e01bd92c04d28534f29dc19247e2f7
--- 1/arch/x86/include/asm/pgtable.h
--- 2/arch/x86/include/asm/pgtable.h
+++ b/arch/x86/include/asm/pgtable.h
@@@ -31,8 -31,6 +31,6 @@@ extern struct list_head pgd_list
   #define set_pte(ptep, pte)            native_set_pte(ptep, pte)
   #define set_pte_at(mm, addr, ptep, pte)       native_set_pte_at(mm, addr, ptep, pte)
   
- #define set_pte_present(mm, addr, ptep, pte)                          \
-       native_set_pte_present(mm, addr, ptep, pte)
   #define set_pte_atomic(ptep, pte)                                     \
         native_set_pte_atomic(ptep, pte)
   
@@@ -83,8 -81,6 +81,8 @@@ static inline void __init paravirt_page
   #define pte_val(x)    native_pte_val(x)
   #define __pte(x)      native_make_pte(x)
   
+ +#define arch_end_context_switch(prev) do {} while(0)
+ +
   #endif        /* CONFIG_PARAVIRT */
   
   /*
diff --combined arch/x86/include/asm/thread_info.h

index 2f34d643b567c6d267d066eb95fce4486ff13d71,8820a73ae090aae29aa3454d6f3241ffcbef5440..602c769fc98ca7340f5388fe21e57ce5431b376e
--- 1/arch/x86/include/asm/thread_info.h
--- 2/arch/x86/include/asm/thread_info.h
+++ b/arch/x86/include/asm/thread_info.h
@@@ -94,7 -94,7 +94,8 @@@ struct thread_info 
   #define TIF_FORCED_TF         24      /* true if TF in eflags artificially */
   #define TIF_DEBUGCTLMSR               25      /* uses thread_struct.debugctlmsr */
   #define TIF_DS_AREA_MSR               26      /* uses thread_struct.ds_area_msr */
- -#define TIF_SYSCALL_FTRACE    27      /* for ftrace syscall instrumentation */
+ +#define TIF_LAZY_MMU_UPDATES  27      /* task is updating the mmu lazily */
++#define TIF_SYSCALL_FTRACE    28      /* for ftrace syscall instrumentation */
   
   #define _TIF_SYSCALL_TRACE    (1 << TIF_SYSCALL_TRACE)
   #define _TIF_NOTIFY_RESUME    (1 << TIF_NOTIFY_RESUME)
@@@ -116,16 -116,17 +117,18 @@@
   #define _TIF_FORCED_TF                (1 << TIF_FORCED_TF)
   #define _TIF_DEBUGCTLMSR      (1 << TIF_DEBUGCTLMSR)
   #define _TIF_DS_AREA_MSR      (1 << TIF_DS_AREA_MSR)
+ +#define _TIF_LAZY_MMU_UPDATES (1 << TIF_LAZY_MMU_UPDATES)
+ #define _TIF_SYSCALL_FTRACE   (1 << TIF_SYSCALL_FTRACE)
   
   /* work to do in syscall_trace_enter() */
   #define _TIF_WORK_SYSCALL_ENTRY       \
-       (_TIF_SYSCALL_TRACE | _TIF_SYSCALL_EMU | \
+       (_TIF_SYSCALL_TRACE | _TIF_SYSCALL_EMU | _TIF_SYSCALL_FTRACE |  \
          _TIF_SYSCALL_AUDIT | _TIF_SECCOMP | _TIF_SINGLESTEP)
   
   /* work to do in syscall_trace_leave() */
   #define _TIF_WORK_SYSCALL_EXIT        \
-       (_TIF_SYSCALL_TRACE | _TIF_SYSCALL_AUDIT | _TIF_SINGLESTEP)
+       (_TIF_SYSCALL_TRACE | _TIF_SYSCALL_AUDIT | _TIF_SINGLESTEP |    \
+        _TIF_SYSCALL_FTRACE)
   
   /* work to do on interrupt/exception return */
   #define _TIF_WORK_MASK                                                        \
@@@ -134,7 -135,7 +137,7 @@@
            _TIF_SINGLESTEP|_TIF_SECCOMP|_TIF_SYSCALL_EMU))
   
   /* work to do on any return to user space */
- #define _TIF_ALLWORK_MASK (0x0000FFFF & ~_TIF_SECCOMP)
+ #define _TIF_ALLWORK_MASK ((0x0000FFFF & ~_TIF_SECCOMP) | _TIF_SYSCALL_FTRACE)
   
   /* Only used for 64 bit */
   #define _TIF_DO_NOTIFY_MASK                                           \
diff --combined arch/x86/kernel/kvm.c

index 5d7f6e76b5dc67fd7b4746e2aa494bc469bedd94,33019ddb56b452ce736f4b70fcb5d4efe8d0ae9d..6551dedee20c71a58a8f902bdee88dd0e8c4d7f8
--- 1/arch/x86/kernel/kvm.c
--- 2/arch/x86/kernel/kvm.c
+++ b/arch/x86/kernel/kvm.c
@@@ -138,12 -138,6 +138,6 @@@ static void kvm_set_pte_atomic(pte_t *p
         kvm_mmu_write(ptep, pte_val(pte));
   }
   
- static void kvm_set_pte_present(struct mm_struct *mm, unsigned long addr,
-                               pte_t *ptep, pte_t pte)
- {
-       kvm_mmu_write(ptep, pte_val(pte));
- }
- 
   static void kvm_pte_clear(struct mm_struct *mm,
                           unsigned long addr, pte_t *ptep)
   {
@@@ -201,7 -195,7 +195,7 @@@ static void kvm_leave_lazy_mmu(void
         struct kvm_para_state *state = kvm_para_state();
   
         mmu_queue_flush(state);
- -      paravirt_leave_lazy(paravirt_get_lazy_mode());
+ +      paravirt_leave_lazy_mmu();
         state->mode = paravirt_get_lazy_mode();
   }
   
@@@ -220,7 -214,6 +214,6 @@@ static void paravirt_ops_setup(void
   #if PAGETABLE_LEVELS >= 3
   #ifdef CONFIG_X86_PAE
                 pv_mmu_ops.set_pte_atomic = kvm_set_pte_atomic;
-               pv_mmu_ops.set_pte_present = kvm_set_pte_present;
                 pv_mmu_ops.pte_clear = kvm_pte_clear;
                 pv_mmu_ops.pmd_clear = kvm_pmd_clear;
   #endif
diff --combined arch/x86/kernel/paravirt.c

index 254e8aa8bfdb1f64da37941de41a20fc0850d4e8,8e45f4464880ccdba671ea5248c5e2bea4f9b297..aa3442340705bfa7e8855e4e0fcac80a5af60809
--- 1/arch/x86/kernel/paravirt.c
--- 2/arch/x86/kernel/paravirt.c
+++ b/arch/x86/kernel/paravirt.c
@@@ -246,16 -246,18 +246,16 @@@ static DEFINE_PER_CPU(enum paravirt_laz
   
   static inline void enter_lazy(enum paravirt_lazy_mode mode)
   {
- -      BUG_ON(__get_cpu_var(paravirt_lazy_mode) != PARAVIRT_LAZY_NONE);
- -      BUG_ON(preemptible());
+ +      BUG_ON(percpu_read(paravirt_lazy_mode) != PARAVIRT_LAZY_NONE);
   
- -      __get_cpu_var(paravirt_lazy_mode) = mode;
+ +      percpu_write(paravirt_lazy_mode, mode);
   }
   
- -void paravirt_leave_lazy(enum paravirt_lazy_mode mode)
+ +static void leave_lazy(enum paravirt_lazy_mode mode)
   {
- -      BUG_ON(__get_cpu_var(paravirt_lazy_mode) != mode);
- -      BUG_ON(preemptible());
+ +      BUG_ON(percpu_read(paravirt_lazy_mode) != mode);
   
- -      __get_cpu_var(paravirt_lazy_mode) = PARAVIRT_LAZY_NONE;
+ +      percpu_write(paravirt_lazy_mode, PARAVIRT_LAZY_NONE);
   }
   
   void paravirt_enter_lazy_mmu(void)
@@@ -265,36 -267,22 +265,36 @@@
   
   void paravirt_leave_lazy_mmu(void)
   {
- -      paravirt_leave_lazy(PARAVIRT_LAZY_MMU);
+ +      leave_lazy(PARAVIRT_LAZY_MMU);
   }
   
- -void paravirt_enter_lazy_cpu(void)
+ +void paravirt_start_context_switch(struct task_struct *prev)
   {
+ +      BUG_ON(preemptible());
+ +
+ +      if (percpu_read(paravirt_lazy_mode) == PARAVIRT_LAZY_MMU) {
+ +              arch_leave_lazy_mmu_mode();
+ +              set_ti_thread_flag(task_thread_info(prev), TIF_LAZY_MMU_UPDATES);
+ +      }
         enter_lazy(PARAVIRT_LAZY_CPU);
   }
   
- -void paravirt_leave_lazy_cpu(void)
+ +void paravirt_end_context_switch(struct task_struct *next)
   {
- -      paravirt_leave_lazy(PARAVIRT_LAZY_CPU);
+ +      BUG_ON(preemptible());
+ +
+ +      leave_lazy(PARAVIRT_LAZY_CPU);
+ +
+ +      if (test_and_clear_ti_thread_flag(task_thread_info(next), TIF_LAZY_MMU_UPDATES))
+ +              arch_enter_lazy_mmu_mode();
   }
   
   enum paravirt_lazy_mode paravirt_get_lazy_mode(void)
   {
- -      return __get_cpu_var(paravirt_lazy_mode);
+ +      if (in_interrupt())
+ +              return PARAVIRT_LAZY_NONE;
+ +
+ +      return percpu_read(paravirt_lazy_mode);
   }
   
   void arch_flush_lazy_mmu_mode(void)
@@@ -302,6 -290,7 +302,6 @@@
         preempt_disable();
   
         if (paravirt_get_lazy_mode() == PARAVIRT_LAZY_MMU) {
- -              WARN_ON(preempt_count() == 1);
                 arch_leave_lazy_mmu_mode();
                 arch_enter_lazy_mmu_mode();
         }
@@@ -309,6 -298,19 +309,6 @@@
         preempt_enable();
   }
   
- -void arch_flush_lazy_cpu_mode(void)
- -{
- -      preempt_disable();
- -
- -      if (paravirt_get_lazy_mode() == PARAVIRT_LAZY_CPU) {
- -              WARN_ON(preempt_count() == 1);
- -              arch_leave_lazy_cpu_mode();
- -              arch_enter_lazy_cpu_mode();
- -      }
- -
- -      preempt_enable();
- -}
- -
   struct pv_info pv_info = {
         .name = "bare hardware",
         .paravirt_enabled = 0,
@@@ -400,8 -402,10 +400,8 @@@ struct pv_cpu_ops pv_cpu_ops = 
         .set_iopl_mask = native_set_iopl_mask,
         .io_delay = native_io_delay,
   
- -      .lazy_mode = {
- -              .enter = paravirt_nop,
- -              .leave = paravirt_nop,
- -      },
+ +      .start_context_switch = paravirt_nop,
+ +      .end_context_switch = paravirt_nop,
   };
   
   struct pv_apic_ops pv_apic_ops = {
@@@ -466,7 -470,6 +466,6 @@@ struct pv_mmu_ops pv_mmu_ops = 
   #if PAGETABLE_LEVELS >= 3
   #ifdef CONFIG_X86_PAE
         .set_pte_atomic = native_set_pte_atomic,
-       .set_pte_present = native_set_pte_present,
         .pte_clear = native_pte_clear,
         .pmd_clear = native_pmd_clear,
   #endif
diff --combined arch/x86/kernel/process_32.c

index d766c7616fd7dc96d9cd2c879371db89d1c0f9bd,76f8f84043a2a4693123648d92d08c22ca7f5f25..5de30f0960fb137c272eb93c5381e3e26497e0fd
--- 1/arch/x86/kernel/process_32.c
--- 2/arch/x86/kernel/process_32.c
+++ b/arch/x86/kernel/process_32.c
@@@ -245,7 -245,7 +245,7 @@@ void prepare_to_copy(struct task_struc
         unlazy_fpu(tsk);
   }
   
- int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
+ int copy_thread(unsigned long clone_flags, unsigned long sp,
         unsigned long unused,
         struct task_struct *p, struct pt_regs *regs)
   {
@@@ -407,7 -407,7 +407,7 @@@ __switch_to(struct task_struct *prev_p
          * done before math_state_restore, so the TS bit is up
          * to date.
          */
- -      arch_leave_lazy_cpu_mode();
+ +      arch_end_context_switch(next_p);
   
         /* If the task has used fpu the last 5 timeslices, just do a full
          * restore of the math state immediately to avoid the trap; the
diff --combined arch/x86/kernel/process_64.c

index e8a9aaf9df889ff24661980bcaa06214e2bd24ce,b751a41392b1b997d3c9a3235ba85b2372bdf7a3..66ad06791d6f3ca5e5d15f40c1cbeb1228aaa581
--- 1/arch/x86/kernel/process_64.c
--- 2/arch/x86/kernel/process_64.c
+++ b/arch/x86/kernel/process_64.c
@@@ -278,7 -278,7 +278,7 @@@ void prepare_to_copy(struct task_struc
         unlazy_fpu(tsk);
   }
   
- int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
+ int copy_thread(unsigned long clone_flags, unsigned long sp,
                 unsigned long unused,
         struct task_struct *p, struct pt_regs *regs)
   {
@@@ -428,7 -428,7 +428,7 @@@ __switch_to(struct task_struct *prev_p
          * done before math_state_restore, so the TS bit is up
          * to date.
          */
- -      arch_leave_lazy_cpu_mode();
+ +      arch_end_context_switch(next_p);
   
         /*
          * Switch FS and GS.
diff --combined arch/x86/kernel/vmi_32.c

index 55a5d6938e5e7479fe7c4e0870e8b40d811c274e,95deb9f2211e98decb5572e4757bc2cc48f3da18..b263423fbe2ae971424c5bd99c112ac984413383
--- 1/arch/x86/kernel/vmi_32.c
--- 2/arch/x86/kernel/vmi_32.c
+++ b/arch/x86/kernel/vmi_32.c
@@@ -395,11 -395,6 +395,6 @@@ static void vmi_set_pte_atomic(pte_t *p
         vmi_ops.update_pte(ptep, VMI_PAGE_PT);
   }
   
- static void vmi_set_pte_present(struct mm_struct *mm, unsigned long addr, pte_t *ptep, pte_t pte)
- {
-       vmi_ops.set_pte(pte, ptep, vmi_flags_addr_defer(mm, addr, VMI_PAGE_PT, 1));
- }
- 
   static void vmi_set_pud(pud_t *pudp, pud_t pudval)
   {
         /* Um, eww */
@@@ -467,28 -462,22 +462,28 @@@ vmi_startup_ipi_hook(int phys_apicid, u
   }
   #endif
   
- -static void vmi_enter_lazy_cpu(void)
+ +static void vmi_start_context_switch(struct task_struct *prev)
   {
- -      paravirt_enter_lazy_cpu();
+ +      paravirt_start_context_switch(prev);
         vmi_ops.set_lazy_mode(2);
   }
   
+ +static void vmi_end_context_switch(struct task_struct *next)
+ +{
+ +      vmi_ops.set_lazy_mode(0);
+ +      paravirt_end_context_switch(next);
+ +}
+ +
   static void vmi_enter_lazy_mmu(void)
   {
         paravirt_enter_lazy_mmu();
         vmi_ops.set_lazy_mode(1);
   }
   
- -static void vmi_leave_lazy(void)
+ +static void vmi_leave_lazy_mmu(void)
   {
- -      paravirt_leave_lazy(paravirt_get_lazy_mode());
         vmi_ops.set_lazy_mode(0);
+ +      paravirt_leave_lazy_mmu();
   }
   
   static inline int __init check_vmi_rom(struct vrom_header *rom)
@@@ -722,14 -711,14 +717,14 @@@ static inline int __init activate_vmi(v
         para_fill(pv_cpu_ops.set_iopl_mask, SetIOPLMask);
         para_fill(pv_cpu_ops.io_delay, IODelay);
   
- -      para_wrap(pv_cpu_ops.lazy_mode.enter, vmi_enter_lazy_cpu,
+ +      para_wrap(pv_cpu_ops.start_context_switch, vmi_start_context_switch,
                   set_lazy_mode, SetLazyMode);
- -      para_wrap(pv_cpu_ops.lazy_mode.leave, vmi_leave_lazy,
+ +      para_wrap(pv_cpu_ops.end_context_switch, vmi_end_context_switch,
                   set_lazy_mode, SetLazyMode);
   
         para_wrap(pv_mmu_ops.lazy_mode.enter, vmi_enter_lazy_mmu,
                   set_lazy_mode, SetLazyMode);
- -      para_wrap(pv_mmu_ops.lazy_mode.leave, vmi_leave_lazy,
+ +      para_wrap(pv_mmu_ops.lazy_mode.leave, vmi_leave_lazy_mmu,
                   set_lazy_mode, SetLazyMode);
   
         /* user and kernel flush are just handled with different flags to FlushTLB */
@@@ -756,7 -745,6 +751,6 @@@
                 pv_mmu_ops.set_pmd = vmi_set_pmd;
   #ifdef CONFIG_X86_PAE
                 pv_mmu_ops.set_pte_atomic = vmi_set_pte_atomic;
-               pv_mmu_ops.set_pte_present = vmi_set_pte_present;
                 pv_mmu_ops.set_pud = vmi_set_pud;
                 pv_mmu_ops.pte_clear = vmi_pte_clear;
                 pv_mmu_ops.pmd_clear = vmi_pmd_clear;
diff --combined arch/x86/lguest/boot.c

index 5287081b356709978183af6aa77d658e1db815c0,e94a11e42f9864a35e197d9fdf7919accc8ba095..5ab239711cc218c56000c7893a26ae7288341281
--- 1/arch/x86/lguest/boot.c
--- 2/arch/x86/lguest/boot.c
+++ b/arch/x86/lguest/boot.c
@@@ -107,7 -107,7 +107,7 @@@ static void async_hcall(unsigned long c
         local_irq_save(flags);
         if (lguest_data.hcall_status[next_call] != 0xFF) {
                 /* Table full, so do normal hcall which will flush table. */
-               hcall(call, arg1, arg2, arg3);
+               kvm_hypercall3(call, arg1, arg2, arg3);
         } else {
                 lguest_data.hcalls[next_call].arg0 = call;
                 lguest_data.hcalls[next_call].arg1 = arg1;
@@@ -134,29 -134,42 +134,48 @@@
    *
    * So, when we're in lazy mode, we call async_hcall() to store the call for
    * future processing: */
- static void lazy_hcall(unsigned long call,
+ static void lazy_hcall1(unsigned long call,
+                      unsigned long arg1)
+ {
+       if (paravirt_get_lazy_mode() == PARAVIRT_LAZY_NONE)
+               kvm_hypercall1(call, arg1);
+       else
+               async_hcall(call, arg1, 0, 0);
+ }
+ 
+ static void lazy_hcall2(unsigned long call,
+                      unsigned long arg1,
+                      unsigned long arg2)
+ {
+       if (paravirt_get_lazy_mode() == PARAVIRT_LAZY_NONE)
+               kvm_hypercall2(call, arg1, arg2);
+       else
+               async_hcall(call, arg1, arg2, 0);
+ }
+ 
+ static void lazy_hcall3(unsigned long call,
                        unsigned long arg1,
                        unsigned long arg2,
                        unsigned long arg3)
   {
         if (paravirt_get_lazy_mode() == PARAVIRT_LAZY_NONE)
-               hcall(call, arg1, arg2, arg3);
+               kvm_hypercall3(call, arg1, arg2, arg3);
         else
                 async_hcall(call, arg1, arg2, arg3);
   }
   
   /* When lazy mode is turned off reset the per-cpu lazy mode variable and then
    * issue the do-nothing hypercall to flush any stored calls. */
- -static void lguest_leave_lazy_mode(void)
+ +static void lguest_leave_lazy_mmu_mode(void)
+ +{
+ +      hcall(LHCALL_FLUSH_ASYNC, 0, 0, 0);
+ +      paravirt_leave_lazy_mmu();
+ +}
+ +
+ +static void lguest_end_context_switch(struct task_struct *next)
   {
-       hcall(LHCALL_FLUSH_ASYNC, 0, 0, 0);
- -      paravirt_leave_lazy(paravirt_get_lazy_mode());
+       kvm_hypercall0(LHCALL_FLUSH_ASYNC);
+ +      paravirt_end_context_switch(next);
   }
   
   /*G:033
@@@ -235,7 -248,7 +254,7 @@@ static void lguest_write_idt_entry(gate
         /* Keep the local copy up to date. */
         native_write_idt_entry(dt, entrynum, g);
         /* Tell Host about this new entry. */
-       hcall(LHCALL_LOAD_IDT_ENTRY, entrynum, desc[0], desc[1]);
+       kvm_hypercall3(LHCALL_LOAD_IDT_ENTRY, entrynum, desc[0], desc[1]);
   }
   
   /* Changing to a different IDT is very rare: we keep the IDT up-to-date every
@@@ -247,7 -260,7 +266,7 @@@ static void lguest_load_idt(const struc
         struct desc_struct *idt = (void *)desc->address;
   
         for (i = 0; i < (desc->size+1)/8; i++)
-               hcall(LHCALL_LOAD_IDT_ENTRY, i, idt[i].a, idt[i].b);
+               kvm_hypercall3(LHCALL_LOAD_IDT_ENTRY, i, idt[i].a, idt[i].b);
   }
   
   /*
@@@ -267,8 -280,8 +286,8 @@@
    */
   static void lguest_load_gdt(const struct desc_ptr *desc)
   {
-       BUG_ON((desc->size+1)/8 != GDT_ENTRIES);
-       hcall(LHCALL_LOAD_GDT, __pa(desc->address), GDT_ENTRIES, 0);
+       BUG_ON((desc->size + 1) / 8 != GDT_ENTRIES);
+       kvm_hypercall2(LHCALL_LOAD_GDT, __pa(desc->address), GDT_ENTRIES);
   }
   
   /* For a single GDT entry which changes, we do the lazy thing: alter our GDT,
@@@ -278,7 -291,7 +297,7 @@@ static void lguest_write_gdt_entry(stru
                                    const void *desc, int type)
   {
         native_write_gdt_entry(dt, entrynum, desc, type);
-       hcall(LHCALL_LOAD_GDT, __pa(dt), GDT_ENTRIES, 0);
+       kvm_hypercall2(LHCALL_LOAD_GDT, __pa(dt), GDT_ENTRIES);
   }
   
   /* OK, I lied.  There are three "thread local storage" GDT entries which change
@@@ -290,7 -303,7 +309,7 @@@ static void lguest_load_tls(struct thre
          * can't handle us removing entries we're currently using.  So we clear
          * the GS register here: if it's needed it'll be reloaded anyway. */
         lazy_load_gs(0);
-       lazy_hcall(LHCALL_LOAD_TLS, __pa(&t->tls_array), cpu, 0);
+       lazy_hcall2(LHCALL_LOAD_TLS, __pa(&t->tls_array), cpu);
   }
   
   /*G:038 That's enough excitement for now, back to ploughing through each of
@@@ -388,7 -401,7 +407,7 @@@ static void lguest_cpuid(unsigned int *
   static unsigned long current_cr0;
   static void lguest_write_cr0(unsigned long val)
   {
-       lazy_hcall(LHCALL_TS, val & X86_CR0_TS, 0, 0);
+       lazy_hcall1(LHCALL_TS, val & X86_CR0_TS);
         current_cr0 = val;
   }
   
@@@ -402,7 -415,7 +421,7 @@@ static unsigned long lguest_read_cr0(vo
    * the vowels have been optimized out. */
   static void lguest_clts(void)
   {
-       lazy_hcall(LHCALL_TS, 0, 0, 0);
+       lazy_hcall1(LHCALL_TS, 0);
         current_cr0 &= ~X86_CR0_TS;
   }
   
@@@ -424,7 -437,7 +443,7 @@@ static bool cr3_changed = false
   static void lguest_write_cr3(unsigned long cr3)
   {
         lguest_data.pgdir = cr3;
-       lazy_hcall(LHCALL_NEW_PGTABLE, cr3, 0, 0);
+       lazy_hcall1(LHCALL_NEW_PGTABLE, cr3);
         cr3_changed = true;
   }
   
@@@ -496,11 -509,17 +515,17 @@@ static void lguest_write_cr4(unsigned l
    * into a process' address space.  We set the entry then tell the Host the
    * toplevel and address this corresponds to.  The Guest uses one pagetable per
    * process, so we need to tell the Host which one we're changing (mm->pgd). */
+ static void lguest_pte_update(struct mm_struct *mm, unsigned long addr,
+                              pte_t *ptep)
+ {
+       lazy_hcall3(LHCALL_SET_PTE, __pa(mm->pgd), addr, ptep->pte_low);
+ }
+ 
   static void lguest_set_pte_at(struct mm_struct *mm, unsigned long addr,
                               pte_t *ptep, pte_t pteval)
   {
         *ptep = pteval;
-       lazy_hcall(LHCALL_SET_PTE, __pa(mm->pgd), addr, pteval.pte_low);
+       lguest_pte_update(mm, addr, ptep);
   }
   
   /* The Guest calls this to set a top-level entry.  Again, we set the entry then
@@@ -509,8 -528,8 +534,8 @@@
   static void lguest_set_pmd(pmd_t *pmdp, pmd_t pmdval)
   {
         *pmdp = pmdval;
-       lazy_hcall(LHCALL_SET_PMD, __pa(pmdp)&PAGE_MASK,
-                  (__pa(pmdp)&(PAGE_SIZE-1))/4, 0);
+       lazy_hcall2(LHCALL_SET_PMD, __pa(pmdp) & PAGE_MASK,
+                  (__pa(pmdp) & (PAGE_SIZE - 1)) / 4);
   }
   
   /* There are a couple of legacy places where the kernel sets a PTE, but we
@@@ -526,7 -545,7 +551,7 @@@ static void lguest_set_pte(pte_t *ptep
   {
         *ptep = pteval;
         if (cr3_changed)
-               lazy_hcall(LHCALL_FLUSH_TLB, 1, 0, 0);
+               lazy_hcall1(LHCALL_FLUSH_TLB, 1);
   }
   
   /* Unfortunately for Lguest, the pv_mmu_ops for page tables were based on
@@@ -542,7 -561,7 +567,7 @@@
   static void lguest_flush_tlb_single(unsigned long addr)
   {
         /* Simply set it to zero: if it was not, it will fault back in. */
-       lazy_hcall(LHCALL_SET_PTE, lguest_data.pgdir, addr, 0);
+       lazy_hcall3(LHCALL_SET_PTE, lguest_data.pgdir, addr, 0);
   }
   
   /* This is what happens after the Guest has removed a large number of entries.
@@@ -550,7 -569,7 +575,7 @@@
    * have changed, ie. virtual addresses below PAGE_OFFSET. */
   static void lguest_flush_tlb_user(void)
   {
-       lazy_hcall(LHCALL_FLUSH_TLB, 0, 0, 0);
+       lazy_hcall1(LHCALL_FLUSH_TLB, 0);
   }
   
   /* This is called when the kernel page tables have changed.  That's not very
@@@ -558,7 -577,7 +583,7 @@@
    * slow), so it's worth separating this from the user flushing above. */
   static void lguest_flush_tlb_kernel(void)
   {
-       lazy_hcall(LHCALL_FLUSH_TLB, 1, 0, 0);
+       lazy_hcall1(LHCALL_FLUSH_TLB, 1);
   }
   
   /*
@@@ -695,7 -714,7 +720,7 @@@ static int lguest_clockevent_set_next_e
         }
   
         /* Please wake us this far in the future. */
-       hcall(LHCALL_SET_CLOCKEVENT, delta, 0, 0);
+       kvm_hypercall1(LHCALL_SET_CLOCKEVENT, delta);
         return 0;
   }
   
@@@ -706,7 -725,7 +731,7 @@@ static void lguest_clockevent_set_mode(
         case CLOCK_EVT_MODE_UNUSED:
         case CLOCK_EVT_MODE_SHUTDOWN:
                 /* A 0 argument shuts the clock down. */
-               hcall(LHCALL_SET_CLOCKEVENT, 0, 0, 0);
+               kvm_hypercall0(LHCALL_SET_CLOCKEVENT);
                 break;
         case CLOCK_EVT_MODE_ONESHOT:
                 /* This is what we expect. */
@@@ -781,8 -800,8 +806,8 @@@ static void lguest_time_init(void
   static void lguest_load_sp0(struct tss_struct *tss,
                             struct thread_struct *thread)
   {
-       lazy_hcall(LHCALL_SET_STACK, __KERNEL_DS|0x1, thread->sp0,
-                  THREAD_SIZE/PAGE_SIZE);
+       lazy_hcall3(LHCALL_SET_STACK, __KERNEL_DS | 0x1, thread->sp0,
+                  THREAD_SIZE / PAGE_SIZE);
   }
   
   /* Let's just say, I wouldn't do debugging under a Guest. */
@@@ -855,7 -874,7 +880,7 @@@ static void set_lguest_basic_apic_ops(v
   /* STOP!  Until an interrupt comes in. */
   static void lguest_safe_halt(void)
   {
-       hcall(LHCALL_HALT, 0, 0, 0);
+       kvm_hypercall0(LHCALL_HALT);
   }
   
   /* The SHUTDOWN hypercall takes a string to describe what's happening, and
@@@ -865,7 -884,8 +890,8 @@@
    * rather than virtual addresses, so we use __pa() here. */
   static void lguest_power_off(void)
   {
-       hcall(LHCALL_SHUTDOWN, __pa("Power down"), LGUEST_SHUTDOWN_POWEROFF, 0);
+       kvm_hypercall2(LHCALL_SHUTDOWN, __pa("Power down"),
+                                       LGUEST_SHUTDOWN_POWEROFF);
   }
   
   /*
@@@ -875,7 -895,7 +901,7 @@@
    */
   static int lguest_panic(struct notifier_block *nb, unsigned long l, void *p)
   {
-       hcall(LHCALL_SHUTDOWN, __pa(p), LGUEST_SHUTDOWN_POWEROFF, 0);
+       kvm_hypercall2(LHCALL_SHUTDOWN, __pa(p), LGUEST_SHUTDOWN_POWEROFF);
         /* The hcall won't return, but to keep gcc happy, we're "done". */
         return NOTIFY_DONE;
   }
@@@ -916,7 -936,7 +942,7 @@@ static __init int early_put_chars(u32 v
                 len = sizeof(scratch) - 1;
         scratch[len] = '\0';
         memcpy(scratch, buf, len);
-       hcall(LHCALL_NOTIFY, __pa(scratch), 0, 0);
+       kvm_hypercall1(LHCALL_NOTIFY, __pa(scratch));
   
         /* This routine returns the number of bytes actually written. */
         return len;
@@@ -926,7 -946,7 +952,7 @@@
    * Launcher to reboot us. */
   static void lguest_restart(char *reason)
   {
-       hcall(LHCALL_SHUTDOWN, __pa(reason), LGUEST_SHUTDOWN_RESTART, 0);
+       kvm_hypercall2(LHCALL_SHUTDOWN, __pa(reason), LGUEST_SHUTDOWN_RESTART);
   }
   
   /*G:050
@@@ -1031,8 -1051,8 +1057,8 @@@ __init void lguest_init(void
         pv_cpu_ops.write_gdt_entry = lguest_write_gdt_entry;
         pv_cpu_ops.write_idt_entry = lguest_write_idt_entry;
         pv_cpu_ops.wbinvd = lguest_wbinvd;
- -      pv_cpu_ops.lazy_mode.enter = paravirt_enter_lazy_cpu;
- -      pv_cpu_ops.lazy_mode.leave = lguest_leave_lazy_mode;
+ +      pv_cpu_ops.start_context_switch = paravirt_start_context_switch;
+ +      pv_cpu_ops.end_context_switch = lguest_end_context_switch;
   
         /* pagetable management */
         pv_mmu_ops.write_cr3 = lguest_write_cr3;
@@@ -1045,7 -1065,9 +1071,9 @@@
         pv_mmu_ops.read_cr2 = lguest_read_cr2;
         pv_mmu_ops.read_cr3 = lguest_read_cr3;
         pv_mmu_ops.lazy_mode.enter = paravirt_enter_lazy_mmu;
- -      pv_mmu_ops.lazy_mode.leave = lguest_leave_lazy_mode;
+ +      pv_mmu_ops.lazy_mode.leave = lguest_leave_lazy_mmu_mode;
+       pv_mmu_ops.pte_update = lguest_pte_update;
+       pv_mmu_ops.pte_update_defer = lguest_pte_update;
   
   #ifdef CONFIG_X86_LOCAL_APIC
         /* apic read/write intercepts */
@@@ -1064,14 -1086,6 +1092,6 @@@
          * lguest_init() where the rest of the fairly chaotic boot setup
          * occurs. */
   
-       /* The native boot code sets up initial page tables immediately after
-        * the kernel itself, and sets init_pg_tables_end so they're not
-        * clobbered.  The Launcher places our initial pagetables somewhere at
-        * the top of our physical memory, so we don't need extra space: set
-        * init_pg_tables_end to the end of the kernel. */
-       init_pg_tables_start = __pa(pg0);
-       init_pg_tables_end = __pa(pg0);
- 
         /* As described in head_32.S, we map the first 128M of memory. */
         max_pfn_mapped = (128*1024*1024) >> PAGE_SHIFT;
   
diff --combined arch/x86/mm/highmem_32.c

index e81dfa4081578c839a8a1cb14f56061b1a3a4f3b,8126e8d1a2a4a789509cb49af563b6cbb76395ae..58f621e8191955c2e02016df1d8e99bec8e1ed8f
--- 1/arch/x86/mm/highmem_32.c
--- 2/arch/x86/mm/highmem_32.c
+++ b/arch/x86/mm/highmem_32.c
@@@ -19,49 -19,6 +19,6 @@@ void kunmap(struct page *page
         kunmap_high(page);
   }
   
- static void debug_kmap_atomic_prot(enum km_type type)
- {
- #ifdef CONFIG_DEBUG_HIGHMEM
-       static unsigned warn_count = 10;
- 
-       if (unlikely(warn_count == 0))
-               return;
- 
-       if (unlikely(in_interrupt())) {
-               if (in_irq()) {
-                       if (type != KM_IRQ0 && type != KM_IRQ1 &&
-                           type != KM_BIO_SRC_IRQ && type != KM_BIO_DST_IRQ &&
-                           type != KM_BOUNCE_READ) {
-                               WARN_ON(1);
-                               warn_count--;
-                       }
-               } else if (!irqs_disabled()) {  /* softirq */
-                       if (type != KM_IRQ0 && type != KM_IRQ1 &&
-                           type != KM_SOFTIRQ0 && type != KM_SOFTIRQ1 &&
-                           type != KM_SKB_SUNRPC_DATA &&
-                           type != KM_SKB_DATA_SOFTIRQ &&
-                           type != KM_BOUNCE_READ) {
-                               WARN_ON(1);
-                               warn_count--;
-                       }
-               }
-       }
- 
-       if (type == KM_IRQ0 || type == KM_IRQ1 || type == KM_BOUNCE_READ ||
-                       type == KM_BIO_SRC_IRQ || type == KM_BIO_DST_IRQ) {
-               if (!irqs_disabled()) {
-                       WARN_ON(1);
-                       warn_count--;
-               }
-       } else if (type == KM_SOFTIRQ0 || type == KM_SOFTIRQ1) {
-               if (irq_count() == 0 && !irqs_disabled()) {
-                       WARN_ON(1);
-                       warn_count--;
-               }
-       }
- #endif
- }
- 
   /*
    * kmap_atomic/kunmap_atomic is significantly faster than kmap/kunmap because
    * no global lock is needed and because the kmap code must perform a global TLB
@@@ -81,12 -38,13 +38,12 @@@ void *kmap_atomic_prot(struct page *pag
         if (!PageHighMem(page))
                 return page_address(page);
   
-       debug_kmap_atomic_prot(type);
+       debug_kmap_atomic(type);
   
         idx = type + KM_TYPE_NR*smp_processor_id();
         vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
         BUG_ON(!pte_none(*(kmap_pte-idx)));
         set_pte(kmap_pte-idx, mk_pte(page, prot));
- -      arch_flush_lazy_mmu_mode();
   
         return (void *)vaddr;
   }
@@@ -116,25 -74,17 +73,16 @@@ void kunmap_atomic(void *kvaddr, enum k
   #endif
         }
   
- -      arch_flush_lazy_mmu_mode();
         pagefault_enable();
   }
   
- /* This is the same as kmap_atomic() but can map memory that doesn't
+ /*
+  * This is the same as kmap_atomic() but can map memory that doesn't
    * have a struct page associated with it.
    */
   void *kmap_atomic_pfn(unsigned long pfn, enum km_type type)
   {
-       enum fixed_addresses idx;
-       unsigned long vaddr;
- 
-       pagefault_disable();
- 
-       idx = type + KM_TYPE_NR*smp_processor_id();
-       vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
-       set_pte(kmap_pte-idx, pfn_pte(pfn, kmap_prot));
-       arch_flush_lazy_mmu_mode();
- 
-       return (void*) vaddr;
+       return kmap_atomic_prot_pfn(pfn, type, kmap_prot);
   }
   EXPORT_SYMBOL_GPL(kmap_atomic_pfn); /* temporarily in use by i915 GEM until vmap */
   
@@@ -156,7 -106,6 +104,6 @@@ EXPORT_SYMBOL(kunmap)
   EXPORT_SYMBOL(kmap_atomic);
   EXPORT_SYMBOL(kunmap_atomic);
   
- #ifdef CONFIG_NUMA
   void __init set_highmem_pages_init(void)
   {
         struct zone *zone;
@@@ -180,11 -129,3 +127,3 @@@
         }
         totalram_pages += totalhigh_pages;
   }
- #else
- void __init set_highmem_pages_init(void)
- {
-       add_highpages_with_active_regions(0, highstart_pfn, highend_pfn);
- 
-       totalram_pages += totalhigh_pages;
- }
- #endif /* CONFIG_NUMA */
diff --combined arch/x86/mm/iomap_32.c

index b6a61f3d7ef828a3c03de42454382895faa996e6,8056545e2d39f9b53ba56349db4717809d6b9f04..fe6f84ca121ee072d2be8014e2b9b7e959e5abbd
--- 1/arch/x86/mm/iomap_32.c
--- 2/arch/x86/mm/iomap_32.c
+++ b/arch/x86/mm/iomap_32.c
@@@ -19,10 -19,11 +19,11 @@@
   #include <asm/iomap.h>
   #include <asm/pat.h>
   #include <linux/module.h>
+ #include <linux/highmem.h>
   
   int is_io_mapping_possible(resource_size_t base, unsigned long size)
   {
- #ifndef CONFIG_X86_PAE
+ #if !defined(CONFIG_X86_PAE) && defined(CONFIG_PHYS_ADDR_T_64BIT)
         /* There is no way to map greater than 1 << 32 address without PAE */
         if (base + size > 0x100000000ULL)
                 return 0;
@@@ -31,16 -32,28 +32,28 @@@
   }
   EXPORT_SYMBOL_GPL(is_io_mapping_possible);
   
- /* Map 'pfn' using fixed map 'type' and protections 'prot'
-  */
- void *
- iomap_atomic_prot_pfn(unsigned long pfn, enum km_type type, pgprot_t prot)
+ void *kmap_atomic_prot_pfn(unsigned long pfn, enum km_type type, pgprot_t prot)
   {
         enum fixed_addresses idx;
         unsigned long vaddr;
   
         pagefault_disable();
   
+       debug_kmap_atomic(type);
+       idx = type + KM_TYPE_NR * smp_processor_id();
+       vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
+       set_pte(kmap_pte - idx, pfn_pte(pfn, prot));
+       arch_flush_lazy_mmu_mode();
+ 
+       return (void *)vaddr;
+ }
+ 
+ /*
+  * Map 'pfn' using fixed map 'type' and protections 'prot'
+  */
+ void *
+ iomap_atomic_prot_pfn(unsigned long pfn, enum km_type type, pgprot_t prot)
+ {
         /*
          * For non-PAT systems, promote PAGE_KERNEL_WC to PAGE_KERNEL_UC_MINUS.
          * PAGE_KERNEL_WC maps to PWT, which translates to uncached if the
@@@ -50,12 -63,7 +63,7 @@@
         if (!pat_enabled && pgprot_val(prot) == pgprot_val(PAGE_KERNEL_WC))
                 prot = PAGE_KERNEL_UC_MINUS;
   
-       idx = type + KM_TYPE_NR*smp_processor_id();
-       vaddr = __fix_to_virt(FIX_KMAP_BEGIN + idx);
-       set_pte(kmap_pte-idx, pfn_pte(pfn, prot));
-       arch_flush_lazy_mmu_mode();
- 
-       return (void*) vaddr;
+       return kmap_atomic_prot_pfn(pfn, type, prot);
   }
   EXPORT_SYMBOL_GPL(iomap_atomic_prot_pfn);
   
@@@ -74,6 -82,7 +82,6 @@@ iounmap_atomic(void *kvaddr, enum km_ty
         if (vaddr == __fix_to_virt(FIX_KMAP_BEGIN+idx))
                 kpte_clear_flush(kmap_pte-idx, vaddr);
   
- -      arch_flush_lazy_mmu_mode();
         pagefault_enable();
   }
   EXPORT_SYMBOL_GPL(iounmap_atomic);
diff --combined arch/x86/mm/pageattr.c

index 9015e5e412b51c59450d6dad805fd79ecd0d1389,d71e1b636ce69167515c0a6bd3b47d3807b49175..660cac75ae11e489e2d443bee8d9a78d37eb8178
--- 1/arch/x86/mm/pageattr.c
--- 2/arch/x86/mm/pageattr.c
+++ b/arch/x86/mm/pageattr.c
@@@ -16,6 -16,7 +16,7 @@@
   #include <asm/processor.h>
   #include <asm/tlbflush.h>
   #include <asm/sections.h>
+ #include <asm/setup.h>
   #include <asm/uaccess.h>
   #include <asm/pgalloc.h>
   #include <asm/proto.h>
@@@ -33,6 -34,7 +34,7 @@@ struct cpa_data 
         unsigned long   pfn;
         unsigned        force_split : 1;
         int             curpage;
+       struct page     **pages;
   };
   
   /*
@@@ -45,6 -47,7 +47,7 @@@ static DEFINE_SPINLOCK(cpa_lock)
   
   #define CPA_FLUSHTLB 1
   #define CPA_ARRAY 2
+ #define CPA_PAGES_ARRAY 4
   
   #ifdef CONFIG_PROC_FS
   static unsigned long direct_pages_count[PG_LEVEL_NUM];
@@@ -95,7 -98,7 +98,7 @@@ static inline unsigned long highmap_sta
   
   static inline unsigned long highmap_end_pfn(void)
   {
-       return __pa(roundup((unsigned long)_end, PMD_SIZE)) >> PAGE_SHIFT;
+       return __pa(roundup(_brk_end, PMD_SIZE)) >> PAGE_SHIFT;
   }
   
   #endif
@@@ -201,10 -204,10 +204,10 @@@ static void cpa_flush_range(unsigned lo
         }
   }
   
- static void cpa_flush_array(unsigned long *start, int numpages, int cache)
+ static void cpa_flush_array(unsigned long *start, int numpages, int cache,
+                           int in_flags, struct page **pages)
   {
         unsigned int i, level;
-       unsigned long *addr;
   
         BUG_ON(irqs_disabled());
   
@@@ -225,14 -228,22 +228,22 @@@
          * will cause all other CPUs to flush the same
          * cachelines:
          */
-       for (i = 0, addr = start; i < numpages; i++, addr++) {
-               pte_t *pte = lookup_address(*addr, &level);
+       for (i = 0; i < numpages; i++) {
+               unsigned long addr;
+               pte_t *pte;
+ 
+               if (in_flags & CPA_PAGES_ARRAY)
+                       addr = (unsigned long)page_address(pages[i]);
+               else
+                       addr = start[i];
+ 
+               pte = lookup_address(addr, &level);
   
                 /*
                  * Only flush present addresses:
                  */
                 if (pte && (pte_val(*pte) & _PAGE_PRESENT))
-                       clflush_cache_range((void *) *addr, PAGE_SIZE);
+                       clflush_cache_range((void *)addr, PAGE_SIZE);
         }
   }
   
@@@ -584,7 -595,9 +595,9 @@@ static int __change_page_attr(struct cp
         unsigned int level;
         pte_t *kpte, old_pte;
   
-       if (cpa->flags & CPA_ARRAY)
+       if (cpa->flags & CPA_PAGES_ARRAY)
+               address = (unsigned long)page_address(cpa->pages[cpa->curpage]);
+       else if (cpa->flags & CPA_ARRAY)
                 address = cpa->vaddr[cpa->curpage];
         else
                 address = *cpa->vaddr;
@@@ -687,7 -700,9 +700,9 @@@ static int cpa_process_alias(struct cpa
          * No need to redo, when the primary call touched the direct
          * mapping already:
          */
-       if (cpa->flags & CPA_ARRAY)
+       if (cpa->flags & CPA_PAGES_ARRAY)
+               vaddr = (unsigned long)page_address(cpa->pages[cpa->curpage]);
+       else if (cpa->flags & CPA_ARRAY)
                 vaddr = cpa->vaddr[cpa->curpage];
         else
                 vaddr = *cpa->vaddr;
@@@ -698,7 -713,7 +713,7 @@@
                 alias_cpa = *cpa;
                 temp_cpa_vaddr = (unsigned long) __va(cpa->pfn << PAGE_SHIFT);
                 alias_cpa.vaddr = &temp_cpa_vaddr;
-               alias_cpa.flags &= ~CPA_ARRAY;
+               alias_cpa.flags &= ~(CPA_PAGES_ARRAY | CPA_ARRAY);
   
   
                 ret = __change_page_attr_set_clr(&alias_cpa, 0);
@@@ -711,7 -726,7 +726,7 @@@
          * No need to redo, when the primary call touched the high
          * mapping already:
          */
-       if (within(vaddr, (unsigned long) _text, (unsigned long) _end))
+       if (within(vaddr, (unsigned long) _text, _brk_end))
                 return 0;
   
         /*
@@@ -724,7 -739,7 +739,7 @@@
         alias_cpa = *cpa;
         temp_cpa_vaddr = (cpa->pfn << PAGE_SHIFT) + __START_KERNEL_map - phys_base;
         alias_cpa.vaddr = &temp_cpa_vaddr;
-       alias_cpa.flags &= ~CPA_ARRAY;
+       alias_cpa.flags &= ~(CPA_PAGES_ARRAY | CPA_ARRAY);
   
         /*
          * The high mapping range is imprecise, so ignore the return value.
@@@ -745,7 -760,7 +760,7 @@@ static int __change_page_attr_set_clr(s
                  */
                 cpa->numpages = numpages;
                 /* for array changes, we can't use large page */
-               if (cpa->flags & CPA_ARRAY)
+               if (cpa->flags & (CPA_ARRAY | CPA_PAGES_ARRAY))
                         cpa->numpages = 1;
   
                 if (!debug_pagealloc)
@@@ -769,7 -784,7 +784,7 @@@
                  */
                 BUG_ON(cpa->numpages > numpages);
                 numpages -= cpa->numpages;
-               if (cpa->flags & CPA_ARRAY)
+               if (cpa->flags & (CPA_PAGES_ARRAY | CPA_ARRAY))
                         cpa->curpage++;
                 else
                         *cpa->vaddr += cpa->numpages * PAGE_SIZE;
@@@ -786,7 -801,8 +801,8 @@@ static inline int cache_attr(pgprot_t a
   
   static int change_page_attr_set_clr(unsigned long *addr, int numpages,
                                     pgprot_t mask_set, pgprot_t mask_clr,
-                                   int force_split, int array)
+                                   int force_split, int in_flag,
+                                   struct page **pages)
   {
         struct cpa_data cpa;
         int ret, cache, checkalias;
@@@ -801,15 -817,7 +817,7 @@@
                 return 0;
   
         /* Ensure we are PAGE_SIZE aligned */
-       if (!array) {
-               if (*addr & ~PAGE_MASK) {
-                       *addr &= PAGE_MASK;
-                       /*
-                        * People should not be passing in unaligned addresses:
-                        */
-                       WARN_ON_ONCE(1);
-               }
-       } else {
+       if (in_flag & CPA_ARRAY) {
                 int i;
                 for (i = 0; i < numpages; i++) {
                         if (addr[i] & ~PAGE_MASK) {
@@@ -817,6 -825,18 +825,18 @@@
                                 WARN_ON_ONCE(1);
                         }
                 }
+       } else if (!(in_flag & CPA_PAGES_ARRAY)) {
+               /*
+                * in_flag of CPA_PAGES_ARRAY implies it is aligned.
+                * No need to cehck in that case
+                */
+               if (*addr & ~PAGE_MASK) {
+                       *addr &= PAGE_MASK;
+                       /*
+                        * People should not be passing in unaligned addresses:
+                        */
+                       WARN_ON_ONCE(1);
+               }
         }
   
         /* Must avoid aliasing mappings in the highmem code */
@@@ -824,7 -844,15 +844,8 @@@
   
         vm_unmap_aliases();
   
- -      /*
- -       * If we're called with lazy mmu updates enabled, the
- -       * in-memory pte state may be stale.  Flush pending updates to
- -       * bring them up to date.
- -       */
- -      arch_flush_lazy_mmu_mode();
- -
         cpa.vaddr = addr;
+       cpa.pages = pages;
         cpa.numpages = numpages;
         cpa.mask_set = mask_set;
         cpa.mask_clr = mask_clr;
@@@ -832,8 -860,8 +853,8 @@@
         cpa.curpage = 0;
         cpa.force_split = force_split;
   
-       if (array)
-               cpa.flags |= CPA_ARRAY;
+       if (in_flag & (CPA_ARRAY | CPA_PAGES_ARRAY))
+               cpa.flags |= in_flag;
   
         /* No alias checking for _NX bit modifications */
         checkalias = (pgprot_val(mask_set) | pgprot_val(mask_clr)) != _PAGE_NX;
@@@ -859,13 -887,21 +880,14 @@@
          * wbindv):
          */
         if (!ret && cpu_has_clflush) {
-               if (cpa.flags & CPA_ARRAY)
-                       cpa_flush_array(addr, numpages, cache);
-               else
+               if (cpa.flags & (CPA_PAGES_ARRAY | CPA_ARRAY)) {
+                       cpa_flush_array(addr, numpages, cache,
+                                       cpa.flags, pages);
+               } else
                         cpa_flush_range(*addr, numpages, cache);
         } else
                 cpa_flush_all(cache);
   
- -      /*
- -       * If we've been called with lazy mmu updates enabled, then
- -       * make sure that everything gets flushed out before we
- -       * return.
- -       */
- -      arch_flush_lazy_mmu_mode();
- -
   out:
         return ret;
   }
@@@ -874,14 -910,28 +896,28 @@@ static inline int change_page_attr_set(
                                        pgprot_t mask, int array)
   {
         return change_page_attr_set_clr(addr, numpages, mask, __pgprot(0), 0,
-               array);
+               (array ? CPA_ARRAY : 0), NULL);
   }
   
   static inline int change_page_attr_clear(unsigned long *addr, int numpages,
                                          pgprot_t mask, int array)
   {
         return change_page_attr_set_clr(addr, numpages, __pgprot(0), mask, 0,
-               array);
+               (array ? CPA_ARRAY : 0), NULL);
+ }
+ 
+ static inline int cpa_set_pages_array(struct page **pages, int numpages,
+                                      pgprot_t mask)
+ {
+       return change_page_attr_set_clr(NULL, numpages, mask, __pgprot(0), 0,
+               CPA_PAGES_ARRAY, pages);
+ }
+ 
+ static inline int cpa_clear_pages_array(struct page **pages, int numpages,
+                                        pgprot_t mask)
+ {
+       return change_page_attr_set_clr(NULL, numpages, __pgprot(0), mask, 0,
+               CPA_PAGES_ARRAY, pages);
   }
   
   int _set_memory_uc(unsigned long addr, int numpages)
@@@ -1029,7 -1079,7 +1065,7 @@@ int set_memory_np(unsigned long addr, i
   int set_memory_4k(unsigned long addr, int numpages)
   {
         return change_page_attr_set_clr(&addr, numpages, __pgprot(0),
-                                       __pgprot(0), 1, 0);
+                                       __pgprot(0), 1, 0, NULL);
   }
   
   int set_pages_uc(struct page *page, int numpages)
@@@ -1040,6 -1090,35 +1076,35 @@@
   }
   EXPORT_SYMBOL(set_pages_uc);
   
+ int set_pages_array_uc(struct page **pages, int addrinarray)
+ {
+       unsigned long start;
+       unsigned long end;
+       int i;
+       int free_idx;
+ 
+       for (i = 0; i < addrinarray; i++) {
+               start = (unsigned long)page_address(pages[i]);
+               end = start + PAGE_SIZE;
+               if (reserve_memtype(start, end, _PAGE_CACHE_UC_MINUS, NULL))
+                       goto err_out;
+       }
+ 
+       if (cpa_set_pages_array(pages, addrinarray,
+                       __pgprot(_PAGE_CACHE_UC_MINUS)) == 0) {
+               return 0; /* Success */
+       }
+ err_out:
+       free_idx = i;
+       for (i = 0; i < free_idx; i++) {
+               start = (unsigned long)page_address(pages[i]);
+               end = start + PAGE_SIZE;
+               free_memtype(start, end);
+       }
+       return -EINVAL;
+ }
+ EXPORT_SYMBOL(set_pages_array_uc);
+ 
   int set_pages_wb(struct page *page, int numpages)
   {
         unsigned long addr = (unsigned long)page_address(page);
@@@ -1048,6 -1127,26 +1113,26 @@@
   }
   EXPORT_SYMBOL(set_pages_wb);
   
+ int set_pages_array_wb(struct page **pages, int addrinarray)
+ {
+       int retval;
+       unsigned long start;
+       unsigned long end;
+       int i;
+ 
+       retval = cpa_clear_pages_array(pages, addrinarray,
+                       __pgprot(_PAGE_CACHE_MASK));
+ 
+       for (i = 0; i < addrinarray; i++) {
+               start = (unsigned long)page_address(pages[i]);
+               end = start + PAGE_SIZE;
+               free_memtype(start, end);
+       }
+ 
+       return retval;
+ }
+ EXPORT_SYMBOL(set_pages_array_wb);
+ 
   int set_pages_x(struct page *page, int numpages)
   {
         unsigned long addr = (unsigned long)page_address(page);
diff --combined arch/x86/xen/mmu.c

index e425a32e0a9084404977f9d2ff474be7ace0aa0c,db3802fb7b8470082aac4ba2884e6a588bda694d..77b242c9a11ed57f86b3aa97268d16d3785c8b39
--- 1/arch/x86/xen/mmu.c
--- 2/arch/x86/xen/mmu.c
+++ b/arch/x86/xen/mmu.c
@@@ -184,7 -184,7 +184,7 @@@ static inline unsigned p2m_index(unsign
   }
   
   /* Build the parallel p2m_top_mfn structures */
- -void xen_setup_mfn_list_list(void)
+ +static void __init xen_build_mfn_list_list(void)
   {
         unsigned pfn, idx;
   
@@@ -198,10 -198,7 +198,10 @@@
                 unsigned topidx = idx * P2M_ENTRIES_PER_PAGE;
                 p2m_top_mfn_list[idx] = virt_to_mfn(&p2m_top_mfn[topidx]);
         }
+ +}
   
+ +void xen_setup_mfn_list_list(void)
+ +{
         BUG_ON(HYPERVISOR_shared_info == &xen_dummy_shared_info);
   
         HYPERVISOR_shared_info->arch.pfn_to_mfn_frame_list_list =
@@@ -221,8 -218,6 +221,8 @@@ void __init xen_build_dynamic_phys_to_m
   
                 p2m_top[topidx] = &mfn_list[pfn];
         }
+ +
+ +      xen_build_mfn_list_list();
   }
   
   unsigned long get_phys_to_machine(unsigned long pfn)
@@@ -238,74 -233,47 +238,74 @@@
   }
   EXPORT_SYMBOL_GPL(get_phys_to_machine);
   
- -static void alloc_p2m(unsigned long **pp, unsigned long *mfnp)
+ +/* install a  new p2m_top page */
+ +bool install_p2mtop_page(unsigned long pfn, unsigned long *p)
   {
- -      unsigned long *p;
+ +      unsigned topidx = p2m_top_index(pfn);
+ +      unsigned long **pfnp, *mfnp;
         unsigned i;
   
- -      p = (void *)__get_free_page(GFP_KERNEL | __GFP_NOFAIL);
- -      BUG_ON(p == NULL);
+ +      pfnp = &p2m_top[topidx];
+ +      mfnp = &p2m_top_mfn[topidx];
   
         for (i = 0; i < P2M_ENTRIES_PER_PAGE; i++)
                 p[i] = INVALID_P2M_ENTRY;
   
- -      if (cmpxchg(pp, p2m_missing, p) != p2m_missing)
- -              free_page((unsigned long)p);
- -      else
+ +      if (cmpxchg(pfnp, p2m_missing, p) == p2m_missing) {
                 *mfnp = virt_to_mfn(p);
+ +              return true;
+ +      }
+ +
+ +      return false;
   }
   
- -void set_phys_to_machine(unsigned long pfn, unsigned long mfn)
+ +static void alloc_p2m(unsigned long pfn)
   {
- -      unsigned topidx, idx;
+ +      unsigned long *p;
   
- -      if (unlikely(xen_feature(XENFEAT_auto_translated_physmap))) {
- -              BUG_ON(pfn != mfn && mfn != INVALID_P2M_ENTRY);
- -              return;
- -      }
+ +      p = (void *)__get_free_page(GFP_KERNEL | __GFP_NOFAIL);
+ +      BUG_ON(p == NULL);
+ +
+ +      if (!install_p2mtop_page(pfn, p))
+ +              free_page((unsigned long)p);
+ +}
+ +
+ +/* Try to install p2m mapping; fail if intermediate bits missing */
+ +bool __set_phys_to_machine(unsigned long pfn, unsigned long mfn)
+ +{
+ +      unsigned topidx, idx;
   
         if (unlikely(pfn >= MAX_DOMAIN_PAGES)) {
                 BUG_ON(mfn != INVALID_P2M_ENTRY);
- -              return;
+ +              return true;
         }
   
         topidx = p2m_top_index(pfn);
         if (p2m_top[topidx] == p2m_missing) {
- -              /* no need to allocate a page to store an invalid entry */
                 if (mfn == INVALID_P2M_ENTRY)
- -                      return;
- -              alloc_p2m(&p2m_top[topidx], &p2m_top_mfn[topidx]);
+ +                      return true;
+ +              return false;
         }
   
         idx = p2m_index(pfn);
         p2m_top[topidx][idx] = mfn;
+ +
+ +      return true;
+ +}
+ +
+ +void set_phys_to_machine(unsigned long pfn, unsigned long mfn)
+ +{
+ +      if (unlikely(xen_feature(XENFEAT_auto_translated_physmap))) {
+ +              BUG_ON(pfn != mfn && mfn != INVALID_P2M_ENTRY);
+ +              return;
+ +      }
+ +
+ +      if (unlikely(!__set_phys_to_machine(pfn, mfn)))  {
+ +              alloc_p2m(pfn);
+ +
+ +              if (!__set_phys_to_machine(pfn, mfn))
+ +                      BUG();
+ +      }
   }
   
   unsigned long arbitrary_virt_to_mfn(void *vaddr)
@@@ -451,6 -419,10 +451,6 @@@ void set_pte_mfn(unsigned long vaddr, u
   void xen_set_pte_at(struct mm_struct *mm, unsigned long addr,
                     pte_t *ptep, pte_t pteval)
   {
- -      /* updates to init_mm may be done without lock */
- -      if (mm == &init_mm)
- -              preempt_disable();
- -
         ADD_STATS(set_pte_at, 1);
   //    ADD_STATS(set_pte_at_pinned, xen_page_pinned(ptep));
         ADD_STATS(set_pte_at_current, mm == current->mm);
@@@ -471,7 -443,9 +471,7 @@@
         }
         xen_set_pte(ptep, pteval);
   
- -out:
- -      if (mm == &init_mm)
- -              preempt_enable();
+ +out:  return;
   }
   
   pte_t xen_ptep_modify_prot_start(struct mm_struct *mm,
@@@ -1013,7 -987,7 +1013,7 @@@ static __init int xen_mark_pinned(struc
         return 0;
   }
   
- -void __init xen_mark_init_mm_pinned(void)
+ +static void __init xen_mark_init_mm_pinned(void)
   {
         xen_pgd_walk(&init_mm, xen_mark_pinned, FIXADDR_TOP);
   }
@@@ -1145,8 -1119,10 +1145,8 @@@ static void drop_other_mm_ref(void *inf
   
         /* If this cpu still has a stale cr3 reference, then make sure
            it has been flushed. */
- -      if (percpu_read(xen_current_cr3) == __pa(mm->pgd)) {
+ +      if (percpu_read(xen_current_cr3) == __pa(mm->pgd))
                 load_cr3(swapper_pg_dir);
- -              arch_flush_lazy_cpu_mode();
- -      }
   }
   
   static void xen_drop_mm_ref(struct mm_struct *mm)
@@@ -1159,6 -1135,7 +1159,6 @@@
                         load_cr3(swapper_pg_dir);
                 else
                         leave_mm(smp_processor_id());
- -              arch_flush_lazy_cpu_mode();
         }
   
         /* Get the "official" set of cpus referring to our pagetable. */
@@@ -1293,8 -1270,8 +1293,8 @@@ static void xen_flush_tlb_others(const 
         } *args;
         struct multicall_space mcs;
   
- -      BUG_ON(cpumask_empty(cpus));
- -      BUG_ON(!mm);
+ +      if (cpumask_empty(cpus))
+ +              return;         /* nothing to do */
   
         mcs = xen_mc_entry(sizeof(*args));
         args = mcs.args;
@@@ -1461,29 -1438,10 +1461,29 @@@ static __init void xen_set_pte_init(pte
   }
   #endif
   
+ +static void pin_pagetable_pfn(unsigned cmd, unsigned long pfn)
+ +{
+ +      struct mmuext_op op;
+ +      op.cmd = cmd;
+ +      op.arg1.mfn = pfn_to_mfn(pfn);
+ +      if (HYPERVISOR_mmuext_op(&op, 1, NULL, DOMID_SELF))
+ +              BUG();
+ +}
+ +
   /* Early in boot, while setting up the initial pagetable, assume
      everything is pinned. */
   static __init void xen_alloc_pte_init(struct mm_struct *mm, unsigned long pfn)
   {
+ +#ifdef CONFIG_FLATMEM
+ +      BUG_ON(mem_map);        /* should only be used early */
+ +#endif
+ +      make_lowmem_page_readonly(__va(PFN_PHYS(pfn)));
+ +      pin_pagetable_pfn(MMUEXT_PIN_L1_TABLE, pfn);
+ +}
+ +
+ +/* Used for pmd and pud */
+ +static __init void xen_alloc_pmd_init(struct mm_struct *mm, unsigned long pfn)
+ +{
   #ifdef CONFIG_FLATMEM
         BUG_ON(mem_map);        /* should only be used early */
   #endif
@@@ -1492,15 -1450,18 +1492,15 @@@
   
   /* Early release_pte assumes that all pts are pinned, since there's
      only init_mm and anything attached to that is pinned. */
- -static void xen_release_pte_init(unsigned long pfn)
+ +static __init void xen_release_pte_init(unsigned long pfn)
   {
+ +      pin_pagetable_pfn(MMUEXT_UNPIN_TABLE, pfn);
         make_lowmem_page_readwrite(__va(PFN_PHYS(pfn)));
   }
   
- -static void pin_pagetable_pfn(unsigned cmd, unsigned long pfn)
+ +static __init void xen_release_pmd_init(unsigned long pfn)
   {
- -      struct mmuext_op op;
- -      op.cmd = cmd;
- -      op.arg1.mfn = pfn_to_mfn(pfn);
- -      if (HYPERVISOR_mmuext_op(&op, 1, NULL, DOMID_SELF))
- -              BUG();
+ +      make_lowmem_page_readwrite(__va(PFN_PHYS(pfn)));
   }
   
   /* This needs to make sure the new pte page is pinned iff its being
@@@ -1762,9 -1723,9 +1762,9 @@@ __init pgd_t *xen_setup_kernel_pagetabl
   {
         pmd_t *kernel_pmd;
   
-       init_pg_tables_start = __pa(pgd);
-       init_pg_tables_end = __pa(pgd) + xen_start_info->nr_pt_frames*PAGE_SIZE;
-       max_pfn_mapped = PFN_DOWN(init_pg_tables_end + 512*1024);
+       max_pfn_mapped = PFN_DOWN(__pa(xen_start_info->pt_base) +
+                                 xen_start_info->nr_pt_frames * PAGE_SIZE +
+                                 512*1024);
   
         kernel_pmd = m2v(pgd[KERNEL_PGD_BOUNDARY].pgd);
         memcpy(level2_kernel_pgt, kernel_pmd, sizeof(pmd_t) * PTRS_PER_PMD);
@@@ -1858,13 -1819,6 +1858,13 @@@ __init void xen_post_allocator_init(voi
         xen_mark_init_mm_pinned();
   }
   
+ +static void xen_leave_lazy_mmu(void)
+ +{
+ +      preempt_disable();
+ +      xen_mc_flush();
+ +      paravirt_leave_lazy_mmu();
+ +      preempt_enable();
+ +}
   
   const struct pv_mmu_ops xen_mmu_ops __initdata = {
         .pagetable_setup_start = xen_pagetable_setup_start,
@@@ -1889,9 -1843,9 +1889,9 @@@
   
         .alloc_pte = xen_alloc_pte_init,
         .release_pte = xen_release_pte_init,
- -      .alloc_pmd = xen_alloc_pte_init,
+ +      .alloc_pmd = xen_alloc_pmd_init,
         .alloc_pmd_clone = paravirt_nop,
- -      .release_pmd = xen_release_pte_init,
+ +      .release_pmd = xen_release_pmd_init,
   
   #ifdef CONFIG_HIGHPTE
         .kmap_atomic_pte = xen_kmap_atomic_pte,
@@@ -1916,7 -1870,6 +1916,6 @@@
   
   #ifdef CONFIG_X86_PAE
         .set_pte_atomic = xen_set_pte_atomic,
-       .set_pte_present = xen_set_pte_at,
         .pte_clear = xen_pte_clear,
         .pmd_clear = xen_pmd_clear,
   #endif        /* CONFIG_X86_PAE */
@@@ -1930,8 -1883,8 +1929,8 @@@
         .make_pud = PV_CALLEE_SAVE(xen_make_pud),
         .set_pgd = xen_set_pgd_hyper,
   
- -      .alloc_pud = xen_alloc_pte_init,
- -      .release_pud = xen_release_pte_init,
+ +      .alloc_pud = xen_alloc_pmd_init,
+ +      .release_pud = xen_release_pmd_init,
   #endif        /* PAGETABLE_LEVELS == 4 */
   
         .activate_mm = xen_activate_mm,
@@@ -1940,7 -1893,7 +1939,7 @@@
   
         .lazy_mode = {
                 .enter = paravirt_enter_lazy_mmu,
- -              .leave = xen_leave_lazy,
+ +              .leave = xen_leave_lazy_mmu,
         },
   
         .set_fixmap = xen_set_fixmap,
diff --combined arch/x86/xen/smp.c

index 304d832710cd53b95786625c19eed1d6389e7a83,585a6e330837ffb3a9e37d50be37f93e169832e1..429834ec1687d9b7de965027f3f8d1c862ea88cd
--- 1/arch/x86/xen/smp.c
--- 2/arch/x86/xen/smp.c
+++ b/arch/x86/xen/smp.c
@@@ -158,7 -158,7 +158,7 @@@ static void __init xen_fill_possible_ma
                 rc = HYPERVISOR_vcpu_op(VCPUOP_is_up, i, NULL);
                 if (rc >= 0) {
                         num_processors++;
-                       cpu_set(i, cpu_possible_map);
+                       set_cpu_possible(i, true);
                 }
         }
   }
@@@ -197,7 -197,7 +197,7 @@@ static void __init xen_smp_prepare_cpus
         while ((num_possible_cpus() > 1) && (num_possible_cpus() > max_cpus)) {
                 for (cpu = nr_cpu_ids - 1; !cpu_possible(cpu); cpu--)
                         continue;
-               cpu_clear(cpu, cpu_possible_map);
+               set_cpu_possible(cpu, false);
         }
   
         for_each_possible_cpu (cpu) {
@@@ -210,7 -210,7 +210,7 @@@
                 if (IS_ERR(idle))
                         panic("failed fork for CPU %d", cpu);
   
-               cpu_set(cpu, cpu_present_map);
+               set_cpu_present(cpu, true);
         }
   }
   
@@@ -317,7 -317,7 +317,7 @@@ static int __cpuinit xen_cpu_up(unsigne
         BUG_ON(rc);
   
         while(per_cpu(cpu_state, cpu) != CPU_ONLINE) {
- -              HYPERVISOR_sched_op(SCHEDOP_yield, 0);
+ +              HYPERVISOR_sched_op(SCHEDOP_yield, NULL);
                 barrier();
         }
   
@@@ -422,7 -422,7 +422,7 @@@ static void xen_smp_send_call_function_
         /* Make sure other vcpus get a chance to run if they need to. */
         for_each_cpu(cpu, mask) {
                 if (xen_vcpu_stolen(cpu)) {
- -                      HYPERVISOR_sched_op(SCHEDOP_yield, 0);
+ +                      HYPERVISOR_sched_op(SCHEDOP_yield, NULL);
                         break;
                 }
         }
diff --combined drivers/xen/Kconfig

index c0c490ea7d1bcead63196d2d3188bcc47da4ce86,8ac9cddac5754fdbf8ef9df33550a47bfba318f4..cab100acf983905b53d5c85b6ae76496d7b9b7c8
--- 1/drivers/xen/Kconfig
--- 2/drivers/xen/Kconfig
+++ b/drivers/xen/Kconfig
@@@ -18,16 -18,6 +18,16 @@@ config XEN_SCRUB_PAGE
           secure, but slightly less efficient.
           If in doubt, say yes.
   
+ +config XEN_DEV_EVTCHN
+ +      tristate "Xen /dev/xen/evtchn device"
+ +      depends on XEN
+ +      default y
+ +      help
+ +        The evtchn driver allows a userspace process to triger event
+ +        channels and to receive notification of an event channel
+ +        firing.
+ +        If in doubt, say yes.
+ +
   config XENFS
         tristate "Xen filesystem"
         depends on XEN
@@@ -47,17 -37,7 +47,17 @@@ config XEN_COMPAT_XENF
            The old xenstore userspace tools expect to find "xenbus"
            under /proc/xen, but "xenbus" is now found at the root of the
            xenfs filesystem.  Selecting this causes the kernel to create
-          the compatibilty mount point /proc/xen if it is running on
+          the compatibility mount point /proc/xen if it is running on
            a xen platform.
            If in doubt, say yes.
   
+ +config XEN_SYS_HYPERVISOR
+ +       bool "Create xen entries under /sys/hypervisor"
+ +       depends on XEN && SYSFS
+ +       select SYS_HYPERVISOR
+ +       default y
+ +       help
+ +         Create entries under /sys/hypervisor describing the Xen
+ +       hypervisor environment.  When running native or in another
+ +       virtual environment, /sys/hypervisor will still be present,
+ +       but will have no xen contents.
diff --combined drivers/xen/cpu_hotplug.c

index 411cb1fc92795b969ee3d3cf3f0d4ffdc7558e4c,5f54c01c156872100ab8e2bf9f1ad74e08152abc..bdfd584ad853ac379e0b3ed9975034e86faa27c4
--- 1/drivers/xen/cpu_hotplug.c
--- 2/drivers/xen/cpu_hotplug.c
+++ b/drivers/xen/cpu_hotplug.c
@@@ -10,7 -10,7 +10,7 @@@ static void enable_hotplug_cpu(int cpu
         if (!cpu_present(cpu))
                 arch_register_cpu(cpu);
   
-       cpu_set(cpu, cpu_present_map);
+       set_cpu_present(cpu, true);
   }
   
   static void disable_hotplug_cpu(int cpu)
@@@ -18,44 -18,32 +18,44 @@@
         if (cpu_present(cpu))
                 arch_unregister_cpu(cpu);
   
-       cpu_clear(cpu, cpu_present_map);
+       set_cpu_present(cpu, false);
   }
   
- -static void vcpu_hotplug(unsigned int cpu)
+ +static int vcpu_online(unsigned int cpu)
   {
         int err;
         char dir[32], state[32];
   
- -      if (!cpu_possible(cpu))
- -              return;
- -
         sprintf(dir, "cpu/%u", cpu);
         err = xenbus_scanf(XBT_NIL, dir, "availability", "%s", state);
         if (err != 1) {
                 printk(KERN_ERR "XENBUS: Unable to read cpu state\n");
- -              return;
+ +              return err;
         }
   
- -      if (strcmp(state, "online") == 0) {
+ +      if (strcmp(state, "online") == 0)
+ +              return 1;
+ +      else if (strcmp(state, "offline") == 0)
+ +              return 0;
+ +
+ +      printk(KERN_ERR "XENBUS: unknown state(%s) on CPU%d\n", state, cpu);
+ +      return -EINVAL;
+ +}
+ +static void vcpu_hotplug(unsigned int cpu)
+ +{
+ +      if (!cpu_possible(cpu))
+ +              return;
+ +
+ +      switch (vcpu_online(cpu)) {
+ +      case 1:
                 enable_hotplug_cpu(cpu);
- -      } else if (strcmp(state, "offline") == 0) {
+ +              break;
+ +      case 0:
                 (void)cpu_down(cpu);
                 disable_hotplug_cpu(cpu);
- -      } else {
- -              printk(KERN_ERR "XENBUS: unknown state(%s) on CPU%d\n",
- -                     state, cpu);
+ +              break;
+ +      default:
+ +              break;
         }
   }
   
@@@ -76,20 -64,12 +76,20 @@@ static void handle_vcpu_hotplug_event(s
   static int setup_cpu_watcher(struct notifier_block *notifier,
                               unsigned long event, void *data)
   {
+ +      int cpu;
         static struct xenbus_watch cpu_watch = {
                 .node = "cpu",
                 .callback = handle_vcpu_hotplug_event};
   
         (void)register_xenbus_watch(&cpu_watch);
   
+ +      for_each_possible_cpu(cpu) {
+ +              if (vcpu_online(cpu) == 0) {
+ +                      (void)cpu_down(cpu);
+ +                      cpu_clear(cpu, cpu_present_map);
+ +              }
+ +      }
+ +
         return NOTIFY_DONE;
   }
   
diff --combined drivers/xen/manage.c

index 5269bb4d2496930862605f1f664d311f97815b1f,0d61db1e7b49bc5f5fd095795e74001dadda1bc3..fddc2025dece777c513a7a7a72f8537751bf1834
--- 1/drivers/xen/manage.c
--- 2/drivers/xen/manage.c
+++ b/drivers/xen/manage.c
@@@ -39,12 -39,6 +39,6 @@@ static int xen_suspend(void *data
   
         BUG_ON(!irqs_disabled());
   
-       err = device_power_down(PMSG_SUSPEND);
-       if (err) {
-               printk(KERN_ERR "xen_suspend: device_power_down failed: %d\n",
-                      err);
-               return err;
-       }
         err = sysdev_suspend(PMSG_SUSPEND);
         if (err) {
                 printk(KERN_ERR "xen_suspend: sysdev_suspend failed: %d\n",
@@@ -68,15 -62,14 +62,15 @@@
         gnttab_resume();
         xen_mm_unpin_all();
   
- -      sysdev_resume();
- -
         if (!*cancelled) {
                 xen_irq_resume();
                 xen_console_resume();
                 xen_timer_resume();
         }
   
+ +      sysdev_resume();
+ +      device_power_up(PMSG_RESUME);
+ +
         return 0;
   }
   
@@@ -104,9 -97,16 +98,15 @@@ static void do_suspend(void
                 goto out;
         }
   
- -      printk("suspending xenbus...\n");
- -      /* XXX use normal device tree? */
- -      xenbus_suspend();
+ +      printk(KERN_DEBUG "suspending xenstore...\n");
+ +      xs_suspend();
   
+       err = device_power_down(PMSG_SUSPEND);
+       if (err) {
+               printk(KERN_ERR "device_power_down failed: %d\n", err);
+               goto resume_devices;
+       }
+ 
         err = stop_machine(xen_suspend, &cancelled, cpumask_of(0));
         if (err) {
                 printk(KERN_ERR "failed to start xen_suspend: %d\n", err);
@@@ -115,10 -115,13 +115,13 @@@
   
         if (!cancelled) {
                 xen_arch_resume();
- -              xenbus_resume();
+ +              xs_resume();
         } else
- -              xenbus_suspend_cancel();
+ +              xs_suspend_cancel();
   
+       device_power_up(PMSG_RESUME);
+ 
+ resume_devices:
         device_resume(PMSG_RESUME);
   
         /* Make sure timer events get retriggered on all CPUs */
diff --combined kernel/sched.c

index 133762aece50e00b76225e5b2fed7124c7694220,6cc1fd5d5072b69638c562d7e01697d4c9870684..b38bd96098f62da8154a9edf048ca15f0c95d6b6
--- 1/kernel/sched.c
--- 2/kernel/sched.c
+++ b/kernel/sched.c
@@@ -231,13 -231,20 +231,20 @@@ static void start_rt_bandwidth(struct r
   
         spin_lock(&rt_b->rt_runtime_lock);
         for (;;) {
+               unsigned long delta;
+               ktime_t soft, hard;
+ 
                 if (hrtimer_active(&rt_b->rt_period_timer))
                         break;
   
                 now = hrtimer_cb_get_time(&rt_b->rt_period_timer);
                 hrtimer_forward(&rt_b->rt_period_timer, now, rt_b->rt_period);
-               hrtimer_start_expires(&rt_b->rt_period_timer,
-                               HRTIMER_MODE_ABS);
+ 
+               soft = hrtimer_get_softexpires(&rt_b->rt_period_timer);
+               hard = hrtimer_get_expires(&rt_b->rt_period_timer);
+               delta = ktime_to_ns(ktime_sub(hard, soft));
+               __hrtimer_start_range_ns(&rt_b->rt_period_timer, soft, delta,
+                               HRTIMER_MODE_ABS, 0);
         }
         spin_unlock(&rt_b->rt_runtime_lock);
   }
@@@ -1110,7 -1117,7 +1117,7 @@@ static void hrtick_start(struct rq *rq
         if (rq == this_rq()) {
                 hrtimer_restart(timer);
         } else if (!rq->hrtick_csd_pending) {
-               __smp_call_function_single(cpu_of(rq), &rq->hrtick_csd);
+               __smp_call_function_single(cpu_of(rq), &rq->hrtick_csd, 0);
                 rq->hrtick_csd_pending = 1;
         }
   }
@@@ -1146,7 -1153,8 +1153,8 @@@ static __init void init_hrtick(void
    */
   static void hrtick_start(struct rq *rq, u64 delay)
   {
-       hrtimer_start(&rq->hrtick_timer, ns_to_ktime(delay), HRTIMER_MODE_REL);
+       __hrtimer_start_range_ns(&rq->hrtick_timer, ns_to_ktime(delay), 0,
+                       HRTIMER_MODE_REL, 0);
   }
   
   static inline void init_hrtick(void)
@@@ -2746,7 -2754,7 +2754,7 @@@ context_switch(struct rq *rq, struct ta
          * combine the page table reload and the switch backend into
          * one hypercall.
          */
- -      arch_enter_lazy_cpu_mode();
+ +      arch_start_context_switch(prev);
   
         if (unlikely(!mm)) {
                 next->active_mm = oldmm;
@@@ -3818,19 -3826,23 +3826,23 @@@ find_busiest_queue(struct sched_group *
    */
   #define MAX_PINNED_INTERVAL   512
   
+ /* Working cpumask for load_balance and load_balance_newidle. */
+ static DEFINE_PER_CPU(cpumask_var_t, load_balance_tmpmask);
+ 
   /*
    * Check this_cpu to ensure it is balanced within domain. Attempt to move
    * tasks if there is an imbalance.
    */
   static int load_balance(int this_cpu, struct rq *this_rq,
                         struct sched_domain *sd, enum cpu_idle_type idle,
-                       int *balance, struct cpumask *cpus)
+                       int *balance)
   {
         int ld_moved, all_pinned = 0, active_balance = 0, sd_idle = 0;
         struct sched_group *group;
         unsigned long imbalance;
         struct rq *busiest;
         unsigned long flags;
+       struct cpumask *cpus = __get_cpu_var(load_balance_tmpmask);
   
         cpumask_setall(cpus);
   
@@@ -3985,8 -3997,7 +3997,7 @@@ out
    * this_rq is locked.
    */
   static int
- load_balance_newidle(int this_cpu, struct rq *this_rq, struct sched_domain *sd,
-                       struct cpumask *cpus)
+ load_balance_newidle(int this_cpu, struct rq *this_rq, struct sched_domain *sd)
   {
         struct sched_group *group;
         struct rq *busiest = NULL;
@@@ -3994,6 -4005,7 +4005,7 @@@
         int ld_moved = 0;
         int sd_idle = 0;
         int all_pinned = 0;
+       struct cpumask *cpus = __get_cpu_var(load_balance_tmpmask);
   
         cpumask_setall(cpus);
   
@@@ -4134,10 -4146,6 +4146,6 @@@ static void idle_balance(int this_cpu, 
         struct sched_domain *sd;
         int pulled_task = 0;
         unsigned long next_balance = jiffies + HZ;
-       cpumask_var_t tmpmask;
- 
-       if (!alloc_cpumask_var(&tmpmask, GFP_ATOMIC))
-               return;
   
         for_each_domain(this_cpu, sd) {
                 unsigned long interval;
@@@ -4148,7 -4156,7 +4156,7 @@@
                 if (sd->flags & SD_BALANCE_NEWIDLE)
                         /* If we've pulled tasks over stop searching: */
                         pulled_task = load_balance_newidle(this_cpu, this_rq,
-                                                          sd, tmpmask);
+                                                          sd);
   
                 interval = msecs_to_jiffies(sd->balance_interval);
                 if (time_after(next_balance, sd->last_balance + interval))
@@@ -4163,7 -4171,6 +4171,6 @@@
                  */
                 this_rq->next_balance = next_balance;
         }
-       free_cpumask_var(tmpmask);
   }
   
   /*
@@@ -4313,11 -4320,6 +4320,6 @@@ static void rebalance_domains(int cpu, 
         unsigned long next_balance = jiffies + 60*HZ;
         int update_next_balance = 0;
         int need_serialize;
-       cpumask_var_t tmp;
- 
-       /* Fails alloc?  Rebalancing probably not a priority right now. */
-       if (!alloc_cpumask_var(&tmp, GFP_ATOMIC))
-               return;
   
         for_each_domain(cpu, sd) {
                 if (!(sd->flags & SD_LOAD_BALANCE))
@@@ -4342,7 -4344,7 +4344,7 @@@
                 }
   
                 if (time_after_eq(jiffies, sd->last_balance + interval)) {
-                       if (load_balance(cpu, rq, sd, idle, &balance, tmp)) {
+                       if (load_balance(cpu, rq, sd, idle, &balance)) {
                                 /*
                                  * We've pulled tasks over so either we're no
                                  * longer idle, or one of our SMT siblings is
@@@ -4376,8 -4378,6 +4378,6 @@@ out
          */
         if (likely(update_next_balance))
                 rq->next_balance = next_balance;
- 
-       free_cpumask_var(tmp);
   }
   
   /*
@@@ -4781,10 -4781,7 +4781,7 @@@ void scheduler_tick(void
   #endif
   }
   
- #if defined(CONFIG_PREEMPT) && (defined(CONFIG_DEBUG_PREEMPT) || \
-                               defined(CONFIG_PREEMPT_TRACER))
- 
- static inline unsigned long get_parent_ip(unsigned long addr)
+ unsigned long get_parent_ip(unsigned long addr)
   {
         if (in_lock_functions(addr)) {
                 addr = CALLER_ADDR2;
@@@ -4794,6 -4791,9 +4791,9 @@@
         return addr;
   }
   
+ #if defined(CONFIG_PREEMPT) && (defined(CONFIG_DEBUG_PREEMPT) || \
+                               defined(CONFIG_PREEMPT_TRACER))
+ 
   void __kprobes add_preempt_count(int val)
   {
   #ifdef CONFIG_DEBUG_PREEMPT
@@@ -4942,15 -4942,13 +4942,13 @@@ pick_next_task(struct rq *rq
   /*
    * schedule() is the main scheduler function.
    */
- asmlinkage void __sched schedule(void)
+ asmlinkage void __sched __schedule(void)
   {
         struct task_struct *prev, *next;
         unsigned long *switch_count;
         struct rq *rq;
         int cpu;
   
- need_resched:
-       preempt_disable();
         cpu = smp_processor_id();
         rq = cpu_rq(cpu);
         rcu_qsctr_inc(cpu);
@@@ -5007,13 -5005,80 +5005,80 @@@ need_resched_nonpreemptible
   
         if (unlikely(reacquire_kernel_lock(current) < 0))
                 goto need_resched_nonpreemptible;
+ }
   
+ asmlinkage void __sched schedule(void)
+ {
+ need_resched:
+       preempt_disable();
+       __schedule();
         preempt_enable_no_resched();
         if (unlikely(test_thread_flag(TIF_NEED_RESCHED)))
                 goto need_resched;
   }
   EXPORT_SYMBOL(schedule);
   
+ #ifdef CONFIG_SMP
+ /*
+  * Look out! "owner" is an entirely speculative pointer
+  * access and not reliable.
+  */
+ int mutex_spin_on_owner(struct mutex *lock, struct thread_info *owner)
+ {
+       unsigned int cpu;
+       struct rq *rq;
+ 
+       if (!sched_feat(OWNER_SPIN))
+               return 0;
+ 
+ #ifdef CONFIG_DEBUG_PAGEALLOC
+       /*
+        * Need to access the cpu field knowing that
+        * DEBUG_PAGEALLOC could have unmapped it if
+        * the mutex owner just released it and exited.
+        */
+       if (probe_kernel_address(&owner->cpu, cpu))
+               goto out;
+ #else
+       cpu = owner->cpu;
+ #endif
+ 
+       /*
+        * Even if the access succeeded (likely case),
+        * the cpu field may no longer be valid.
+        */
+       if (cpu >= nr_cpumask_bits)
+               goto out;
+ 
+       /*
+        * We need to validate that we can do a
+        * get_cpu() and that we have the percpu area.
+        */
+       if (!cpu_online(cpu))
+               goto out;
+ 
+       rq = cpu_rq(cpu);
+ 
+       for (;;) {
+               /*
+                * Owner changed, break to re-assess state.
+                */
+               if (lock->owner != owner)
+                       break;
+ 
+               /*
+                * Is that owner really running on that cpu?
+                */
+               if (task_thread_info(rq->curr) != owner || need_resched())
+                       return 0;
+ 
+               cpu_relax();
+       }
+ out:
+       return 1;
+ }
+ #endif
+ 
   #ifdef CONFIG_PREEMPT
   /*
    * this is the entry point to schedule() from in-kernel preemption
@@@ -5131,11 -5196,17 +5196,17 @@@ void __wake_up_locked(wait_queue_head_
         __wake_up_common(q, mode, 1, 0, NULL);
   }
   
+ void __wake_up_locked_key(wait_queue_head_t *q, unsigned int mode, void *key)
+ {
+       __wake_up_common(q, mode, 1, 0, key);
+ }
+ 
   /**
-  * __wake_up_sync - wake up threads blocked on a waitqueue.
+  * __wake_up_sync_key - wake up threads blocked on a waitqueue.
    * @q: the waitqueue
    * @mode: which threads
    * @nr_exclusive: how many wake-one or wake-many threads to wake up
+  * @key: opaque value to be passed to wakeup targets
    *
    * The sync wakeup differs that the waker knows that it will schedule
    * away soon, so while the target thread will be woken up, it will not
@@@ -5144,8 -5215,8 +5215,8 @@@
    *
    * On UP it can prevent extra preemption.
    */
- void
- __wake_up_sync(wait_queue_head_t *q, unsigned int mode, int nr_exclusive)
+ void __wake_up_sync_key(wait_queue_head_t *q, unsigned int mode,
+                       int nr_exclusive, void *key)
   {
         unsigned long flags;
         int sync = 1;
@@@ -5157,9 -5228,18 +5228,18 @@@
                 sync = 0;
   
         spin_lock_irqsave(&q->lock, flags);
-       __wake_up_common(q, mode, nr_exclusive, sync, NULL);
+       __wake_up_common(q, mode, nr_exclusive, sync, key);
         spin_unlock_irqrestore(&q->lock, flags);
   }
+ EXPORT_SYMBOL_GPL(__wake_up_sync_key);
+ 
+ /*
+  * __wake_up_sync - see __wake_up_sync_key()
+  */
+ void __wake_up_sync(wait_queue_head_t *q, unsigned int mode, int nr_exclusive)
+ {
+       __wake_up_sync_key(q, mode, nr_exclusive, NULL);
+ }
   EXPORT_SYMBOL_GPL(__wake_up_sync);    /* For internal use only */
   
   /**
@@@ -7648,7 -7728,7 +7728,7 @@@ cpu_to_core_group(int cpu, const struc
   {
         int group;
   
-       cpumask_and(mask, &per_cpu(cpu_sibling_map, cpu), cpu_map);
+       cpumask_and(mask, topology_thread_cpumask(cpu), cpu_map);
         group = cpumask_first(mask);
         if (sg)
                 *sg = &per_cpu(sched_group_core, group).sg;
@@@ -7677,7 -7757,7 +7757,7 @@@ cpu_to_phys_group(int cpu, const struc
         cpumask_and(mask, cpu_coregroup_mask(cpu), cpu_map);
         group = cpumask_first(mask);
   #elif defined(CONFIG_SCHED_SMT)
-       cpumask_and(mask, &per_cpu(cpu_sibling_map, cpu), cpu_map);
+       cpumask_and(mask, topology_thread_cpumask(cpu), cpu_map);
         group = cpumask_first(mask);
   #else
         group = cpu;
@@@ -8020,7 -8100,7 +8100,7 @@@ static int __build_sched_domains(const 
                 SD_INIT(sd, SIBLING);
                 set_domain_attribute(sd, attr);
                 cpumask_and(sched_domain_span(sd),
-                           &per_cpu(cpu_sibling_map, i), cpu_map);
+                           topology_thread_cpumask(i), cpu_map);
                 sd->parent = p;
                 p->child = sd;
                 cpu_to_cpu_group(i, cpu_map, &sd->groups, tmpmask);
@@@ -8031,7 -8111,7 +8111,7 @@@
         /* Set up CPU (sibling) groups */
         for_each_cpu(i, cpu_map) {
                 cpumask_and(this_sibling_map,
-                           &per_cpu(cpu_sibling_map, i), cpu_map);
+                           topology_thread_cpumask(i), cpu_map);
                 if (i != cpumask_first(this_sibling_map))
                         continue;
   
@@@ -8706,6 -8786,9 +8786,9 @@@ void __init sched_init(void
   #endif
   #ifdef CONFIG_USER_SCHED
         alloc_size *= 2;
+ #endif
+ #ifdef CONFIG_CPUMASK_OFFSTACK
+       alloc_size += num_possible_cpus() * cpumask_size();
   #endif
         /*
          * As sched_init() is called before page_alloc is setup,
@@@ -8744,6 -8827,12 +8827,12 @@@
                 ptr += nr_cpu_ids * sizeof(void **);
   #endif /* CONFIG_USER_SCHED */
   #endif /* CONFIG_RT_GROUP_SCHED */
+ #ifdef CONFIG_CPUMASK_OFFSTACK
+               for_each_possible_cpu(i) {
+                       per_cpu(load_balance_tmpmask, i) = (void *)ptr;
+                       ptr += cpumask_size();
+               }
+ #endif /* CONFIG_CPUMASK_OFFSTACK */
         }
   
   #ifdef CONFIG_SMP
author	Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
	Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)
committer	Jeremy Fitzhardinge <jeremy.fitzhardinge@citrix.com>
	Tue, 7 Apr 2009 20:34:16 +0000 (13:34 -0700)
		1	2
arch/x86/include/asm/paravirt.h	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/include/asm/pgtable.h	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/include/asm/thread_info.h	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/kernel/kvm.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/kernel/paravirt.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/kernel/process_32.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/kernel/process_64.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/kernel/vmi_32.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/lguest/boot.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/mm/highmem_32.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/mm/iomap_32.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/mm/pageattr.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/xen/mmu.c	patch \|	diff1 \|	diff2 \|	blob \| history
arch/x86/xen/smp.c	patch \|	diff1 \|	diff2 \|	blob \| history
drivers/xen/Kconfig	patch \|	diff1 \|	diff2 \|	blob \| history
drivers/xen/cpu_hotplug.c	patch \|	diff1 \|	diff2 \|	blob \| history
drivers/xen/manage.c	patch \|	diff1 \|	diff2 \|	blob \| history
kernel/sched.c	patch \|	diff1 \|	diff2 \|	blob \| history