#include <linux/init.h>
#include <linux/mm.h>
-#include <linux/irq.h>
#include <linux/delay.h>
#include <linux/spinlock.h>
#include <linux/smp_lock.h>
#include <linux/mc146818rtc.h>
#include <linux/cache.h>
#include <linux/interrupt.h>
+#include <linux/cpu.h>
+#include <linux/module.h>
#include <asm/mtrr.h>
#include <asm/tlbflush.h>
-#include <mach_ipi.h>
+#include <asm/desc.h>
#include <mach_apic.h>
/*
* about nothing of note with C stepping upwards.
*/
-struct tlb_state cpu_tlbstate[NR_CPUS] __cacheline_aligned = {[0 ... NR_CPUS-1] = { &init_mm, 0, }};
+DEFINE_PER_CPU(struct tlb_state, cpu_tlbstate) ____cacheline_aligned = { &init_mm, 0, };
/*
* the following functions deal with sending IPIs between CPUs.
static inline int __prepare_ICR (unsigned int shortcut, int vector)
{
- return APIC_DM_FIXED | shortcut | vector | APIC_DEST_LOGICAL;
+ unsigned int icr = shortcut | APIC_DEST_LOGICAL;
+
+ switch (vector) {
+ default:
+ icr |= APIC_DM_FIXED | vector;
+ break;
+ case NMI_VECTOR:
+ icr |= APIC_DM_NMI;
+ break;
+ }
+ return icr;
}
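+
+/*
+ * Illustrative only: with the switch above, a fixed-vector IPI such as
+ *
+ *        __prepare_ICR(APIC_DEST_ALLBUT, CALL_FUNCTION_VECTOR)
+ *
+ * evaluates to APIC_DEST_ALLBUT | APIC_DEST_LOGICAL | APIC_DM_FIXED |
+ * CALL_FUNCTION_VECTOR, while __prepare_ICR(0, NMI_VECTOR) evaluates to
+ * APIC_DEST_LOGICAL | APIC_DM_NMI with the vector field left clear.
+ */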
static inline int __prepare_ICR2 (unsigned int mask)
return SET_APIC_DEST_FIELD(mask);
}
-inline void __send_IPI_shortcut(unsigned int shortcut, int vector)
+void __send_IPI_shortcut(unsigned int shortcut, int vector)
{
/*
* Subtle. In the case of the 'never do double writes' workaround
/*
* This is only used on smaller machines.
*/
-inline void send_IPI_mask_bitmask(cpumask_t cpumask, int vector)
+void send_IPI_mask_bitmask(cpumask_t cpumask, int vector)
{
- unsigned long mask = cpus_coerce(cpumask);
+ unsigned long mask = cpus_addr(cpumask)[0];
unsigned long cfg;
unsigned long flags;
local_irq_save(flags);
-
+ WARN_ON(mask & ~cpus_addr(cpu_online_map)[0]);
/*
* Wait for idle.
*/
local_irq_restore(flags);
}
-inline void send_IPI_mask_sequence(cpumask_t mask, int vector)
+void send_IPI_mask_sequence(cpumask_t mask, int vector)
{
unsigned long cfg, flags;
unsigned int query_cpu;
local_irq_restore(flags);
}
+#include <mach_ipi.h> /* must come after the send_IPI functions above for inlining */
+
/*
* Smarter SMP flushing macros.
* c/o Linus Torvalds.
static cpumask_t flush_cpumask;
static struct mm_struct * flush_mm;
static unsigned long flush_va;
-static spinlock_t tlbstate_lock = SPIN_LOCK_UNLOCKED;
+static DEFINE_SPINLOCK(tlbstate_lock);
#define FLUSH_ALL 0xffffffff
/*
*/
static inline void leave_mm (unsigned long cpu)
{
- if (cpu_tlbstate[cpu].state == TLBSTATE_OK)
+ if (per_cpu(cpu_tlbstate, cpu).state == TLBSTATE_OK)
BUG();
- cpu_clear(cpu, cpu_tlbstate[cpu].active_mm->cpu_vm_mask);
+ cpu_clear(cpu, per_cpu(cpu_tlbstate, cpu).active_mm->cpu_vm_mask);
load_cr3(swapper_pg_dir);
}
* 2) Leave the mm if we are in the lazy tlb mode.
*/
-asmlinkage void smp_invalidate_interrupt (void)
+fastcall void smp_invalidate_interrupt(struct pt_regs *regs)
{
unsigned long cpu;
cpu = get_cpu();
+ if (current->active_mm)
+ load_user_cs_desc(cpu, current->active_mm);
if (!cpu_isset(cpu, flush_cpumask))
goto out;
* BUG();
*/
- if (flush_mm == cpu_tlbstate[cpu].active_mm) {
- if (cpu_tlbstate[cpu].state == TLBSTATE_OK) {
-#ifndef CONFIG_X86_SWITCH_PAGETABLES
+ if (flush_mm == per_cpu(cpu_tlbstate, cpu).active_mm) {
+ if (per_cpu(cpu_tlbstate, cpu).state == TLBSTATE_OK) {
if (flush_va == FLUSH_ALL)
local_flush_tlb();
else
__flush_tlb_one(flush_va);
-#endif
} else
leave_mm(cpu);
}
static void flush_tlb_others(cpumask_t cpumask, struct mm_struct *mm,
unsigned long va)
{
- cpumask_t tmp;
/*
* A couple of (to be removed) sanity checks:
*
- * - we do not send IPIs to not-yet booted CPUs.
* - current CPU must not be in mask
* - mask must exist :)
*/
BUG_ON(cpus_empty(cpumask));
-
- cpus_and(tmp, cpumask, cpu_online_map);
- BUG_ON(!cpus_equal(cpumask, tmp));
BUG_ON(cpu_isset(smp_processor_id(), cpumask));
BUG_ON(!mm);
+ /* If a CPU which we ran on has gone down, OK. */
+ cpus_and(cpumask, cpumask, cpu_online_map);
+ if (cpus_empty(cpumask))
+ return;
+
/*
* i'm not happy about this global shared spinlock in the
* MM hot path, but we'll see how contended it is.
spin_unlock(&tlbstate_lock);
}
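+
+/*
+ * Flush current->mm on this CPU and on every other CPU found in
+ * mm->cpu_vm_mask.  Preemption is disabled so the cpumask snapshot and
+ * the local flush happen on the same CPU.
+ */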
+void flush_tlb_current_task(void)
+{
+ struct mm_struct *mm = current->mm;
+ cpumask_t cpu_mask;
+
+ preempt_disable();
+ cpu_mask = mm->cpu_vm_mask;
+ cpu_clear(smp_processor_id(), cpu_mask);
+
+ local_flush_tlb();
+ if (!cpus_empty(cpu_mask))
+ flush_tlb_others(cpu_mask, mm, FLUSH_ALL);
+ preempt_enable();
+}
+
void flush_tlb_mm (struct mm_struct * mm)
{
cpumask_t cpu_mask;
if (current->active_mm == mm) {
if(current->mm)
-#ifndef CONFIG_X86_SWITCH_PAGETABLES
- __flush_tlb_one(va)
-#endif
- ;
+ __flush_tlb_one(va);
else
leave_mm(smp_processor_id());
}
preempt_enable();
}
+EXPORT_SYMBOL(flush_tlb_page);
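+
+/*
+ * Usage sketch (caller names are illustrative): after the PTE for a single
+ * user address has been changed, e.g.
+ *
+ *        set_pte(ptep, entry);
+ *        flush_tlb_page(vma, address);
+ *
+ * the stale translation is dropped locally and, via the IPI path above, on
+ * every other CPU that has this mm active or lazily loaded.
+ */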
static void do_flush_tlb_all(void* info)
{
unsigned long cpu = smp_processor_id();
__flush_tlb_all();
- if (cpu_tlbstate[cpu].state == TLBSTATE_LAZY)
+ if (per_cpu(cpu_tlbstate, cpu).state == TLBSTATE_LAZY)
leave_mm(cpu);
}
void flush_tlb_all(void)
{
- on_each_cpu(do_flush_tlb_all, 0, 1, 1);
+ on_each_cpu(do_flush_tlb_all, NULL, 1, 1);
}
/*
*/
void smp_send_reschedule(int cpu)
{
+ WARN_ON(cpu_is_offline(cpu));
send_IPI_mask(cpumask_of_cpu(cpu), RESCHEDULE_VECTOR);
}
* Structure and data for smp_call_function(). This is designed to minimise
* static memory requirements. It also looks cleaner.
*/
-static spinlock_t call_lock = SPIN_LOCK_UNLOCKED;
+static DEFINE_SPINLOCK(call_lock);
struct call_data_struct {
void (*func) (void *info);
int wait;
};
-static struct call_data_struct * call_data;
+void lock_ipi_call_lock(void)
+{
+ spin_lock_irq(&call_lock);
+}
-/*
- * this function sends a 'generic call function' IPI to all other CPUs
- * in the system.
- */
+void unlock_ipi_call_lock(void)
+{
+ spin_unlock_irq(&call_lock);
+}
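+
+/*
+ * lock_ipi_call_lock()/unlock_ipi_call_lock() let other code exclude
+ * call-function IPIs while it changes state that the IPI path relies on.
+ * A sketch of the sort of use intended (illustrative): a CPU marking
+ * itself online, so that smp_call_function() either sees it and IPIs it,
+ * or does not see it at all:
+ *
+ *        lock_ipi_call_lock();
+ *        cpu_set(smp_processor_id(), cpu_online_map);
+ *        unlock_ipi_call_lock();
+ */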
-int smp_call_function (void (*func) (void *info), void *info, int nonatomic,
- int wait)
-/*
- * [SUMMARY] Run a function on all other CPUs.
- * <func> The function to run. This must be fast and non-blocking.
- * <info> An arbitrary pointer to pass to the function.
- * <nonatomic> currently unused.
- * <wait> If true, wait (atomically) until function has completed on other CPUs.
- * [RETURNS] 0 on success, else a negative status code. Does not return until
+static struct call_data_struct *call_data;
+
+/**
+ * smp_call_function(): Run a function on all other CPUs.
+ * @func: The function to run. This must be fast and non-blocking.
+ * @info: An arbitrary pointer to pass to the function.
+ * @nonatomic: currently unused.
+ * @wait: If true, wait (atomically) until function has completed on other CPUs.
+ *
+ * Returns 0 on success, else a negative status code. Does not return until
* remote CPUs are nearly ready to execute <<func>> or have already executed it.
*
* You must not call this function with disabled interrupts or from a
* hardware interrupt handler or from a bottom half handler.
*/
+int smp_call_function (void (*func) (void *info), void *info, int nonatomic,
+ int wait)
{
struct call_data_struct data;
- int cpus = num_online_cpus()-1;
+ int cpus;
- if (!cpus)
+ /* Holding any lock stops cpus from going down. */
+ spin_lock(&call_lock);
+ cpus = num_online_cpus() - 1;
+ if (!cpus) {
+ spin_unlock(&call_lock);
return 0;
+ }
/* Can deadlock when called with interrupts disabled */
WARN_ON(irqs_disabled());
if (wait)
atomic_set(&data.finished, 0);
- spin_lock(&call_lock);
call_data = &data;
mb();
/* Wait for response */
while (atomic_read(&data.started) != cpus)
- barrier();
+ cpu_relax();
if (wait)
while (atomic_read(&data.finished) != cpus)
- barrier();
+ cpu_relax();
spin_unlock(&call_lock);
return 0;
}
+EXPORT_SYMBOL(smp_call_function);
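+
+/*
+ * Minimal usage sketch for smp_call_function(); the helper and the counter
+ * are made up for illustration.  The callback runs in interrupt context on
+ * the other CPUs, so it must not sleep.
+ *
+ *        static atomic_t probes = ATOMIC_INIT(0);
+ *
+ *        static void probe_cpu(void *info)
+ *        {
+ *                atomic_inc(&probes);
+ *        }
+ *
+ *        smp_call_function(probe_cpu, NULL, 0, 1);
+ *        probe_cpu(NULL);        (the calling CPU is not included)
+ */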
static void stop_this_cpu (void * dummy)
{
local_irq_disable();
disable_local_APIC();
if (cpu_data[smp_processor_id()].hlt_works_ok)
- for(;;) __asm__("hlt");
+ for(;;) halt();
for (;;);
}
* all the work is done automatically when
* we return from the interrupt.
*/
-asmlinkage void smp_reschedule_interrupt(void)
+fastcall void smp_reschedule_interrupt(struct pt_regs *regs)
{
ack_APIC_irq();
}
-asmlinkage void smp_call_function_interrupt(void)
+fastcall void smp_call_function_interrupt(struct pt_regs *regs)
{
void (*func) (void *info) = call_data->func;
void *info = call_data->info;
}
}
+/*
+ * this function sends a 'generic call function' IPI to one other CPU
+ * in the system.
+ *
+ * cpu is a standard Linux logical CPU number.
+ */
+static void
+__smp_call_function_single(int cpu, void (*func) (void *info), void *info,
+ int nonatomic, int wait)
+{
+ struct call_data_struct data;
+ int cpus = 1;
+
+ data.func = func;
+ data.info = info;
+ atomic_set(&data.started, 0);
+ data.wait = wait;
+ if (wait)
+ atomic_set(&data.finished, 0);
+
+ call_data = &data;
+ wmb();
+ /* Send a message to all other CPUs and wait for them to respond */
+ send_IPI_mask(cpumask_of_cpu(cpu), CALL_FUNCTION_VECTOR);
+
+ /* Wait for response */
+ while (atomic_read(&data.started) != cpus)
+ cpu_relax();
+
+ if (!wait)
+ return;
+
+ while (atomic_read(&data.finished) != cpus)
+ cpu_relax();
+}
+
+/**
+ * smp_call_function_single - Run a function on another CPU
+ * @cpu: The target CPU; must not be the calling CPU.
+ * @func: The function to run. This must be fast and non-blocking.
+ * @info: An arbitrary pointer to pass to the function.
+ * @nonatomic: Currently unused.
+ * @wait: If true, wait until function has completed on the other CPU.
+ *
+ * Returns 0 on success, else a negative status code.
+ *
+ * Does not return until the remote CPU is nearly ready to execute <func>
+ * or has already executed it.
+ */
+int smp_call_function_single(int cpu, void (*func) (void *info), void *info,
+ int nonatomic, int wait)
+{
+ /* prevent preemption and reschedule on another processor */
+ int me = get_cpu();
+ if (cpu == me) {
+ WARN_ON(1);
+ put_cpu();
+ return -EBUSY;
+ }
+
+ /* Can deadlock when called with interrupts disabled */
+ WARN_ON(irqs_disabled());
+
+ spin_lock_bh(&call_lock);
+ __smp_call_function_single(cpu, func, info, nonatomic, wait);
+ spin_unlock_bh(&call_lock);
+ put_cpu();
+ return 0;
+}
+EXPORT_SYMBOL(smp_call_function_single);
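+
+/*
+ * Usage sketch for smp_call_function_single() (struct and helper names are
+ * illustrative): read an MSR on one particular CPU.
+ *
+ *        struct msr_info { u32 msr_no, lo, hi; };
+ *
+ *        static void __read_msr(void *info)
+ *        {
+ *                struct msr_info *m = info;
+ *                rdmsr(m->msr_no, m->lo, m->hi);
+ *        }
+ *
+ *        struct msr_info m = { .msr_no = MSR_IA32_APICBASE };
+ *        smp_call_function_single(cpu, __read_msr, &m, 0, 1);
+ *
+ * The target must not be the calling CPU (that returns -EBUSY) and
+ * interrupts must not be disabled around the call.
+ */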
+
+static int convert_apicid_to_cpu(int apic_id)
+{
+ int i;
+
+ for (i = 0; i < NR_CPUS; i++) {
+ if (x86_cpu_to_apicid[i] == apic_id)
+ return i;
+ }
+ return -1;
+}
+
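+/*
+ * Like smp_processor_id(), but derived from the hardware APIC ID rather
+ * than from per-thread state, so it can be used (for example) from NMI or
+ * crash paths where the usual bookkeeping may not be trustworthy.  Falls
+ * back to CPU 0 when no valid mapping is found.
+ */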
+int safe_smp_processor_id(void)
+{
+ int apicid, cpuid;
+
+ if (!boot_cpu_has(X86_FEATURE_APIC))
+ return 0;
+
+ apicid = hard_smp_processor_id();
+ if (apicid == BAD_APICID)
+ return 0;
+
+ cpuid = convert_apicid_to_cpu(apicid);
+
+ return cpuid >= 0 ? cpuid : 0;
+}