arch/mips/kernel/smp.c

   1 /*
   2  * This program is free software; you can redistribute it and/or
   3  * modify it under the terms of the GNU General Public License
   4  * as published by the Free Software Foundation; either version 2
   5  * of the License, or (at your option) any later version.
   6  *
   7  * This program is distributed in the hope that it will be useful,
   8  * but WITHOUT ANY WARRANTY; without even the implied warranty of
   9  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  10  * GNU General Public License for more details.
  11  *
  12  * You should have received a copy of the GNU General Public License
  13  * along with this program; if not, write to the Free Software
  14  * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
  15  *
  16  * Copyright (C) 2000, 2001 Kanoj Sarcar
  17  * Copyright (C) 2000, 2001 Ralf Baechle
  18  * Copyright (C) 2000, 2001 Silicon Graphics, Inc.
  19  * Copyright (C) 2000, 2001, 2003 Broadcom Corporation
  20  */
  21 #include <linux/config.h>
  22 #include <linux/cache.h>
  23 #include <linux/delay.h>
  24 #include <linux/init.h>
  25 #include <linux/interrupt.h>
  26 #include <linux/spinlock.h>
  27 #include <linux/threads.h>
  28 #include <linux/module.h>
  29 #include <linux/time.h>
  30 #include <linux/timex.h>
  31 #include <linux/sched.h>
  32 #include <linux/cpumask.h>
  33
  34 #include <asm/atomic.h>
  35 #include <asm/cpu.h>
  36 #include <asm/processor.h>
  37 #include <asm/system.h>
  38 #include <asm/hardirq.h>
  39 #include <asm/mmu_context.h>
  40 #include <asm/smp.h>
  41
  42 cpumask_t phys_cpu_present_map;         /* Bitmask of available CPUs */
  43 volatile cpumask_t cpu_callin_map;      /* Bitmask of started secondaries */
  44 cpumask_t cpu_online_map;               /* Bitmask of currently online CPUs */
  45 int __cpu_number_map[NR_CPUS];          /* Map physical to logical */
  46 int __cpu_logical_map[NR_CPUS];         /* Map logical to physical */
  47
  48 EXPORT_SYMBOL(cpu_online_map);
  49
  50 cycles_t cacheflush_time;
  51 unsigned long cache_decay_ticks;
  52
  53 static void smp_tune_scheduling (void)
  54 {
  55         struct cache_desc *cd = &current_cpu_data.scache;
  56         unsigned long cachesize;       /* kB   */
  57         unsigned long bandwidth = 350; /* MB/s */
  58         unsigned long cpu_khz;
  59
  60         /*
  61          * Crude estimate until we actually meassure ...
  62          */
  63         cpu_khz = loops_per_jiffy * 2 * HZ / 1000;
  64
  65         /*
  66          * Rough estimation for SMP scheduling, this is the number of
  67          * cycles it takes for a fully memory-limited process to flush
  68          * the SMP-local cache.
  69          *
  70          * (For a P5 this pretty much means we will choose another idle
  71          *  CPU almost always at wakeup time (this is due to the small
  72          *  L1 cache), on PIIs it's around 50-100 usecs, depending on
  73          *  the cache size)
  74          */
  75         if (!cpu_khz) {
  76                 /*
  77                  * This basically disables processor-affinity scheduling on SMP
  78                  * without a cycle counter.  Currently all SMP capable MIPS
  79                  * processors have a cycle counter.
  80                  */
  81                 cacheflush_time = 0;
  82                 return;
  83         }
  84
  85         cachesize = cd->linesz * cd->sets * cd->ways;
  86         cacheflush_time = (cpu_khz>>10) * (cachesize<<10) / bandwidth;
  87         cache_decay_ticks = (long)cacheflush_time/cpu_khz * HZ / 1000;
  88
  89         printk("per-CPU timeslice cutoff: %ld.%02ld usecs.\n",
  90                 (long)cacheflush_time/(cpu_khz/1000),
  91                 ((long)cacheflush_time*100/(cpu_khz/1000)) % 100);
  92         printk("task migration cache decay timeout: %ld msecs.\n",
  93                 (cache_decay_ticks + 1) * 1000 / HZ);
  94 }
  95
  96 extern void __init calibrate_delay(void);
  97
  98 /*
  99  * First C code run on the secondary CPUs after being started up by
 100  * the master.
 101  */
 102 asmlinkage void start_secondary(void)
 103 {
 104         unsigned int cpu = smp_processor_id();
 105
 106         cpu_probe();
 107         cpu_report();
 108         per_cpu_trap_init();
 109         prom_init_secondary();
 110
 111         /*
 112          * XXX parity protection should be folded in here when it's converted
 113          * to an option instead of something based on .cputype
 114          */
 115
 116         calibrate_delay();
 117         cpu_data[cpu].udelay_val = loops_per_jiffy;
 118
 119         prom_smp_finish();
 120
 121         cpu_set(cpu, cpu_callin_map);
 122
 123         cpu_idle();
 124 }
 125
 126 spinlock_t smp_call_lock = SPIN_LOCK_UNLOCKED;
 127
 128 struct call_data_struct *call_data;
 129
 130 /*
 131  * Run a function on all other CPUs.
 132  *  <func>      The function to run. This must be fast and non-blocking.
 133  *  <info>      An arbitrary pointer to pass to the function.
 134  *  <retry>     If true, keep retrying until ready.
 135  *  <wait>      If true, wait until function has completed on other CPUs.
 136  *  [RETURNS]   0 on success, else a negative status code.
 137  *
 138  * Does not return until remote CPUs are nearly ready to execute <func>
 139  * or are or have executed.
 140  *
 141  * You must not call this function with disabled interrupts or from a
 142  * hardware interrupt handler or from a bottom half handler.
 143  */
 144 int smp_call_function (void (*func) (void *info), void *info, int retry,
 145                                                                 int wait)
 146 {
 147         struct call_data_struct data;
 148         int i, cpus = num_online_cpus() - 1;
 149         int cpu = smp_processor_id();
 150
 151         if (!cpus)
 152                 return 0;
 153
 154         data.func = func;
 155         data.info = info;
 156         atomic_set(&data.started, 0);
 157         data.wait = wait;
 158         if (wait)
 159                 atomic_set(&data.finished, 0);
 160
 161         spin_lock(&smp_call_lock);
 162         call_data = &data;
 163         mb();
 164
 165         /* Send a message to all other CPUs and wait for them to respond */
 166         for (i = 0; i < NR_CPUS; i++)
 167                 if (cpu_online(i) && i != cpu)
 168                         core_send_ipi(i, SMP_CALL_FUNCTION);
 169
 170         /* Wait for response */
 171         /* FIXME: lock-up detection, backtrace on lock-up */
 172         while (atomic_read(&data.started) != cpus)
 173                 barrier();
 174
 175         if (wait)
 176                 while (atomic_read(&data.finished) != cpus)
 177                         barrier();
 178         spin_unlock(&smp_call_lock);
 179
 180         return 0;
 181 }
 182
 183 void smp_call_function_interrupt(void)
 184 {
 185         void (*func) (void *info) = call_data->func;
 186         void *info = call_data->info;
 187         int wait = call_data->wait;
 188
 189         /*
 190          * Notify initiating CPU that I've grabbed the data and am
 191          * about to execute the function.
 192          */
 193         mb();
 194         atomic_inc(&call_data->started);
 195
 196         /*
 197          * At this point the info structure may be out of scope unless wait==1.
 198          */
 199         irq_enter();
 200         (*func)(info);
 201         irq_exit();
 202
 203         if (wait) {
 204                 mb();
 205                 atomic_inc(&call_data->finished);
 206         }
 207 }
 208
 209 static void stop_this_cpu(void *dummy)
 210 {
 211         /*
 212          * Remove this CPU:
 213          */
 214         cpu_clear(smp_processor_id(), cpu_online_map);
 215         local_irq_enable();     /* May need to service _machine_restart IPI */
 216         for (;;);               /* Wait if available. */
 217 }
 218
 219 void smp_send_stop(void)
 220 {
 221         smp_call_function(stop_this_cpu, NULL, 1, 0);
 222 }
 223
 224 void __init smp_cpus_done(unsigned int max_cpus)
 225 {
 226         prom_cpus_done();
 227 }
 228
 229 /* called from main before smp_init() */
 230 void __init smp_prepare_cpus(unsigned int max_cpus)
 231 {
 232         cpu_data[0].udelay_val = loops_per_jiffy;
 233         init_new_context(current, &init_mm);
 234         current_thread_info()->cpu = 0;
 235         smp_tune_scheduling();
 236         prom_build_cpu_map();
 237         prom_prepare_cpus(max_cpus);
 238 }
 239
 240 /* preload SMP state for boot cpu */
 241 void __devinit smp_prepare_boot_cpu(void)
 242 {
 243         /*
 244          * This assumes that bootup is always handled by the processor
 245          * with the logic and physical number 0.
 246          */
 247         __cpu_number_map[0] = 0;
 248         __cpu_logical_map[0] = 0;
 249         cpu_set(0, phys_cpu_present_map);
 250         cpu_set(0, cpu_online_map);
 251         cpu_set(0, cpu_callin_map);
 252 }
 253
 254 static struct task_struct * __init fork_by_hand(void)
 255 {
 256         struct pt_regs regs;
 257         /*
 258          * don't care about the eip and regs settings since
 259          * we'll never reschedule the forked task.
 260          */
 261         return copy_process(CLONE_VM|CLONE_IDLETASK, 0, &regs, 0, NULL, NULL);
 262 }
 263
 264 /*
 265  * Startup the CPU with this logical number
 266  */
 267 static int __init do_boot_cpu(int cpu)
 268 {
 269         struct task_struct *idle;
 270
 271         /*
 272          * The following code is purely to make sure
 273          * Linux can schedule processes on this slave.
 274          */
 275         idle = fork_by_hand();
 276         if (IS_ERR(idle))
 277                 panic("failed fork for CPU %d\n", cpu);
 278
 279         wake_up_forked_process(idle);
 280
 281         /*
 282          * We remove it from the pidhash and the runqueue once we've
 283          * got the process:
 284          */
 285         init_idle(idle, cpu);
 286
 287         unhash_process(idle);
 288
 289         prom_boot_secondary(cpu, idle);
 290
 291         /* XXXKW timeout */
 292         while (!cpu_isset(cpu, cpu_callin_map))
 293                 udelay(100);
 294
 295         cpu_set(cpu, cpu_online_map);
 296
 297         return 0;
 298 }
 299
 300 /*
 301  * Called once for each "cpu_possible(cpu)".  Needs to spin up the cpu
 302  * and keep control until "cpu_online(cpu)" is set.  Note: cpu is
 303  * physical, not logical.
 304  */
 305 int __devinit __cpu_up(unsigned int cpu)
 306 {
 307         int ret;
 308
 309         /* Processor goes to start_secondary(), sets online flag */
 310         ret = do_boot_cpu(cpu);
 311         if (ret < 0)
 312                 return ret;
 313
 314         return 0;
 315 }
 316
 317 /* Not really SMP stuff ... */
 318 int setup_profiling_timer(unsigned int multiplier)
 319 {
 320         return 0;
 321 }
 322
 323 static void flush_tlb_all_ipi(void *info)
 324 {
 325         local_flush_tlb_all();
 326 }
 327
 328 void flush_tlb_all(void)
 329 {
 330         on_each_cpu(flush_tlb_all_ipi, 0, 1, 1);
 331 }
 332
 333 static void flush_tlb_mm_ipi(void *mm)
 334 {
 335         local_flush_tlb_mm((struct mm_struct *)mm);
 336 }
 337
 338 /*
 339  * The following tlb flush calls are invoked when old translations are
 340  * being torn down, or pte attributes are changing. For single threaded
 341  * address spaces, a new context is obtained on the current cpu, and tlb
 342  * context on other cpus are invalidated to force a new context allocation
 343  * at switch_mm time, should the mm ever be used on other cpus. For
 344  * multithreaded address spaces, intercpu interrupts have to be sent.
 345  * Another case where intercpu interrupts are required is when the target
 346  * mm might be active on another cpu (eg debuggers doing the flushes on
 347  * behalf of debugees, kswapd stealing pages from another process etc).
 348  * Kanoj 07/00.
 349  */
 350
 351 void flush_tlb_mm(struct mm_struct *mm)
 352 {
 353         preempt_disable();
 354
 355         if ((atomic_read(&mm->mm_users) != 1) || (current->mm != mm)) {
 356                 smp_call_function(flush_tlb_mm_ipi, (void *)mm, 1, 1);
 357         } else {
 358                 int i;
 359                 for (i = 0; i < num_online_cpus(); i++)
 360                         if (smp_processor_id() != i)
 361                                 cpu_context(i, mm) = 0;
 362         }
 363         local_flush_tlb_mm(mm);
 364
 365         preempt_enable();
 366 }
 367
 368 struct flush_tlb_data {
 369         struct vm_area_struct *vma;
 370         unsigned long addr1;
 371         unsigned long addr2;
 372 };
 373
 374 static void flush_tlb_range_ipi(void *info)
 375 {
 376         struct flush_tlb_data *fd = (struct flush_tlb_data *)info;
 377
 378         local_flush_tlb_range(fd->vma, fd->addr1, fd->addr2);
 379 }
 380
 381 void flush_tlb_range(struct vm_area_struct *vma, unsigned long start, unsigned long end)
 382 {
 383         struct mm_struct *mm = vma->vm_mm;
 384
 385         preempt_disable();
 386         if ((atomic_read(&mm->mm_users) != 1) || (current->mm != mm)) {
 387                 struct flush_tlb_data fd;
 388
 389                 fd.vma = vma;
 390                 fd.addr1 = start;
 391                 fd.addr2 = end;
 392                 smp_call_function(flush_tlb_range_ipi, (void *)&fd, 1, 1);
 393         } else {
 394                 int i;
 395                 for (i = 0; i < num_online_cpus(); i++)
 396                         if (smp_processor_id() != i)
 397                                 cpu_context(i, mm) = 0;
 398         }
 399         local_flush_tlb_range(vma, start, end);
 400         preempt_enable();
 401 }
 402
 403 static void flush_tlb_kernel_range_ipi(void *info)
 404 {
 405         struct flush_tlb_data *fd = (struct flush_tlb_data *)info;
 406
 407         local_flush_tlb_kernel_range(fd->addr1, fd->addr2);
 408 }
 409
 410 void flush_tlb_kernel_range(unsigned long start, unsigned long end)
 411 {
 412         struct flush_tlb_data fd;
 413
 414         fd.addr1 = start;
 415         fd.addr2 = end;
 416         on_each_cpu(flush_tlb_kernel_range_ipi, (void *)&fd, 1, 1);
 417 }
 418
 419 static void flush_tlb_page_ipi(void *info)
 420 {
 421         struct flush_tlb_data *fd = (struct flush_tlb_data *)info;
 422
 423         local_flush_tlb_page(fd->vma, fd->addr1);
 424 }
 425
 426 void flush_tlb_page(struct vm_area_struct *vma, unsigned long page)
 427 {
 428         preempt_disable();
 429         if ((atomic_read(&vma->vm_mm->mm_users) != 1) || (current->mm != vma->vm_mm)) {
 430                 struct flush_tlb_data fd;
 431
 432                 fd.vma = vma;
 433                 fd.addr1 = page;
 434                 smp_call_function(flush_tlb_page_ipi, (void *)&fd, 1, 1);
 435         } else {
 436                 int i;
 437                 for (i = 0; i < num_online_cpus(); i++)
 438                         if (smp_processor_id() != i)
 439                                 cpu_context(i, vma->vm_mm) = 0;
 440         }
 441         local_flush_tlb_page(vma, page);
 442         preempt_enable();
 443 }
 444
 445 static void flush_tlb_one_ipi(void *info)
 446 {
 447         unsigned long vaddr = (unsigned long) info;
 448
 449         local_flush_tlb_one(vaddr);
 450 }
 451
 452 void flush_tlb_one(unsigned long vaddr)
 453 {
 454         smp_call_function(flush_tlb_one_ipi, (void *) vaddr, 1, 1);
 455         local_flush_tlb_one(vaddr);
 456 }
 457
 458 EXPORT_SYMBOL(flush_tlb_page);
 459 EXPORT_SYMBOL(flush_tlb_one);
 460 EXPORT_SYMBOL(cpu_data);
 461 EXPORT_SYMBOL(synchronize_irq);