/* Source snapshot of v2.6.12 (code viewer reported 621 lines, 13 kB). */
1/* 2 * SMP support for ppc. 3 * 4 * Written by Cort Dougan (cort@cs.nmt.edu) borrowing a great 5 * deal of code from the sparc and intel versions. 6 * 7 * Copyright (C) 1999 Cort Dougan <cort@cs.nmt.edu> 8 * 9 * PowerPC-64 Support added by Dave Engebretsen, Peter Bergner, and 10 * Mike Corrigan {engebret|bergner|mikec}@us.ibm.com 11 * 12 * This program is free software; you can redistribute it and/or 13 * modify it under the terms of the GNU General Public License 14 * as published by the Free Software Foundation; either version 15 * 2 of the License, or (at your option) any later version. 16 */ 17 18#undef DEBUG 19 20#include <linux/config.h> 21#include <linux/kernel.h> 22#include <linux/module.h> 23#include <linux/sched.h> 24#include <linux/smp.h> 25#include <linux/interrupt.h> 26#include <linux/delay.h> 27#include <linux/init.h> 28#include <linux/spinlock.h> 29#include <linux/cache.h> 30#include <linux/err.h> 31#include <linux/sysdev.h> 32#include <linux/cpu.h> 33#include <linux/notifier.h> 34 35#include <asm/ptrace.h> 36#include <asm/atomic.h> 37#include <asm/irq.h> 38#include <asm/page.h> 39#include <asm/pgtable.h> 40#include <asm/prom.h> 41#include <asm/smp.h> 42#include <asm/paca.h> 43#include <asm/time.h> 44#include <asm/machdep.h> 45#include <asm/cputable.h> 46#include <asm/system.h> 47#include <asm/abs_addr.h> 48 49#include "mpic.h" 50 51#ifdef DEBUG 52#define DBG(fmt...) udbg_printf(fmt) 53#else 54#define DBG(fmt...) 55#endif 56 57cpumask_t cpu_possible_map = CPU_MASK_NONE; 58cpumask_t cpu_online_map = CPU_MASK_NONE; 59cpumask_t cpu_sibling_map[NR_CPUS] = { [0 ... 
NR_CPUS-1] = CPU_MASK_NONE }; 60 61EXPORT_SYMBOL(cpu_online_map); 62EXPORT_SYMBOL(cpu_possible_map); 63 64struct smp_ops_t *smp_ops; 65 66static volatile unsigned int cpu_callin_map[NR_CPUS]; 67 68extern unsigned char stab_array[]; 69 70void smp_call_function_interrupt(void); 71 72int smt_enabled_at_boot = 1; 73 74#ifdef CONFIG_PPC_MULTIPLATFORM 75void smp_mpic_message_pass(int target, int msg) 76{ 77 /* make sure we're sending something that translates to an IPI */ 78 if ( msg > 0x3 ){ 79 printk("SMP %d: smp_message_pass: unknown msg %d\n", 80 smp_processor_id(), msg); 81 return; 82 } 83 switch ( target ) 84 { 85 case MSG_ALL: 86 mpic_send_ipi(msg, 0xffffffff); 87 break; 88 case MSG_ALL_BUT_SELF: 89 mpic_send_ipi(msg, 0xffffffff & ~(1 << smp_processor_id())); 90 break; 91 default: 92 mpic_send_ipi(msg, 1 << target); 93 break; 94 } 95} 96 97int __init smp_mpic_probe(void) 98{ 99 int nr_cpus; 100 101 DBG("smp_mpic_probe()...\n"); 102 103 nr_cpus = cpus_weight(cpu_possible_map); 104 105 DBG("nr_cpus: %d\n", nr_cpus); 106 107 if (nr_cpus > 1) 108 mpic_request_ipis(); 109 110 return nr_cpus; 111} 112 113void __devinit smp_mpic_setup_cpu(int cpu) 114{ 115 mpic_setup_this_cpu(); 116} 117 118void __devinit smp_generic_kick_cpu(int nr) 119{ 120 BUG_ON(nr < 0 || nr >= NR_CPUS); 121 122 /* 123 * The processor is currently spinning, waiting for the 124 * cpu_start field to become non-zero After we set cpu_start, 125 * the processor will continue on to secondary_start 126 */ 127 paca[nr].cpu_start = 1; 128 smp_mb(); 129} 130 131#endif /* CONFIG_PPC_MULTIPLATFORM */ 132 133static void __init smp_space_timers(unsigned int max_cpus) 134{ 135 int i; 136 unsigned long offset = tb_ticks_per_jiffy / max_cpus; 137 unsigned long previous_tb = paca[boot_cpuid].next_jiffy_update_tb; 138 139 for_each_cpu(i) { 140 if (i != boot_cpuid) { 141 paca[i].next_jiffy_update_tb = 142 previous_tb + offset; 143 previous_tb = paca[i].next_jiffy_update_tb; 144 } 145 } 146} 147 148void 
smp_message_recv(int msg, struct pt_regs *regs) 149{ 150 switch(msg) { 151 case PPC_MSG_CALL_FUNCTION: 152 smp_call_function_interrupt(); 153 break; 154 case PPC_MSG_RESCHEDULE: 155 /* XXX Do we have to do this? */ 156 set_need_resched(); 157 break; 158#if 0 159 case PPC_MSG_MIGRATE_TASK: 160 /* spare */ 161 break; 162#endif 163#ifdef CONFIG_DEBUGGER 164 case PPC_MSG_DEBUGGER_BREAK: 165 debugger_ipi(regs); 166 break; 167#endif 168 default: 169 printk("SMP %d: smp_message_recv(): unknown msg %d\n", 170 smp_processor_id(), msg); 171 break; 172 } 173} 174 175void smp_send_reschedule(int cpu) 176{ 177 smp_ops->message_pass(cpu, PPC_MSG_RESCHEDULE); 178} 179 180#ifdef CONFIG_DEBUGGER 181void smp_send_debugger_break(int cpu) 182{ 183 smp_ops->message_pass(cpu, PPC_MSG_DEBUGGER_BREAK); 184} 185#endif 186 187static void stop_this_cpu(void *dummy) 188{ 189 local_irq_disable(); 190 while (1) 191 ; 192} 193 194void smp_send_stop(void) 195{ 196 smp_call_function(stop_this_cpu, NULL, 1, 0); 197} 198 199/* 200 * Structure and data for smp_call_function(). This is designed to minimise 201 * static memory requirements. It also looks cleaner. 202 * Stolen from the i386 version. 203 */ 204static __cacheline_aligned_in_smp DEFINE_SPINLOCK(call_lock); 205 206static struct call_data_struct { 207 void (*func) (void *info); 208 void *info; 209 atomic_t started; 210 atomic_t finished; 211 int wait; 212} *call_data; 213 214/* delay of at least 8 seconds on 1GHz cpu */ 215#define SMP_CALL_TIMEOUT (1UL << (30 + 3)) 216 217/* 218 * This function sends a 'generic call function' IPI to all other CPUs 219 * in the system. 220 * 221 * [SUMMARY] Run a function on all other CPUs. 222 * <func> The function to run. This must be fast and non-blocking. 223 * <info> An arbitrary pointer to pass to the function. 224 * <nonatomic> currently unused. 225 * <wait> If true, wait (atomically) until function has completed on other CPUs. 226 * [RETURNS] 0 on success, else a negative status code. 
Does not return until 227 * remote CPUs are nearly ready to execute <<func>> or are or have executed. 228 * 229 * You must not call this function with disabled interrupts or from a 230 * hardware interrupt handler or from a bottom half handler. 231 */ 232int smp_call_function (void (*func) (void *info), void *info, int nonatomic, 233 int wait) 234{ 235 struct call_data_struct data; 236 int ret = -1, cpus; 237 unsigned long timeout; 238 239 /* Can deadlock when called with interrupts disabled */ 240 WARN_ON(irqs_disabled()); 241 242 data.func = func; 243 data.info = info; 244 atomic_set(&data.started, 0); 245 data.wait = wait; 246 if (wait) 247 atomic_set(&data.finished, 0); 248 249 spin_lock(&call_lock); 250 /* Must grab online cpu count with preempt disabled, otherwise 251 * it can change. */ 252 cpus = num_online_cpus() - 1; 253 if (!cpus) { 254 ret = 0; 255 goto out; 256 } 257 258 call_data = &data; 259 smp_wmb(); 260 /* Send a message to all other CPUs and wait for them to respond */ 261 smp_ops->message_pass(MSG_ALL_BUT_SELF, PPC_MSG_CALL_FUNCTION); 262 263 /* Wait for response */ 264 timeout = SMP_CALL_TIMEOUT; 265 while (atomic_read(&data.started) != cpus) { 266 HMT_low(); 267 if (--timeout == 0) { 268 printk("smp_call_function on cpu %d: other cpus not " 269 "responding (%d)\n", smp_processor_id(), 270 atomic_read(&data.started)); 271 debugger(NULL); 272 goto out; 273 } 274 } 275 276 if (wait) { 277 timeout = SMP_CALL_TIMEOUT; 278 while (atomic_read(&data.finished) != cpus) { 279 HMT_low(); 280 if (--timeout == 0) { 281 printk("smp_call_function on cpu %d: other " 282 "cpus not finishing (%d/%d)\n", 283 smp_processor_id(), 284 atomic_read(&data.finished), 285 atomic_read(&data.started)); 286 debugger(NULL); 287 goto out; 288 } 289 } 290 } 291 292 ret = 0; 293 294out: 295 call_data = NULL; 296 HMT_medium(); 297 spin_unlock(&call_lock); 298 return ret; 299} 300 301EXPORT_SYMBOL(smp_call_function); 302 303void smp_call_function_interrupt(void) 304{ 305 void 
(*func) (void *info); 306 void *info; 307 int wait; 308 309 /* call_data will be NULL if the sender timed out while 310 * waiting on us to receive the call. 311 */ 312 if (!call_data) 313 return; 314 315 func = call_data->func; 316 info = call_data->info; 317 wait = call_data->wait; 318 319 if (!wait) 320 smp_mb__before_atomic_inc(); 321 322 /* 323 * Notify initiating CPU that I've grabbed the data and am 324 * about to execute the function 325 */ 326 atomic_inc(&call_data->started); 327 /* 328 * At this point the info structure may be out of scope unless wait==1 329 */ 330 (*func)(info); 331 if (wait) { 332 smp_mb__before_atomic_inc(); 333 atomic_inc(&call_data->finished); 334 } 335} 336 337extern struct gettimeofday_struct do_gtod; 338 339struct thread_info *current_set[NR_CPUS]; 340 341DECLARE_PER_CPU(unsigned int, pvr); 342 343static void __devinit smp_store_cpu_info(int id) 344{ 345 per_cpu(pvr, id) = mfspr(SPRN_PVR); 346} 347 348static void __init smp_create_idle(unsigned int cpu) 349{ 350 struct task_struct *p; 351 352 /* create a process for the processor */ 353 p = fork_idle(cpu); 354 if (IS_ERR(p)) 355 panic("failed fork for CPU %u: %li", cpu, PTR_ERR(p)); 356 paca[cpu].__current = p; 357 current_set[cpu] = p->thread_info; 358} 359 360void __init smp_prepare_cpus(unsigned int max_cpus) 361{ 362 unsigned int cpu; 363 364 DBG("smp_prepare_cpus\n"); 365 366 /* 367 * setup_cpu may need to be called on the boot cpu. We havent 368 * spun any cpus up but lets be paranoid. 369 */ 370 BUG_ON(boot_cpuid != smp_processor_id()); 371 372 /* Fixup boot cpu */ 373 smp_store_cpu_info(boot_cpuid); 374 cpu_callin_map[boot_cpuid] = 1; 375 376#ifndef CONFIG_PPC_ISERIES 377 paca[boot_cpuid].next_jiffy_update_tb = tb_last_stamp = get_tb(); 378 379 /* 380 * Should update do_gtod.stamp_xsec. 
381 * For now we leave it which means the time can be some 382 * number of msecs off until someone does a settimeofday() 383 */ 384 do_gtod.varp->tb_orig_stamp = tb_last_stamp; 385 systemcfg->tb_orig_stamp = tb_last_stamp; 386#endif 387 388 max_cpus = smp_ops->probe(); 389 390 smp_space_timers(max_cpus); 391 392 for_each_cpu(cpu) 393 if (cpu != boot_cpuid) 394 smp_create_idle(cpu); 395} 396 397void __devinit smp_prepare_boot_cpu(void) 398{ 399 BUG_ON(smp_processor_id() != boot_cpuid); 400 401 cpu_set(boot_cpuid, cpu_online_map); 402 403 paca[boot_cpuid].__current = current; 404 current_set[boot_cpuid] = current->thread_info; 405} 406 407#ifdef CONFIG_HOTPLUG_CPU 408/* State of each CPU during hotplug phases */ 409DEFINE_PER_CPU(int, cpu_state) = { 0 }; 410 411int generic_cpu_disable(void) 412{ 413 unsigned int cpu = smp_processor_id(); 414 415 if (cpu == boot_cpuid) 416 return -EBUSY; 417 418 systemcfg->processorCount--; 419 cpu_clear(cpu, cpu_online_map); 420 fixup_irqs(cpu_online_map); 421 return 0; 422} 423 424int generic_cpu_enable(unsigned int cpu) 425{ 426 /* Do the normal bootup if we haven't 427 * already bootstrapped. 
*/ 428 if (system_state != SYSTEM_RUNNING) 429 return -ENOSYS; 430 431 /* get the target out of it's holding state */ 432 per_cpu(cpu_state, cpu) = CPU_UP_PREPARE; 433 smp_wmb(); 434 435 while (!cpu_online(cpu)) 436 cpu_relax(); 437 438 fixup_irqs(cpu_online_map); 439 /* counter the irq disable in fixup_irqs */ 440 local_irq_enable(); 441 return 0; 442} 443 444void generic_cpu_die(unsigned int cpu) 445{ 446 int i; 447 448 for (i = 0; i < 100; i++) { 449 smp_rmb(); 450 if (per_cpu(cpu_state, cpu) == CPU_DEAD) 451 return; 452 msleep(100); 453 } 454 printk(KERN_ERR "CPU%d didn't die...\n", cpu); 455} 456 457void generic_mach_cpu_die(void) 458{ 459 unsigned int cpu; 460 461 local_irq_disable(); 462 cpu = smp_processor_id(); 463 printk(KERN_DEBUG "CPU%d offline\n", cpu); 464 __get_cpu_var(cpu_state) = CPU_DEAD; 465 smp_wmb(); 466 while (__get_cpu_var(cpu_state) != CPU_UP_PREPARE) 467 cpu_relax(); 468 469 flush_tlb_pending(); 470 cpu_set(cpu, cpu_online_map); 471 local_irq_enable(); 472} 473#endif 474 475static int __devinit cpu_enable(unsigned int cpu) 476{ 477 if (smp_ops->cpu_enable) 478 return smp_ops->cpu_enable(cpu); 479 480 return -ENOSYS; 481} 482 483int __devinit __cpu_up(unsigned int cpu) 484{ 485 int c; 486 487 if (!cpu_enable(cpu)) 488 return 0; 489 490 if (smp_ops->cpu_bootable && !smp_ops->cpu_bootable(cpu)) 491 return -EINVAL; 492 493 paca[cpu].default_decr = tb_ticks_per_jiffy; 494 495 if (!cpu_has_feature(CPU_FTR_SLB)) { 496 void *tmp; 497 498 /* maximum of 48 CPUs on machines with a segment table */ 499 if (cpu >= 48) 500 BUG(); 501 502 tmp = &stab_array[PAGE_SIZE * cpu]; 503 memset(tmp, 0, PAGE_SIZE); 504 paca[cpu].stab_addr = (unsigned long)tmp; 505 paca[cpu].stab_real = virt_to_abs(tmp); 506 } 507 508 /* Make sure callin-map entry is 0 (can be leftover a CPU 509 * hotplug 510 */ 511 cpu_callin_map[cpu] = 0; 512 513 /* The information for processor bringup must 514 * be written out to main store before we release 515 * the processor. 
516 */ 517 smp_mb(); 518 519 /* wake up cpus */ 520 DBG("smp: kicking cpu %d\n", cpu); 521 smp_ops->kick_cpu(cpu); 522 523 /* 524 * wait to see if the cpu made a callin (is actually up). 525 * use this value that I found through experimentation. 526 * -- Cort 527 */ 528 if (system_state < SYSTEM_RUNNING) 529 for (c = 5000; c && !cpu_callin_map[cpu]; c--) 530 udelay(100); 531#ifdef CONFIG_HOTPLUG_CPU 532 else 533 /* 534 * CPUs can take much longer to come up in the 535 * hotplug case. Wait five seconds. 536 */ 537 for (c = 25; c && !cpu_callin_map[cpu]; c--) { 538 msleep(200); 539 } 540#endif 541 542 if (!cpu_callin_map[cpu]) { 543 printk("Processor %u is stuck.\n", cpu); 544 return -ENOENT; 545 } 546 547 printk("Processor %u found.\n", cpu); 548 549 if (smp_ops->give_timebase) 550 smp_ops->give_timebase(); 551 552 /* Wait until cpu puts itself in the online map */ 553 while (!cpu_online(cpu)) 554 cpu_relax(); 555 556 return 0; 557} 558 559 560/* Activate a secondary processor. */ 561int __devinit start_secondary(void *unused) 562{ 563 unsigned int cpu = smp_processor_id(); 564 565 atomic_inc(&init_mm.mm_count); 566 current->active_mm = &init_mm; 567 568 smp_store_cpu_info(cpu); 569 set_dec(paca[cpu].default_decr); 570 cpu_callin_map[cpu] = 1; 571 572 smp_ops->setup_cpu(cpu); 573 if (smp_ops->take_timebase) 574 smp_ops->take_timebase(); 575 576 spin_lock(&call_lock); 577 cpu_set(cpu, cpu_online_map); 578 spin_unlock(&call_lock); 579 580 local_irq_enable(); 581 582 cpu_idle(); 583 return 0; 584} 585 586int setup_profiling_timer(unsigned int multiplier) 587{ 588 return 0; 589} 590 591void __init smp_cpus_done(unsigned int max_cpus) 592{ 593 cpumask_t old_mask; 594 595 /* We want the setup_cpu() here to be called from CPU 0, but our 596 * init thread may have been "borrowed" by another CPU in the meantime 597 * se we pin us down to CPU 0 for a short while 598 */ 599 old_mask = current->cpus_allowed; 600 set_cpus_allowed(current, cpumask_of_cpu(boot_cpuid)); 601 602 
smp_ops->setup_cpu(boot_cpuid); 603 604 set_cpus_allowed(current, old_mask); 605} 606 607#ifdef CONFIG_HOTPLUG_CPU 608int __cpu_disable(void) 609{ 610 if (smp_ops->cpu_disable) 611 return smp_ops->cpu_disable(); 612 613 return -ENOSYS; 614} 615 616void __cpu_die(unsigned int cpu) 617{ 618 if (smp_ops->cpu_die) 619 smp_ops->cpu_die(cpu); 620} 621#endif