11da177e4SLinus Torvalds /* 21da177e4SLinus Torvalds * SMP boot-related support 31da177e4SLinus Torvalds * 482975115SDavid Mosberger-Tang * Copyright (C) 1998-2003, 2005 Hewlett-Packard Co 51da177e4SLinus Torvalds * David Mosberger-Tang <davidm@hpl.hp.com> 6e927ecb0SSuresh Siddha * Copyright (C) 2001, 2004-2005 Intel Corp 7e927ecb0SSuresh Siddha * Rohit Seth <rohit.seth@intel.com> 8e927ecb0SSuresh Siddha * Suresh Siddha <suresh.b.siddha@intel.com> 9e927ecb0SSuresh Siddha * Gordon Jin <gordon.jin@intel.com> 10e927ecb0SSuresh Siddha * Ashok Raj <ashok.raj@intel.com> 111da177e4SLinus Torvalds * 121da177e4SLinus Torvalds * 01/05/16 Rohit Seth <rohit.seth@intel.com> Moved SMP booting functions from smp.c to here. 131da177e4SLinus Torvalds * 01/04/27 David Mosberger <davidm@hpl.hp.com> Added ITC synching code. 141da177e4SLinus Torvalds * 02/07/31 David Mosberger <davidm@hpl.hp.com> Switch over to hotplug-CPU boot-sequence. 151da177e4SLinus Torvalds * smp_boot_cpus()/smp_commence() is replaced by 161da177e4SLinus Torvalds * smp_prepare_cpus()/__cpu_up()/smp_cpus_done(). 
17b8d8b883SAshok Raj * 04/06/21 Ashok Raj <ashok.raj@intel.com> Added CPU Hotplug Support 18e927ecb0SSuresh Siddha * 04/12/26 Jin Gordon <gordon.jin@intel.com> 19e927ecb0SSuresh Siddha * 04/12/26 Rohit Seth <rohit.seth@intel.com> 20e927ecb0SSuresh Siddha * Add multi-threading and multi-core detection 21e927ecb0SSuresh Siddha * 05/01/30 Suresh Siddha <suresh.b.siddha@intel.com> 22e927ecb0SSuresh Siddha * Setup cpu_sibling_map and cpu_core_map 231da177e4SLinus Torvalds */ 241da177e4SLinus Torvalds #include <linux/config.h> 251da177e4SLinus Torvalds 261da177e4SLinus Torvalds #include <linux/module.h> 271da177e4SLinus Torvalds #include <linux/acpi.h> 281da177e4SLinus Torvalds #include <linux/bootmem.h> 291da177e4SLinus Torvalds #include <linux/cpu.h> 301da177e4SLinus Torvalds #include <linux/delay.h> 311da177e4SLinus Torvalds #include <linux/init.h> 321da177e4SLinus Torvalds #include <linux/interrupt.h> 331da177e4SLinus Torvalds #include <linux/irq.h> 341da177e4SLinus Torvalds #include <linux/kernel.h> 351da177e4SLinus Torvalds #include <linux/kernel_stat.h> 361da177e4SLinus Torvalds #include <linux/mm.h> 371da177e4SLinus Torvalds #include <linux/notifier.h> 381da177e4SLinus Torvalds #include <linux/smp.h> 391da177e4SLinus Torvalds #include <linux/smp_lock.h> 401da177e4SLinus Torvalds #include <linux/spinlock.h> 411da177e4SLinus Torvalds #include <linux/efi.h> 421da177e4SLinus Torvalds #include <linux/percpu.h> 431da177e4SLinus Torvalds #include <linux/bitops.h> 441da177e4SLinus Torvalds 451da177e4SLinus Torvalds #include <asm/atomic.h> 461da177e4SLinus Torvalds #include <asm/cache.h> 471da177e4SLinus Torvalds #include <asm/current.h> 481da177e4SLinus Torvalds #include <asm/delay.h> 491da177e4SLinus Torvalds #include <asm/ia32.h> 501da177e4SLinus Torvalds #include <asm/io.h> 511da177e4SLinus Torvalds #include <asm/irq.h> 521da177e4SLinus Torvalds #include <asm/machvec.h> 531da177e4SLinus Torvalds #include <asm/mca.h> 541da177e4SLinus Torvalds #include <asm/page.h> 
551da177e4SLinus Torvalds #include <asm/pgalloc.h> 561da177e4SLinus Torvalds #include <asm/pgtable.h> 571da177e4SLinus Torvalds #include <asm/processor.h> 581da177e4SLinus Torvalds #include <asm/ptrace.h> 591da177e4SLinus Torvalds #include <asm/sal.h> 601da177e4SLinus Torvalds #include <asm/system.h> 611da177e4SLinus Torvalds #include <asm/tlbflush.h> 621da177e4SLinus Torvalds #include <asm/unistd.h> 631da177e4SLinus Torvalds 641da177e4SLinus Torvalds #define SMP_DEBUG 0 651da177e4SLinus Torvalds 661da177e4SLinus Torvalds #if SMP_DEBUG 671da177e4SLinus Torvalds #define Dprintk(x...) printk(x) 681da177e4SLinus Torvalds #else 691da177e4SLinus Torvalds #define Dprintk(x...) 701da177e4SLinus Torvalds #endif 711da177e4SLinus Torvalds 72b8d8b883SAshok Raj #ifdef CONFIG_HOTPLUG_CPU 73b8d8b883SAshok Raj /* 74b8d8b883SAshok Raj * Store all idle threads, this can be reused instead of creating 75b8d8b883SAshok Raj * a new thread. Also avoids complicated thread destroy functionality 76b8d8b883SAshok Raj * for idle threads. 77b8d8b883SAshok Raj */ 78b8d8b883SAshok Raj struct task_struct *idle_thread_array[NR_CPUS]; 79b8d8b883SAshok Raj 80b8d8b883SAshok Raj /* 81b8d8b883SAshok Raj * Global array allocated for NR_CPUS at boot time 82b8d8b883SAshok Raj */ 83b8d8b883SAshok Raj struct sal_to_os_boot sal_boot_rendez_state[NR_CPUS]; 84b8d8b883SAshok Raj 85b8d8b883SAshok Raj /* 86b8d8b883SAshok Raj * start_ap in head.S uses this to store current booting cpu 87b8d8b883SAshok Raj * info. 
88b8d8b883SAshok Raj */ 89b8d8b883SAshok Raj struct sal_to_os_boot *sal_state_for_booting_cpu = &sal_boot_rendez_state[0]; 90b8d8b883SAshok Raj 91b8d8b883SAshok Raj #define set_brendez_area(x) (sal_state_for_booting_cpu = &sal_boot_rendez_state[(x)]); 92b8d8b883SAshok Raj 93b8d8b883SAshok Raj #define get_idle_for_cpu(x) (idle_thread_array[(x)]) 94b8d8b883SAshok Raj #define set_idle_for_cpu(x,p) (idle_thread_array[(x)] = (p)) 95b8d8b883SAshok Raj 96b8d8b883SAshok Raj #else 97b8d8b883SAshok Raj 98b8d8b883SAshok Raj #define get_idle_for_cpu(x) (NULL) 99b8d8b883SAshok Raj #define set_idle_for_cpu(x,p) 100b8d8b883SAshok Raj #define set_brendez_area(x) 101b8d8b883SAshok Raj #endif 102b8d8b883SAshok Raj 1031da177e4SLinus Torvalds 1041da177e4SLinus Torvalds /* 1051da177e4SLinus Torvalds * ITC synchronization related stuff: 1061da177e4SLinus Torvalds */ 1071da177e4SLinus Torvalds #define MASTER 0 1081da177e4SLinus Torvalds #define SLAVE (SMP_CACHE_BYTES/8) 1091da177e4SLinus Torvalds 1101da177e4SLinus Torvalds #define NUM_ROUNDS 64 /* magic value */ 1111da177e4SLinus Torvalds #define NUM_ITERS 5 /* likewise */ 1121da177e4SLinus Torvalds 1131da177e4SLinus Torvalds static DEFINE_SPINLOCK(itc_sync_lock); 1141da177e4SLinus Torvalds static volatile unsigned long go[SLAVE + 1]; 1151da177e4SLinus Torvalds 1161da177e4SLinus Torvalds #define DEBUG_ITC_SYNC 0 1171da177e4SLinus Torvalds 1181da177e4SLinus Torvalds extern void __devinit calibrate_delay (void); 1191da177e4SLinus Torvalds extern void start_ap (void); 1201da177e4SLinus Torvalds extern unsigned long ia64_iobase; 1211da177e4SLinus Torvalds 1221da177e4SLinus Torvalds task_t *task_for_booting_cpu; 1231da177e4SLinus Torvalds 1241da177e4SLinus Torvalds /* 1251da177e4SLinus Torvalds * State for each CPU 1261da177e4SLinus Torvalds */ 1271da177e4SLinus Torvalds DEFINE_PER_CPU(int, cpu_state); 1281da177e4SLinus Torvalds 1291da177e4SLinus Torvalds /* Bitmasks of currently online, and possible CPUs */ 1301da177e4SLinus Torvalds 
cpumask_t cpu_online_map; 1311da177e4SLinus Torvalds EXPORT_SYMBOL(cpu_online_map); 13269aa234bSAshok Raj cpumask_t cpu_possible_map = CPU_MASK_NONE; 1331da177e4SLinus Torvalds EXPORT_SYMBOL(cpu_possible_map); 1341da177e4SLinus Torvalds 135e927ecb0SSuresh Siddha cpumask_t cpu_core_map[NR_CPUS] __cacheline_aligned; 136e927ecb0SSuresh Siddha cpumask_t cpu_sibling_map[NR_CPUS] __cacheline_aligned; 137e927ecb0SSuresh Siddha int smp_num_siblings = 1; 138e927ecb0SSuresh Siddha int smp_num_cpucores = 1; 139e927ecb0SSuresh Siddha 1401da177e4SLinus Torvalds /* which logical CPU number maps to which CPU (physical APIC ID) */ 1411da177e4SLinus Torvalds volatile int ia64_cpu_to_sapicid[NR_CPUS]; 1421da177e4SLinus Torvalds EXPORT_SYMBOL(ia64_cpu_to_sapicid); 1431da177e4SLinus Torvalds 1441da177e4SLinus Torvalds static volatile cpumask_t cpu_callin_map; 1451da177e4SLinus Torvalds 1461da177e4SLinus Torvalds struct smp_boot_data smp_boot_data __initdata; 1471da177e4SLinus Torvalds 1481da177e4SLinus Torvalds unsigned long ap_wakeup_vector = -1; /* External Int use to wakeup APs */ 1491da177e4SLinus Torvalds 1501da177e4SLinus Torvalds char __initdata no_int_routing; 1511da177e4SLinus Torvalds 1521da177e4SLinus Torvalds unsigned char smp_int_redirect; /* are INT and IPI redirectable by the chipset? 
*/ 1531da177e4SLinus Torvalds 1541da177e4SLinus Torvalds static int __init 1551da177e4SLinus Torvalds nointroute (char *str) 1561da177e4SLinus Torvalds { 1571da177e4SLinus Torvalds no_int_routing = 1; 1581da177e4SLinus Torvalds printk ("no_int_routing on\n"); 1591da177e4SLinus Torvalds return 1; 1601da177e4SLinus Torvalds } 1611da177e4SLinus Torvalds 1621da177e4SLinus Torvalds __setup("nointroute", nointroute); 1631da177e4SLinus Torvalds 1641da177e4SLinus Torvalds void 1651da177e4SLinus Torvalds sync_master (void *arg) 1661da177e4SLinus Torvalds { 1671da177e4SLinus Torvalds unsigned long flags, i; 1681da177e4SLinus Torvalds 1691da177e4SLinus Torvalds go[MASTER] = 0; 1701da177e4SLinus Torvalds 1711da177e4SLinus Torvalds local_irq_save(flags); 1721da177e4SLinus Torvalds { 1731da177e4SLinus Torvalds for (i = 0; i < NUM_ROUNDS*NUM_ITERS; ++i) { 17482975115SDavid Mosberger-Tang while (!go[MASTER]) 17582975115SDavid Mosberger-Tang cpu_relax(); 1761da177e4SLinus Torvalds go[MASTER] = 0; 1771da177e4SLinus Torvalds go[SLAVE] = ia64_get_itc(); 1781da177e4SLinus Torvalds } 1791da177e4SLinus Torvalds } 1801da177e4SLinus Torvalds local_irq_restore(flags); 1811da177e4SLinus Torvalds } 1821da177e4SLinus Torvalds 1831da177e4SLinus Torvalds /* 1841da177e4SLinus Torvalds * Return the number of cycles by which our itc differs from the itc on the master 1851da177e4SLinus Torvalds * (time-keeper) CPU. A positive number indicates our itc is ahead of the master, 1861da177e4SLinus Torvalds * negative that it is behind. 
1871da177e4SLinus Torvalds */ 1881da177e4SLinus Torvalds static inline long 1891da177e4SLinus Torvalds get_delta (long *rt, long *master) 1901da177e4SLinus Torvalds { 1911da177e4SLinus Torvalds unsigned long best_t0 = 0, best_t1 = ~0UL, best_tm = 0; 1921da177e4SLinus Torvalds unsigned long tcenter, t0, t1, tm; 1931da177e4SLinus Torvalds long i; 1941da177e4SLinus Torvalds 1951da177e4SLinus Torvalds for (i = 0; i < NUM_ITERS; ++i) { 1961da177e4SLinus Torvalds t0 = ia64_get_itc(); 1971da177e4SLinus Torvalds go[MASTER] = 1; 19882975115SDavid Mosberger-Tang while (!(tm = go[SLAVE])) 19982975115SDavid Mosberger-Tang cpu_relax(); 2001da177e4SLinus Torvalds go[SLAVE] = 0; 2011da177e4SLinus Torvalds t1 = ia64_get_itc(); 2021da177e4SLinus Torvalds 2031da177e4SLinus Torvalds if (t1 - t0 < best_t1 - best_t0) 2041da177e4SLinus Torvalds best_t0 = t0, best_t1 = t1, best_tm = tm; 2051da177e4SLinus Torvalds } 2061da177e4SLinus Torvalds 2071da177e4SLinus Torvalds *rt = best_t1 - best_t0; 2081da177e4SLinus Torvalds *master = best_tm - best_t0; 2091da177e4SLinus Torvalds 2101da177e4SLinus Torvalds /* average best_t0 and best_t1 without overflow: */ 2111da177e4SLinus Torvalds tcenter = (best_t0/2 + best_t1/2); 2121da177e4SLinus Torvalds if (best_t0 % 2 + best_t1 % 2 == 2) 2131da177e4SLinus Torvalds ++tcenter; 2141da177e4SLinus Torvalds return tcenter - best_tm; 2151da177e4SLinus Torvalds } 2161da177e4SLinus Torvalds 2171da177e4SLinus Torvalds /* 2181da177e4SLinus Torvalds * Synchronize ar.itc of the current (slave) CPU with the ar.itc of the MASTER CPU 2191da177e4SLinus Torvalds * (normally the time-keeper CPU). We use a closed loop to eliminate the possibility of 2201da177e4SLinus Torvalds * unaccounted-for errors (such as getting a machine check in the middle of a calibration 2211da177e4SLinus Torvalds * step). The basic idea is for the slave to ask the master what itc value it has and to 2221da177e4SLinus Torvalds * read its own itc before and after the master responds. 
 * Each iteration gives us three
 * timestamps:
 *
 *	slave		master
 *
 *	t0 ---\
 *	       ---\
 *		   --->
 *			tm
 *		   /---
 *	       /---
 *	t1 <---
 *
 *
 * The goal is to adjust the slave's ar.itc such that tm falls exactly half-way between t0
 * and t1.  If we achieve this, the clocks are synchronized provided the interconnect
 * between the slave and the master is symmetric.  Even if the interconnect were
 * asymmetric, we would still know that the synchronization error is smaller than the
 * roundtrip latency (t1 - t0).
 *
 * When the interconnect is quiet and symmetric, this lets us synchronize the itc to
 * within one or two cycles.  However, we can only *guarantee* that the synchronization is
 * accurate to within a round-trip time, which is typically in the range of several
 * hundred cycles (e.g., ~500 cycles).  In practice, this means that the itc's are usually
 * almost perfectly synchronized, but we shouldn't assume that the accuracy is much better
 * than half a microsecond or so.
2481da177e4SLinus Torvalds */ 2491da177e4SLinus Torvalds void 2501da177e4SLinus Torvalds ia64_sync_itc (unsigned int master) 2511da177e4SLinus Torvalds { 2521da177e4SLinus Torvalds long i, delta, adj, adjust_latency = 0, done = 0; 2531da177e4SLinus Torvalds unsigned long flags, rt, master_time_stamp, bound; 2541da177e4SLinus Torvalds #if DEBUG_ITC_SYNC 2551da177e4SLinus Torvalds struct { 2561da177e4SLinus Torvalds long rt; /* roundtrip time */ 2571da177e4SLinus Torvalds long master; /* master's timestamp */ 2581da177e4SLinus Torvalds long diff; /* difference between midpoint and master's timestamp */ 2591da177e4SLinus Torvalds long lat; /* estimate of itc adjustment latency */ 2601da177e4SLinus Torvalds } t[NUM_ROUNDS]; 2611da177e4SLinus Torvalds #endif 2621da177e4SLinus Torvalds 2631da177e4SLinus Torvalds /* 2641da177e4SLinus Torvalds * Make sure local timer ticks are disabled while we sync. If 2651da177e4SLinus Torvalds * they were enabled, we'd have to worry about nasty issues 2661da177e4SLinus Torvalds * like setting the ITC ahead of (or a long time before) the 2671da177e4SLinus Torvalds * next scheduled tick. 
2681da177e4SLinus Torvalds */ 2691da177e4SLinus Torvalds BUG_ON((ia64_get_itv() & (1 << 16)) == 0); 2701da177e4SLinus Torvalds 2711da177e4SLinus Torvalds go[MASTER] = 1; 2721da177e4SLinus Torvalds 2731da177e4SLinus Torvalds if (smp_call_function_single(master, sync_master, NULL, 1, 0) < 0) { 2741da177e4SLinus Torvalds printk(KERN_ERR "sync_itc: failed to get attention of CPU %u!\n", master); 2751da177e4SLinus Torvalds return; 2761da177e4SLinus Torvalds } 2771da177e4SLinus Torvalds 27882975115SDavid Mosberger-Tang while (go[MASTER]) 27982975115SDavid Mosberger-Tang cpu_relax(); /* wait for master to be ready */ 2801da177e4SLinus Torvalds 2811da177e4SLinus Torvalds spin_lock_irqsave(&itc_sync_lock, flags); 2821da177e4SLinus Torvalds { 2831da177e4SLinus Torvalds for (i = 0; i < NUM_ROUNDS; ++i) { 2841da177e4SLinus Torvalds delta = get_delta(&rt, &master_time_stamp); 2851da177e4SLinus Torvalds if (delta == 0) { 2861da177e4SLinus Torvalds done = 1; /* let's lock on to this... */ 2871da177e4SLinus Torvalds bound = rt; 2881da177e4SLinus Torvalds } 2891da177e4SLinus Torvalds 2901da177e4SLinus Torvalds if (!done) { 2911da177e4SLinus Torvalds if (i > 0) { 2921da177e4SLinus Torvalds adjust_latency += -delta; 2931da177e4SLinus Torvalds adj = -delta + adjust_latency/4; 2941da177e4SLinus Torvalds } else 2951da177e4SLinus Torvalds adj = -delta; 2961da177e4SLinus Torvalds 2971da177e4SLinus Torvalds ia64_set_itc(ia64_get_itc() + adj); 2981da177e4SLinus Torvalds } 2991da177e4SLinus Torvalds #if DEBUG_ITC_SYNC 3001da177e4SLinus Torvalds t[i].rt = rt; 3011da177e4SLinus Torvalds t[i].master = master_time_stamp; 3021da177e4SLinus Torvalds t[i].diff = delta; 3031da177e4SLinus Torvalds t[i].lat = adjust_latency/4; 3041da177e4SLinus Torvalds #endif 3051da177e4SLinus Torvalds } 3061da177e4SLinus Torvalds } 3071da177e4SLinus Torvalds spin_unlock_irqrestore(&itc_sync_lock, flags); 3081da177e4SLinus Torvalds 3091da177e4SLinus Torvalds #if DEBUG_ITC_SYNC 3101da177e4SLinus Torvalds for (i = 0; i 
< NUM_ROUNDS; ++i) 3111da177e4SLinus Torvalds printk("rt=%5ld master=%5ld diff=%5ld adjlat=%5ld\n", 3121da177e4SLinus Torvalds t[i].rt, t[i].master, t[i].diff, t[i].lat); 3131da177e4SLinus Torvalds #endif 3141da177e4SLinus Torvalds 3151da177e4SLinus Torvalds printk(KERN_INFO "CPU %d: synchronized ITC with CPU %u (last diff %ld cycles, " 3161da177e4SLinus Torvalds "maxerr %lu cycles)\n", smp_processor_id(), master, delta, rt); 3171da177e4SLinus Torvalds } 3181da177e4SLinus Torvalds 3191da177e4SLinus Torvalds /* 3201da177e4SLinus Torvalds * Ideally sets up per-cpu profiling hooks. Doesn't do much now... 3211da177e4SLinus Torvalds */ 3221da177e4SLinus Torvalds static inline void __devinit 3231da177e4SLinus Torvalds smp_setup_percpu_timer (void) 3241da177e4SLinus Torvalds { 3251da177e4SLinus Torvalds } 3261da177e4SLinus Torvalds 3271da177e4SLinus Torvalds static void __devinit 3281da177e4SLinus Torvalds smp_callin (void) 3291da177e4SLinus Torvalds { 3301da177e4SLinus Torvalds int cpuid, phys_id; 3311da177e4SLinus Torvalds extern void ia64_init_itm(void); 3321da177e4SLinus Torvalds 3331da177e4SLinus Torvalds #ifdef CONFIG_PERFMON 3341da177e4SLinus Torvalds extern void pfm_init_percpu(void); 3351da177e4SLinus Torvalds #endif 3361da177e4SLinus Torvalds 3371da177e4SLinus Torvalds cpuid = smp_processor_id(); 3381da177e4SLinus Torvalds phys_id = hard_smp_processor_id(); 3391da177e4SLinus Torvalds 3401da177e4SLinus Torvalds if (cpu_online(cpuid)) { 3411da177e4SLinus Torvalds printk(KERN_ERR "huh, phys CPU#0x%x, CPU#0x%x already present??\n", 3421da177e4SLinus Torvalds phys_id, cpuid); 3431da177e4SLinus Torvalds BUG(); 3441da177e4SLinus Torvalds } 3451da177e4SLinus Torvalds 3461da177e4SLinus Torvalds lock_ipi_calllock(); 3471da177e4SLinus Torvalds cpu_set(cpuid, cpu_online_map); 3481da177e4SLinus Torvalds unlock_ipi_calllock(); 349a9fa06c2SShaohua Li per_cpu(cpu_state, cpuid) = CPU_ONLINE; 3501da177e4SLinus Torvalds 3511da177e4SLinus Torvalds smp_setup_percpu_timer(); 
3521da177e4SLinus Torvalds 3531da177e4SLinus Torvalds ia64_mca_cmc_vector_setup(); /* Setup vector on AP */ 3541da177e4SLinus Torvalds 3551da177e4SLinus Torvalds #ifdef CONFIG_PERFMON 3561da177e4SLinus Torvalds pfm_init_percpu(); 3571da177e4SLinus Torvalds #endif 3581da177e4SLinus Torvalds 3591da177e4SLinus Torvalds local_irq_enable(); 3601da177e4SLinus Torvalds 3611da177e4SLinus Torvalds if (!(sal_platform_features & IA64_SAL_PLATFORM_FEATURE_ITC_DRIFT)) { 3621da177e4SLinus Torvalds /* 3631da177e4SLinus Torvalds * Synchronize the ITC with the BP. Need to do this after irqs are 3641da177e4SLinus Torvalds * enabled because ia64_sync_itc() calls smp_call_function_single(), which 3651da177e4SLinus Torvalds * calls spin_unlock_bh(), which calls spin_unlock_bh(), which calls 3661da177e4SLinus Torvalds * local_bh_enable(), which bugs out if irqs are not enabled... 3671da177e4SLinus Torvalds */ 3681da177e4SLinus Torvalds Dprintk("Going to syncup ITC with BP.\n"); 3691da177e4SLinus Torvalds ia64_sync_itc(0); 3701da177e4SLinus Torvalds } 3711da177e4SLinus Torvalds 3721da177e4SLinus Torvalds /* 3731da177e4SLinus Torvalds * Get our bogomips. 3741da177e4SLinus Torvalds */ 3751da177e4SLinus Torvalds ia64_init_itm(); 3761da177e4SLinus Torvalds calibrate_delay(); 3771da177e4SLinus Torvalds local_cpu_data->loops_per_jiffy = loops_per_jiffy; 3781da177e4SLinus Torvalds 3791da177e4SLinus Torvalds #ifdef CONFIG_IA32_SUPPORT 3801da177e4SLinus Torvalds ia32_gdt_init(); 3811da177e4SLinus Torvalds #endif 3821da177e4SLinus Torvalds 3831da177e4SLinus Torvalds /* 3841da177e4SLinus Torvalds * Allow the master to continue. 3851da177e4SLinus Torvalds */ 3861da177e4SLinus Torvalds cpu_set(cpuid, cpu_callin_map); 3871da177e4SLinus Torvalds Dprintk("Stack on CPU %d at about %p\n",cpuid, &cpuid); 3881da177e4SLinus Torvalds } 3891da177e4SLinus Torvalds 3901da177e4SLinus Torvalds 3911da177e4SLinus Torvalds /* 3921da177e4SLinus Torvalds * Activate a secondary processor. head.S calls this. 
3931da177e4SLinus Torvalds */ 3941da177e4SLinus Torvalds int __devinit 3951da177e4SLinus Torvalds start_secondary (void *unused) 3961da177e4SLinus Torvalds { 3971da177e4SLinus Torvalds /* Early console may use I/O ports */ 3981da177e4SLinus Torvalds ia64_set_kr(IA64_KR_IO_BASE, __pa(ia64_iobase)); 3991da177e4SLinus Torvalds Dprintk("start_secondary: starting CPU 0x%x\n", hard_smp_processor_id()); 4001da177e4SLinus Torvalds efi_map_pal_code(); 4011da177e4SLinus Torvalds cpu_init(); 4025bfb5d69SNick Piggin preempt_disable(); 4031da177e4SLinus Torvalds smp_callin(); 4041da177e4SLinus Torvalds 4051da177e4SLinus Torvalds cpu_idle(); 4061da177e4SLinus Torvalds return 0; 4071da177e4SLinus Torvalds } 4081da177e4SLinus Torvalds 4091da177e4SLinus Torvalds struct pt_regs * __devinit idle_regs(struct pt_regs *regs) 4101da177e4SLinus Torvalds { 4111da177e4SLinus Torvalds return NULL; 4121da177e4SLinus Torvalds } 4131da177e4SLinus Torvalds 4141da177e4SLinus Torvalds struct create_idle { 4151da177e4SLinus Torvalds struct task_struct *idle; 4161da177e4SLinus Torvalds struct completion done; 4171da177e4SLinus Torvalds int cpu; 4181da177e4SLinus Torvalds }; 4191da177e4SLinus Torvalds 4201da177e4SLinus Torvalds void 4211da177e4SLinus Torvalds do_fork_idle(void *_c_idle) 4221da177e4SLinus Torvalds { 4231da177e4SLinus Torvalds struct create_idle *c_idle = _c_idle; 4241da177e4SLinus Torvalds 4251da177e4SLinus Torvalds c_idle->idle = fork_idle(c_idle->cpu); 4261da177e4SLinus Torvalds complete(&c_idle->done); 4271da177e4SLinus Torvalds } 4281da177e4SLinus Torvalds 4291da177e4SLinus Torvalds static int __devinit 4301da177e4SLinus Torvalds do_boot_cpu (int sapicid, int cpu) 4311da177e4SLinus Torvalds { 4321da177e4SLinus Torvalds int timeout; 4331da177e4SLinus Torvalds struct create_idle c_idle = { 4341da177e4SLinus Torvalds .cpu = cpu, 4351da177e4SLinus Torvalds .done = COMPLETION_INITIALIZER(c_idle.done), 4361da177e4SLinus Torvalds }; 4371da177e4SLinus Torvalds DECLARE_WORK(work, 
do_fork_idle, &c_idle); 438b8d8b883SAshok Raj 439b8d8b883SAshok Raj c_idle.idle = get_idle_for_cpu(cpu); 440b8d8b883SAshok Raj if (c_idle.idle) { 441b8d8b883SAshok Raj init_idle(c_idle.idle, cpu); 442b8d8b883SAshok Raj goto do_rest; 443b8d8b883SAshok Raj } 444b8d8b883SAshok Raj 4451da177e4SLinus Torvalds /* 4461da177e4SLinus Torvalds * We can't use kernel_thread since we must avoid to reschedule the child. 4471da177e4SLinus Torvalds */ 4481da177e4SLinus Torvalds if (!keventd_up() || current_is_keventd()) 4491da177e4SLinus Torvalds work.func(work.data); 4501da177e4SLinus Torvalds else { 4511da177e4SLinus Torvalds schedule_work(&work); 4521da177e4SLinus Torvalds wait_for_completion(&c_idle.done); 4531da177e4SLinus Torvalds } 4541da177e4SLinus Torvalds 4551da177e4SLinus Torvalds if (IS_ERR(c_idle.idle)) 4561da177e4SLinus Torvalds panic("failed fork for CPU %d", cpu); 457b8d8b883SAshok Raj 458b8d8b883SAshok Raj set_idle_for_cpu(cpu, c_idle.idle); 459b8d8b883SAshok Raj 460b8d8b883SAshok Raj do_rest: 4611da177e4SLinus Torvalds task_for_booting_cpu = c_idle.idle; 4621da177e4SLinus Torvalds 4631da177e4SLinus Torvalds Dprintk("Sending wakeup vector %lu to AP 0x%x/0x%x.\n", ap_wakeup_vector, cpu, sapicid); 4641da177e4SLinus Torvalds 465b8d8b883SAshok Raj set_brendez_area(cpu); 4661da177e4SLinus Torvalds platform_send_ipi(cpu, ap_wakeup_vector, IA64_IPI_DM_INT, 0); 4671da177e4SLinus Torvalds 4681da177e4SLinus Torvalds /* 4691da177e4SLinus Torvalds * Wait 10s total for the AP to start 4701da177e4SLinus Torvalds */ 4711da177e4SLinus Torvalds Dprintk("Waiting on callin_map ..."); 4721da177e4SLinus Torvalds for (timeout = 0; timeout < 100000; timeout++) { 4731da177e4SLinus Torvalds if (cpu_isset(cpu, cpu_callin_map)) 4741da177e4SLinus Torvalds break; /* It has booted */ 4751da177e4SLinus Torvalds udelay(100); 4761da177e4SLinus Torvalds } 4771da177e4SLinus Torvalds Dprintk("\n"); 4781da177e4SLinus Torvalds 4791da177e4SLinus Torvalds if (!cpu_isset(cpu, cpu_callin_map)) { 
4801da177e4SLinus Torvalds printk(KERN_ERR "Processor 0x%x/0x%x is stuck.\n", cpu, sapicid); 4811da177e4SLinus Torvalds ia64_cpu_to_sapicid[cpu] = -1; 4821da177e4SLinus Torvalds cpu_clear(cpu, cpu_online_map); /* was set in smp_callin() */ 4831da177e4SLinus Torvalds return -EINVAL; 4841da177e4SLinus Torvalds } 4851da177e4SLinus Torvalds return 0; 4861da177e4SLinus Torvalds } 4871da177e4SLinus Torvalds 4881da177e4SLinus Torvalds static int __init 4891da177e4SLinus Torvalds decay (char *str) 4901da177e4SLinus Torvalds { 4911da177e4SLinus Torvalds int ticks; 4921da177e4SLinus Torvalds get_option (&str, &ticks); 4931da177e4SLinus Torvalds return 1; 4941da177e4SLinus Torvalds } 4951da177e4SLinus Torvalds 4961da177e4SLinus Torvalds __setup("decay=", decay); 4971da177e4SLinus Torvalds 4981da177e4SLinus Torvalds /* 4991da177e4SLinus Torvalds * Initialize the logical CPU number to SAPICID mapping 5001da177e4SLinus Torvalds */ 5011da177e4SLinus Torvalds void __init 5021da177e4SLinus Torvalds smp_build_cpu_map (void) 5031da177e4SLinus Torvalds { 5041da177e4SLinus Torvalds int sapicid, cpu, i; 5051da177e4SLinus Torvalds int boot_cpu_id = hard_smp_processor_id(); 5061da177e4SLinus Torvalds 5071da177e4SLinus Torvalds for (cpu = 0; cpu < NR_CPUS; cpu++) { 5081da177e4SLinus Torvalds ia64_cpu_to_sapicid[cpu] = -1; 5091da177e4SLinus Torvalds } 5101da177e4SLinus Torvalds 5111da177e4SLinus Torvalds ia64_cpu_to_sapicid[0] = boot_cpu_id; 5121da177e4SLinus Torvalds cpus_clear(cpu_present_map); 5131da177e4SLinus Torvalds cpu_set(0, cpu_present_map); 5141da177e4SLinus Torvalds cpu_set(0, cpu_possible_map); 5151da177e4SLinus Torvalds for (cpu = 1, i = 0; i < smp_boot_data.cpu_count; i++) { 5161da177e4SLinus Torvalds sapicid = smp_boot_data.cpu_phys_id[i]; 5171da177e4SLinus Torvalds if (sapicid == boot_cpu_id) 5181da177e4SLinus Torvalds continue; 5191da177e4SLinus Torvalds cpu_set(cpu, cpu_present_map); 5201da177e4SLinus Torvalds cpu_set(cpu, cpu_possible_map); 5211da177e4SLinus Torvalds 
ia64_cpu_to_sapicid[cpu] = sapicid; 5221da177e4SLinus Torvalds cpu++; 5231da177e4SLinus Torvalds } 5241da177e4SLinus Torvalds } 5251da177e4SLinus Torvalds 5261da177e4SLinus Torvalds /* 5271da177e4SLinus Torvalds * Cycle through the APs sending Wakeup IPIs to boot each. 5281da177e4SLinus Torvalds */ 5291da177e4SLinus Torvalds void __init 5301da177e4SLinus Torvalds smp_prepare_cpus (unsigned int max_cpus) 5311da177e4SLinus Torvalds { 5321da177e4SLinus Torvalds int boot_cpu_id = hard_smp_processor_id(); 5331da177e4SLinus Torvalds 5341da177e4SLinus Torvalds /* 5351da177e4SLinus Torvalds * Initialize the per-CPU profiling counter/multiplier 5361da177e4SLinus Torvalds */ 5371da177e4SLinus Torvalds 5381da177e4SLinus Torvalds smp_setup_percpu_timer(); 5391da177e4SLinus Torvalds 5401da177e4SLinus Torvalds /* 5411da177e4SLinus Torvalds * We have the boot CPU online for sure. 5421da177e4SLinus Torvalds */ 5431da177e4SLinus Torvalds cpu_set(0, cpu_online_map); 5441da177e4SLinus Torvalds cpu_set(0, cpu_callin_map); 5451da177e4SLinus Torvalds 5461da177e4SLinus Torvalds local_cpu_data->loops_per_jiffy = loops_per_jiffy; 5471da177e4SLinus Torvalds ia64_cpu_to_sapicid[0] = boot_cpu_id; 5481da177e4SLinus Torvalds 5491da177e4SLinus Torvalds printk(KERN_INFO "Boot processor id 0x%x/0x%x\n", 0, boot_cpu_id); 5501da177e4SLinus Torvalds 5511da177e4SLinus Torvalds current_thread_info()->cpu = 0; 5521da177e4SLinus Torvalds 5531da177e4SLinus Torvalds /* 5541da177e4SLinus Torvalds * If SMP should be disabled, then really disable it! 
5551da177e4SLinus Torvalds */ 5561da177e4SLinus Torvalds if (!max_cpus) { 5571da177e4SLinus Torvalds printk(KERN_INFO "SMP mode deactivated.\n"); 5581da177e4SLinus Torvalds cpus_clear(cpu_online_map); 5591da177e4SLinus Torvalds cpus_clear(cpu_present_map); 5601da177e4SLinus Torvalds cpus_clear(cpu_possible_map); 5611da177e4SLinus Torvalds cpu_set(0, cpu_online_map); 5621da177e4SLinus Torvalds cpu_set(0, cpu_present_map); 5631da177e4SLinus Torvalds cpu_set(0, cpu_possible_map); 5641da177e4SLinus Torvalds return; 5651da177e4SLinus Torvalds } 5661da177e4SLinus Torvalds } 5671da177e4SLinus Torvalds 5681da177e4SLinus Torvalds void __devinit smp_prepare_boot_cpu(void) 5691da177e4SLinus Torvalds { 5701da177e4SLinus Torvalds cpu_set(smp_processor_id(), cpu_online_map); 5711da177e4SLinus Torvalds cpu_set(smp_processor_id(), cpu_callin_map); 572a9fa06c2SShaohua Li per_cpu(cpu_state, smp_processor_id()) = CPU_ONLINE; 5731da177e4SLinus Torvalds } 5741da177e4SLinus Torvalds 575e927ecb0SSuresh Siddha /* 576e927ecb0SSuresh Siddha * mt_info[] is a temporary store for all info returned by 577e927ecb0SSuresh Siddha * PAL_LOGICAL_TO_PHYSICAL, to be copied into cpuinfo_ia64 when the 578e927ecb0SSuresh Siddha * specific cpu comes. 
579e927ecb0SSuresh Siddha */ 580e927ecb0SSuresh Siddha static struct { 581e927ecb0SSuresh Siddha __u32 socket_id; 582e927ecb0SSuresh Siddha __u16 core_id; 583e927ecb0SSuresh Siddha __u16 thread_id; 584e927ecb0SSuresh Siddha __u16 proc_fixed_addr; 585e927ecb0SSuresh Siddha __u8 valid; 58666302f21SDavid Mosberger-Tang } mt_info[NR_CPUS] __devinitdata; 587e927ecb0SSuresh Siddha 5881da177e4SLinus Torvalds #ifdef CONFIG_HOTPLUG_CPU 589e927ecb0SSuresh Siddha static inline void 590e927ecb0SSuresh Siddha remove_from_mtinfo(int cpu) 591e927ecb0SSuresh Siddha { 592e927ecb0SSuresh Siddha int i; 593e927ecb0SSuresh Siddha 594e927ecb0SSuresh Siddha for_each_cpu(i) 595e927ecb0SSuresh Siddha if (mt_info[i].valid && mt_info[i].socket_id == 596e927ecb0SSuresh Siddha cpu_data(cpu)->socket_id) 597e927ecb0SSuresh Siddha mt_info[i].valid = 0; 598e927ecb0SSuresh Siddha } 599e927ecb0SSuresh Siddha 600e927ecb0SSuresh Siddha static inline void 601e927ecb0SSuresh Siddha clear_cpu_sibling_map(int cpu) 602e927ecb0SSuresh Siddha { 603e927ecb0SSuresh Siddha int i; 604e927ecb0SSuresh Siddha 605e927ecb0SSuresh Siddha for_each_cpu_mask(i, cpu_sibling_map[cpu]) 606e927ecb0SSuresh Siddha cpu_clear(cpu, cpu_sibling_map[i]); 607e927ecb0SSuresh Siddha for_each_cpu_mask(i, cpu_core_map[cpu]) 608e927ecb0SSuresh Siddha cpu_clear(cpu, cpu_core_map[i]); 609e927ecb0SSuresh Siddha 610e927ecb0SSuresh Siddha cpu_sibling_map[cpu] = cpu_core_map[cpu] = CPU_MASK_NONE; 611e927ecb0SSuresh Siddha } 612e927ecb0SSuresh Siddha 613e927ecb0SSuresh Siddha static void 614e927ecb0SSuresh Siddha remove_siblinginfo(int cpu) 615e927ecb0SSuresh Siddha { 616e927ecb0SSuresh Siddha int last = 0; 617e927ecb0SSuresh Siddha 618e927ecb0SSuresh Siddha if (cpu_data(cpu)->threads_per_core == 1 && 619e927ecb0SSuresh Siddha cpu_data(cpu)->cores_per_socket == 1) { 620e927ecb0SSuresh Siddha cpu_clear(cpu, cpu_core_map[cpu]); 621e927ecb0SSuresh Siddha cpu_clear(cpu, cpu_sibling_map[cpu]); 622e927ecb0SSuresh Siddha return; 623e927ecb0SSuresh 
Siddha } 624e927ecb0SSuresh Siddha 625e927ecb0SSuresh Siddha last = (cpus_weight(cpu_core_map[cpu]) == 1 ? 1 : 0); 626e927ecb0SSuresh Siddha 627e927ecb0SSuresh Siddha /* remove it from all sibling map's */ 628e927ecb0SSuresh Siddha clear_cpu_sibling_map(cpu); 629e927ecb0SSuresh Siddha 630e927ecb0SSuresh Siddha /* if this cpu is the last in the core group, remove all its info 631e927ecb0SSuresh Siddha * from mt_info structure 632e927ecb0SSuresh Siddha */ 633e927ecb0SSuresh Siddha if (last) 634e927ecb0SSuresh Siddha remove_from_mtinfo(cpu); 635e927ecb0SSuresh Siddha } 636e927ecb0SSuresh Siddha 6371da177e4SLinus Torvalds extern void fixup_irqs(void); 6381da177e4SLinus Torvalds /* must be called with cpucontrol mutex held */ 6391da177e4SLinus Torvalds int __cpu_disable(void) 6401da177e4SLinus Torvalds { 6411da177e4SLinus Torvalds int cpu = smp_processor_id(); 6421da177e4SLinus Torvalds 6431da177e4SLinus Torvalds /* 6441da177e4SLinus Torvalds * dont permit boot processor for now 6451da177e4SLinus Torvalds */ 6461da177e4SLinus Torvalds if (cpu == 0) 6471da177e4SLinus Torvalds return -EBUSY; 6481da177e4SLinus Torvalds 649e927ecb0SSuresh Siddha remove_siblinginfo(cpu); 650f3705136SZwane Mwaikambo cpu_clear(cpu, cpu_online_map); 6511da177e4SLinus Torvalds fixup_irqs(); 6521da177e4SLinus Torvalds local_flush_tlb_all(); 653b8d8b883SAshok Raj cpu_clear(cpu, cpu_callin_map); 6541da177e4SLinus Torvalds return 0; 6551da177e4SLinus Torvalds } 6561da177e4SLinus Torvalds 6571da177e4SLinus Torvalds void __cpu_die(unsigned int cpu) 6581da177e4SLinus Torvalds { 6591da177e4SLinus Torvalds unsigned int i; 6601da177e4SLinus Torvalds 6611da177e4SLinus Torvalds for (i = 0; i < 100; i++) { 6621da177e4SLinus Torvalds /* They ack this in play_dead by setting CPU_DEAD */ 6631da177e4SLinus Torvalds if (per_cpu(cpu_state, cpu) == CPU_DEAD) 6641da177e4SLinus Torvalds { 665b8d8b883SAshok Raj printk ("CPU %d is now offline\n", cpu); 6661da177e4SLinus Torvalds return; 6671da177e4SLinus Torvalds } 
6681da177e4SLinus Torvalds msleep(100); 6691da177e4SLinus Torvalds } 6701da177e4SLinus Torvalds printk(KERN_ERR "CPU %u didn't die...\n", cpu); 6711da177e4SLinus Torvalds } 6721da177e4SLinus Torvalds #else /* !CONFIG_HOTPLUG_CPU */ 6731da177e4SLinus Torvalds int __cpu_disable(void) 6741da177e4SLinus Torvalds { 6751da177e4SLinus Torvalds return -ENOSYS; 6761da177e4SLinus Torvalds } 6771da177e4SLinus Torvalds 6781da177e4SLinus Torvalds void __cpu_die(unsigned int cpu) 6791da177e4SLinus Torvalds { 6801da177e4SLinus Torvalds /* We said "no" in __cpu_disable */ 6811da177e4SLinus Torvalds BUG(); 6821da177e4SLinus Torvalds } 6831da177e4SLinus Torvalds #endif /* CONFIG_HOTPLUG_CPU */ 6841da177e4SLinus Torvalds 6851da177e4SLinus Torvalds void 6861da177e4SLinus Torvalds smp_cpus_done (unsigned int dummy) 6871da177e4SLinus Torvalds { 6881da177e4SLinus Torvalds int cpu; 6891da177e4SLinus Torvalds unsigned long bogosum = 0; 6901da177e4SLinus Torvalds 6911da177e4SLinus Torvalds /* 6921da177e4SLinus Torvalds * Allow the user to impress friends. 
6931da177e4SLinus Torvalds */ 6941da177e4SLinus Torvalds 695dc565b52Shawkes@sgi.com for_each_online_cpu(cpu) { 6961da177e4SLinus Torvalds bogosum += cpu_data(cpu)->loops_per_jiffy; 697dc565b52Shawkes@sgi.com } 6981da177e4SLinus Torvalds 6991da177e4SLinus Torvalds printk(KERN_INFO "Total of %d processors activated (%lu.%02lu BogoMIPS).\n", 7001da177e4SLinus Torvalds (int)num_online_cpus(), bogosum/(500000/HZ), (bogosum/(5000/HZ))%100); 7011da177e4SLinus Torvalds } 7021da177e4SLinus Torvalds 703e927ecb0SSuresh Siddha static inline void __devinit 704e927ecb0SSuresh Siddha set_cpu_sibling_map(int cpu) 705e927ecb0SSuresh Siddha { 706e927ecb0SSuresh Siddha int i; 707e927ecb0SSuresh Siddha 708e927ecb0SSuresh Siddha for_each_online_cpu(i) { 709e927ecb0SSuresh Siddha if ((cpu_data(cpu)->socket_id == cpu_data(i)->socket_id)) { 710e927ecb0SSuresh Siddha cpu_set(i, cpu_core_map[cpu]); 711e927ecb0SSuresh Siddha cpu_set(cpu, cpu_core_map[i]); 712e927ecb0SSuresh Siddha if (cpu_data(cpu)->core_id == cpu_data(i)->core_id) { 713e927ecb0SSuresh Siddha cpu_set(i, cpu_sibling_map[cpu]); 714e927ecb0SSuresh Siddha cpu_set(cpu, cpu_sibling_map[i]); 715e927ecb0SSuresh Siddha } 716e927ecb0SSuresh Siddha } 717e927ecb0SSuresh Siddha } 718e927ecb0SSuresh Siddha } 719e927ecb0SSuresh Siddha 7201da177e4SLinus Torvalds int __devinit 7211da177e4SLinus Torvalds __cpu_up (unsigned int cpu) 7221da177e4SLinus Torvalds { 7231da177e4SLinus Torvalds int ret; 7241da177e4SLinus Torvalds int sapicid; 7251da177e4SLinus Torvalds 7261da177e4SLinus Torvalds sapicid = ia64_cpu_to_sapicid[cpu]; 7271da177e4SLinus Torvalds if (sapicid == -1) 7281da177e4SLinus Torvalds return -EINVAL; 7291da177e4SLinus Torvalds 7301da177e4SLinus Torvalds /* 731b8d8b883SAshok Raj * Already booted cpu? not valid anymore since we dont 732b8d8b883SAshok Raj * do idle loop tightspin anymore. 
7331da177e4SLinus Torvalds */ 7341da177e4SLinus Torvalds if (cpu_isset(cpu, cpu_callin_map)) 735b8d8b883SAshok Raj return -EINVAL; 736b8d8b883SAshok Raj 737a9fa06c2SShaohua Li per_cpu(cpu_state, cpu) = CPU_UP_PREPARE; 7381da177e4SLinus Torvalds /* Processor goes to start_secondary(), sets online flag */ 7391da177e4SLinus Torvalds ret = do_boot_cpu(sapicid, cpu); 7401da177e4SLinus Torvalds if (ret < 0) 7411da177e4SLinus Torvalds return ret; 7421da177e4SLinus Torvalds 743e927ecb0SSuresh Siddha if (cpu_data(cpu)->threads_per_core == 1 && 744e927ecb0SSuresh Siddha cpu_data(cpu)->cores_per_socket == 1) { 745e927ecb0SSuresh Siddha cpu_set(cpu, cpu_sibling_map[cpu]); 746e927ecb0SSuresh Siddha cpu_set(cpu, cpu_core_map[cpu]); 747e927ecb0SSuresh Siddha return 0; 748e927ecb0SSuresh Siddha } 749e927ecb0SSuresh Siddha 750e927ecb0SSuresh Siddha set_cpu_sibling_map(cpu); 751e927ecb0SSuresh Siddha 7521da177e4SLinus Torvalds return 0; 7531da177e4SLinus Torvalds } 7541da177e4SLinus Torvalds 7551da177e4SLinus Torvalds /* 7561da177e4SLinus Torvalds * Assume that CPU's have been discovered by some platform-dependent interface. For 7571da177e4SLinus Torvalds * SoftSDV/Lion, that would be ACPI. 7581da177e4SLinus Torvalds * 7591da177e4SLinus Torvalds * Setup of the IPI irq handler is done in irq.c:init_IRQ_SMP(). 7601da177e4SLinus Torvalds */ 7611da177e4SLinus Torvalds void __init 7621da177e4SLinus Torvalds init_smp_config(void) 7631da177e4SLinus Torvalds { 7641da177e4SLinus Torvalds struct fptr { 7651da177e4SLinus Torvalds unsigned long fp; 7661da177e4SLinus Torvalds unsigned long gp; 7671da177e4SLinus Torvalds } *ap_startup; 7681da177e4SLinus Torvalds long sal_ret; 7691da177e4SLinus Torvalds 7701da177e4SLinus Torvalds /* Tell SAL where to drop the AP's. 
*/ 7711da177e4SLinus Torvalds ap_startup = (struct fptr *) start_ap; 7721da177e4SLinus Torvalds sal_ret = ia64_sal_set_vectors(SAL_VECTOR_OS_BOOT_RENDEZ, 7731da177e4SLinus Torvalds ia64_tpa(ap_startup->fp), ia64_tpa(ap_startup->gp), 0, 0, 0, 0); 7741da177e4SLinus Torvalds if (sal_ret < 0) 7751da177e4SLinus Torvalds printk(KERN_ERR "SMP: Can't set SAL AP Boot Rendezvous: %s\n", 7761da177e4SLinus Torvalds ia64_sal_strerror(sal_ret)); 7771da177e4SLinus Torvalds } 7781da177e4SLinus Torvalds 779e927ecb0SSuresh Siddha static inline int __devinit 780e927ecb0SSuresh Siddha check_for_mtinfo_index(void) 781e927ecb0SSuresh Siddha { 782e927ecb0SSuresh Siddha int i; 783e927ecb0SSuresh Siddha 784e927ecb0SSuresh Siddha for_each_cpu(i) 785e927ecb0SSuresh Siddha if (!mt_info[i].valid) 786e927ecb0SSuresh Siddha return i; 787e927ecb0SSuresh Siddha 788e927ecb0SSuresh Siddha return -1; 789e927ecb0SSuresh Siddha } 790e927ecb0SSuresh Siddha 791e927ecb0SSuresh Siddha /* 792e927ecb0SSuresh Siddha * Search the mt_info to find out if this socket's cid/tid information is 793e927ecb0SSuresh Siddha * cached or not. 
If the socket exists, fill in the core_id and thread_id 794e927ecb0SSuresh Siddha * in cpuinfo 795e927ecb0SSuresh Siddha */ 796e927ecb0SSuresh Siddha static int __devinit 797e927ecb0SSuresh Siddha check_for_new_socket(__u16 logical_address, struct cpuinfo_ia64 *c) 798e927ecb0SSuresh Siddha { 799e927ecb0SSuresh Siddha int i; 800e927ecb0SSuresh Siddha __u32 sid = c->socket_id; 801e927ecb0SSuresh Siddha 802e927ecb0SSuresh Siddha for_each_cpu(i) { 803e927ecb0SSuresh Siddha if (mt_info[i].valid && mt_info[i].proc_fixed_addr == logical_address 804e927ecb0SSuresh Siddha && mt_info[i].socket_id == sid) { 805e927ecb0SSuresh Siddha c->core_id = mt_info[i].core_id; 806e927ecb0SSuresh Siddha c->thread_id = mt_info[i].thread_id; 807e927ecb0SSuresh Siddha return 1; /* not a new socket */ 808e927ecb0SSuresh Siddha } 809e927ecb0SSuresh Siddha } 810e927ecb0SSuresh Siddha return 0; 811e927ecb0SSuresh Siddha } 812e927ecb0SSuresh Siddha 813e927ecb0SSuresh Siddha /* 814e927ecb0SSuresh Siddha * identify_siblings(cpu) gets called from identify_cpu. This populates the 815e927ecb0SSuresh Siddha * information related to logical execution units in per_cpu_data structure. 
816e927ecb0SSuresh Siddha */ 817e927ecb0SSuresh Siddha void __devinit 818e927ecb0SSuresh Siddha identify_siblings(struct cpuinfo_ia64 *c) 819e927ecb0SSuresh Siddha { 820e927ecb0SSuresh Siddha s64 status; 821e927ecb0SSuresh Siddha u16 pltid; 822e927ecb0SSuresh Siddha u64 proc_fixed_addr; 823e927ecb0SSuresh Siddha int count, i; 824e927ecb0SSuresh Siddha pal_logical_to_physical_t info; 825e927ecb0SSuresh Siddha 826e927ecb0SSuresh Siddha if (smp_num_cpucores == 1 && smp_num_siblings == 1) 827e927ecb0SSuresh Siddha return; 828e927ecb0SSuresh Siddha 829e927ecb0SSuresh Siddha if ((status = ia64_pal_logical_to_phys(0, &info)) != PAL_STATUS_SUCCESS) { 830e927ecb0SSuresh Siddha printk(KERN_ERR "ia64_pal_logical_to_phys failed with %ld\n", 831e927ecb0SSuresh Siddha status); 832e927ecb0SSuresh Siddha return; 833e927ecb0SSuresh Siddha } 834e927ecb0SSuresh Siddha if ((status = ia64_sal_physical_id_info(&pltid)) != PAL_STATUS_SUCCESS) { 835e927ecb0SSuresh Siddha printk(KERN_ERR "ia64_sal_pltid failed with %ld\n", status); 836e927ecb0SSuresh Siddha return; 837e927ecb0SSuresh Siddha } 838e927ecb0SSuresh Siddha if ((status = ia64_pal_fixed_addr(&proc_fixed_addr)) != PAL_STATUS_SUCCESS) { 839e927ecb0SSuresh Siddha printk(KERN_ERR "ia64_pal_fixed_addr failed with %ld\n", status); 840e927ecb0SSuresh Siddha return; 841e927ecb0SSuresh Siddha } 842e927ecb0SSuresh Siddha 843e927ecb0SSuresh Siddha c->socket_id = (pltid << 8) | info.overview_ppid; 844e927ecb0SSuresh Siddha c->cores_per_socket = info.overview_cpp; 845e927ecb0SSuresh Siddha c->threads_per_core = info.overview_tpc; 846e927ecb0SSuresh Siddha count = c->num_log = info.overview_num_log; 847e927ecb0SSuresh Siddha 848e927ecb0SSuresh Siddha /* If the thread and core id information is already cached, then 849e927ecb0SSuresh Siddha * we will simply update cpu_info and return. Otherwise, we will 850e927ecb0SSuresh Siddha * do the PAL calls and cache core and thread id's of all the siblings. 
851e927ecb0SSuresh Siddha */ 852e927ecb0SSuresh Siddha if (check_for_new_socket(proc_fixed_addr, c)) 853e927ecb0SSuresh Siddha return; 854e927ecb0SSuresh Siddha 855e927ecb0SSuresh Siddha for (i = 0; i < count; i++) { 856e927ecb0SSuresh Siddha int index; 857e927ecb0SSuresh Siddha 858e927ecb0SSuresh Siddha if (i && (status = ia64_pal_logical_to_phys(i, &info)) 859e927ecb0SSuresh Siddha != PAL_STATUS_SUCCESS) { 860e927ecb0SSuresh Siddha printk(KERN_ERR "ia64_pal_logical_to_phys failed" 861e927ecb0SSuresh Siddha " with %ld\n", status); 862e927ecb0SSuresh Siddha return; 863e927ecb0SSuresh Siddha } 864e927ecb0SSuresh Siddha if (info.log2_la == proc_fixed_addr) { 865e927ecb0SSuresh Siddha c->core_id = info.log1_cid; 866e927ecb0SSuresh Siddha c->thread_id = info.log1_tid; 867e927ecb0SSuresh Siddha } 868e927ecb0SSuresh Siddha 869e927ecb0SSuresh Siddha index = check_for_mtinfo_index(); 870e927ecb0SSuresh Siddha /* We will not do the mt_info caching optimization in this case. 871e927ecb0SSuresh Siddha */ 872e927ecb0SSuresh Siddha if (index < 0) 873e927ecb0SSuresh Siddha continue; 874e927ecb0SSuresh Siddha 875e927ecb0SSuresh Siddha mt_info[index].valid = 1; 876e927ecb0SSuresh Siddha mt_info[index].socket_id = c->socket_id; 877e927ecb0SSuresh Siddha mt_info[index].core_id = info.log1_cid; 878e927ecb0SSuresh Siddha mt_info[index].thread_id = info.log1_tid; 879e927ecb0SSuresh Siddha mt_info[index].proc_fixed_addr = info.log2_la; 880e927ecb0SSuresh Siddha } 881e927ecb0SSuresh Siddha } 882