blob: 16c52aaaca3517c37e1e99d25c38ab5ce7756b5e [file] [log] [blame]
Glauber Costa0941ecb2008-03-03 14:12:55 -03001/*
2 * Intel SMP support routines.
3 *
4 * (c) 1995 Alan Cox, Building #3 <alan@redhat.com>
5 * (c) 1998-99, 2000 Ingo Molnar <mingo@redhat.com>
6 * (c) 2002,2003 Andi Kleen, SuSE Labs.
7 *
8 * i386 and x86_64 integration by Glauber Costa <gcosta@redhat.com>
9 *
10 * This code is released under the GNU General Public License version 2 or
11 * later.
12 */
13
Glauber Costaf9e47a12008-03-03 14:12:52 -030014#include <linux/init.h>
15
16#include <linux/mm.h>
17#include <linux/delay.h>
18#include <linux/spinlock.h>
19#include <linux/kernel_stat.h>
20#include <linux/mc146818rtc.h>
21#include <linux/cache.h>
22#include <linux/interrupt.h>
23#include <linux/cpu.h>
24
25#include <asm/mtrr.h>
26#include <asm/tlbflush.h>
27#include <asm/mmu_context.h>
28#include <asm/proto.h>
29#ifdef CONFIG_X86_32
30#include <mach_apic.h>
31#include <mach_ipi.h>
32#else
33#include <asm/mach_apic.h>
34#endif
Glauber Costa0941ecb2008-03-03 14:12:55 -030035/*
36 * Some notes on x86 processor bugs affecting SMP operation:
37 *
38 * Pentium, Pentium Pro, II, III (and all CPUs) have bugs.
39 * The Linux implications for SMP are handled as follows:
40 *
41 * Pentium III / [Xeon]
42 * None of the E1AP-E3AP errata are visible to the user.
43 *
44 * E1AP. see PII A1AP
45 * E2AP. see PII A2AP
46 * E3AP. see PII A3AP
47 *
48 * Pentium II / [Xeon]
49 * None of the A1AP-A3AP errata are visible to the user.
50 *
51 * A1AP. see PPro 1AP
52 * A2AP. see PPro 2AP
53 * A3AP. see PPro 7AP
54 *
55 * Pentium Pro
56 * None of 1AP-9AP errata are visible to the normal user,
57 * except occasional delivery of 'spurious interrupt' as trap #15.
58 * This is very rare and a non-problem.
59 *
60 * 1AP. Linux maps APIC as non-cacheable
61 * 2AP. worked around in hardware
62 * 3AP. fixed in C0 and above steppings microcode update.
63 * Linux does not use excessive STARTUP_IPIs.
64 * 4AP. worked around in hardware
65 * 5AP. symmetric IO mode (normal Linux operation) not affected.
66 * 'noapic' mode has vector 0xf filled out properly.
67 * 6AP. 'noapic' mode might be affected - fixed in later steppings
68 * 7AP. We do not assume writes to the LVT deassering IRQs
69 * 8AP. We do not enable low power mode (deep sleep) during MP bootup
70 * 9AP. We do not use mixed mode
71 *
72 * Pentium
73 * There is a marginal case where REP MOVS on 100MHz SMP
74 * machines with B stepping processors can fail. XXX should provide
75 * an L1cache=Writethrough or L1cache=off option.
76 *
77 * B stepping CPUs may hang. There are hardware work arounds
78 * for this. We warn about it in case your board doesn't have the work
79 * arounds. Basically that's so I can tell anyone with a B stepping
80 * CPU and SMP problems "tough".
81 *
82 * Specific items [From Pentium Processor Specification Update]
83 *
84 * 1AP. Linux doesn't use remote read
85 * 2AP. Linux doesn't trust APIC errors
86 * 3AP. We work around this
87 * 4AP. Linux never generated 3 interrupts of the same priority
88 * to cause a lost local interrupt.
89 * 5AP. Remote read is never used
90 * 6AP. not affected - worked around in hardware
91 * 7AP. not affected - worked around in hardware
92 * 8AP. worked around in hardware - we get explicit CS errors if not
93 * 9AP. only 'noapic' mode affected. Might generate spurious
94 * interrupts, we log only the first one and count the
95 * rest silently.
96 * 10AP. not affected - worked around in hardware
97 * 11AP. Linux reads the APIC between writes to avoid this, as per
98 * the documentation. Make sure you preserve this as it affects
99 * the C stepping chips too.
100 * 12AP. not affected - worked around in hardware
101 * 13AP. not affected - worked around in hardware
102 * 14AP. we always deassert INIT during bootup
103 * 15AP. not affected - worked around in hardware
104 * 16AP. not affected - worked around in hardware
105 * 17AP. not affected - worked around in hardware
106 * 18AP. not affected - worked around in hardware
107 * 19AP. not affected - worked around in BIOS
108 *
109 * If this sounds worrying believe me these bugs are either ___RARE___,
110 * or are signal timing bugs worked around in hardware and there's
111 * about nothing of note with C stepping upwards.
112 */
Glauber Costaf9e47a12008-03-03 14:12:52 -0300113
114/*
115 * this function sends a 'reschedule' IPI to another CPU.
116 * it goes straight through and wastes no time serializing
117 * anything. Worst case is that we lose a reschedule ...
118 */
119static void native_smp_send_reschedule(int cpu)
120{
Gautham R Shenoyf6940102008-03-10 17:44:03 +0530121 if (unlikely(cpu_is_offline(cpu))) {
122 WARN_ON(1);
123 return;
124 }
Glauber Costaf9e47a12008-03-03 14:12:52 -0300125 send_IPI_mask(cpumask_of_cpu(cpu), RESCHEDULE_VECTOR);
126}
127
128/*
129 * Structure and data for smp_call_function(). This is designed to minimise
130 * static memory requirements. It also looks cleaner.
131 */
132static DEFINE_SPINLOCK(call_lock);
133
134struct call_data_struct {
135 void (*func) (void *info);
136 void *info;
137 atomic_t started;
138 atomic_t finished;
139 int wait;
140};
141
142void lock_ipi_call_lock(void)
143{
144 spin_lock_irq(&call_lock);
145}
146
147void unlock_ipi_call_lock(void)
148{
149 spin_unlock_irq(&call_lock);
150}
151
152static struct call_data_struct *call_data;
153
154static void __smp_call_function(void (*func) (void *info), void *info,
155 int nonatomic, int wait)
156{
157 struct call_data_struct data;
158 int cpus = num_online_cpus() - 1;
159
160 if (!cpus)
161 return;
162
163 data.func = func;
164 data.info = info;
165 atomic_set(&data.started, 0);
166 data.wait = wait;
167 if (wait)
168 atomic_set(&data.finished, 0);
169
170 call_data = &data;
171 mb();
172
173 /* Send a message to all other CPUs and wait for them to respond */
174 send_IPI_allbutself(CALL_FUNCTION_VECTOR);
175
176 /* Wait for response */
177 while (atomic_read(&data.started) != cpus)
178 cpu_relax();
179
180 if (wait)
181 while (atomic_read(&data.finished) != cpus)
182 cpu_relax();
183}
184
185
186/**
187 * smp_call_function_mask(): Run a function on a set of other CPUs.
188 * @mask: The set of cpus to run on. Must not include the current cpu.
189 * @func: The function to run. This must be fast and non-blocking.
190 * @info: An arbitrary pointer to pass to the function.
191 * @wait: If true, wait (atomically) until function has completed on other CPUs.
192 *
193 * Returns 0 on success, else a negative status code.
194 *
195 * If @wait is true, then returns once @func has returned; otherwise
196 * it returns just before the target cpu calls @func.
197 *
198 * You must not call this function with disabled interrupts or from a
199 * hardware interrupt handler or from a bottom half handler.
200 */
201static int
202native_smp_call_function_mask(cpumask_t mask,
203 void (*func)(void *), void *info,
204 int wait)
205{
206 struct call_data_struct data;
207 cpumask_t allbutself;
208 int cpus;
209
210 /* Can deadlock when called with interrupts disabled */
211 WARN_ON(irqs_disabled());
212
213 /* Holding any lock stops cpus from going down. */
214 spin_lock(&call_lock);
215
216 allbutself = cpu_online_map;
217 cpu_clear(smp_processor_id(), allbutself);
218
219 cpus_and(mask, mask, allbutself);
220 cpus = cpus_weight(mask);
221
222 if (!cpus) {
223 spin_unlock(&call_lock);
224 return 0;
225 }
226
227 data.func = func;
228 data.info = info;
229 atomic_set(&data.started, 0);
230 data.wait = wait;
231 if (wait)
232 atomic_set(&data.finished, 0);
233
234 call_data = &data;
235 wmb();
236
237 /* Send a message to other CPUs */
238 if (cpus_equal(mask, allbutself))
239 send_IPI_allbutself(CALL_FUNCTION_VECTOR);
240 else
241 send_IPI_mask(mask, CALL_FUNCTION_VECTOR);
242
243 /* Wait for response */
244 while (atomic_read(&data.started) != cpus)
245 cpu_relax();
246
247 if (wait)
248 while (atomic_read(&data.finished) != cpus)
249 cpu_relax();
250 spin_unlock(&call_lock);
251
252 return 0;
253}
254
255static void stop_this_cpu(void *dummy)
256{
257 local_irq_disable();
258 /*
259 * Remove this CPU:
260 */
261 cpu_clear(smp_processor_id(), cpu_online_map);
262 disable_local_APIC();
263 if (hlt_works(smp_processor_id()))
264 for (;;) halt();
265 for (;;);
266}
267
268/*
269 * this function calls the 'stop' function on all other CPUs in the system.
270 */
271
272static void native_smp_send_stop(void)
273{
274 int nolock;
275 unsigned long flags;
276
277 if (reboot_force)
278 return;
279
280 /* Don't deadlock on the call lock in panic */
281 nolock = !spin_trylock(&call_lock);
282 local_irq_save(flags);
283 __smp_call_function(stop_this_cpu, NULL, 0, 0);
284 if (!nolock)
285 spin_unlock(&call_lock);
286 disable_local_APIC();
287 local_irq_restore(flags);
288}
289
290/*
291 * Reschedule call back. Nothing to do,
292 * all the work is done automatically when
293 * we return from the interrupt.
294 */
295void smp_reschedule_interrupt(struct pt_regs *regs)
296{
297 ack_APIC_irq();
298#ifdef CONFIG_X86_32
299 __get_cpu_var(irq_stat).irq_resched_count++;
300#else
301 add_pda(irq_resched_count, 1);
302#endif
303}
304
305void smp_call_function_interrupt(struct pt_regs *regs)
306{
307 void (*func) (void *info) = call_data->func;
308 void *info = call_data->info;
309 int wait = call_data->wait;
310
311 ack_APIC_irq();
312 /*
313 * Notify initiating CPU that I've grabbed the data and am
314 * about to execute the function
315 */
316 mb();
317 atomic_inc(&call_data->started);
318 /*
319 * At this point the info structure may be out of scope unless wait==1
320 */
321 irq_enter();
322 (*func)(info);
323#ifdef CONFIG_X86_32
324 __get_cpu_var(irq_stat).irq_call_count++;
325#else
326 add_pda(irq_call_count, 1);
327#endif
328 irq_exit();
329
330 if (wait) {
331 mb();
332 atomic_inc(&call_data->finished);
333 }
334}
335
336struct smp_ops smp_ops = {
337 .smp_prepare_boot_cpu = native_smp_prepare_boot_cpu,
338 .smp_prepare_cpus = native_smp_prepare_cpus,
339 .cpu_up = native_cpu_up,
340 .smp_cpus_done = native_smp_cpus_done,
341
342 .smp_send_stop = native_smp_send_stop,
343 .smp_send_reschedule = native_smp_send_reschedule,
344 .smp_call_function_mask = native_smp_call_function_mask,
345};
346EXPORT_SYMBOL_GPL(smp_ops);
347