blob: 2589ea4c60ce145bfadbb2b925e6f81f85957bd8 [file] [log] [blame]
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -08001#include <linux/module.h>
Al Virof6a57032006-10-18 01:47:25 -04002#include <linux/sched.h>
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +02003#include <linux/mutex.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -08004#include <linux/list.h>
Jan Beulich8b5a10f2009-08-19 08:40:48 +01005#include <linux/stringify.h>
Andi Kleen19d36cc2007-07-22 11:12:31 +02006#include <linux/kprobes.h>
7#include <linux/mm.h>
8#include <linux/vmalloc.h>
Masami Hiramatsu3945dab2009-03-06 10:37:22 -05009#include <linux/memory.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -080010#include <asm/alternative.h>
11#include <asm/sections.h>
Andi Kleen19d36cc2007-07-22 11:12:31 +020012#include <asm/pgtable.h>
Andi Kleen8f4e9562007-07-22 11:12:32 +020013#include <asm/mce.h>
14#include <asm/nmi.h>
Dave Jonesb0979762007-10-14 22:57:45 +020015#include <asm/vsyscall.h>
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -050016#include <asm/cacheflush.h>
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -050017#include <asm/tlbflush.h>
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -050018#include <asm/io.h>
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -050019#include <asm/fixmap.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -080020
/* Upper bound, in bytes, on a single patch site (size of the on-stack patch buffers). */
#define MAX_PATCH_LEN	(255 - 1)
22
#ifdef CONFIG_HOTPLUG_CPU
/*
 * Non-zero selects "patch once" mode: SMP lock prefixes are fixed up a
 * single time and no per-module bookkeeping is kept for later switching.
 */
static int smp_alt_once;

/* Handler for the "smp-alt-boot" kernel parameter: force patch-once mode. */
static int __init bootonly(char *str)
{
	smp_alt_once = 1;

	return 1;
}
__setup("smp-alt-boot", bootonly);
#else
/* Without CPU hotplug, patch-once mode is always in effect. */
#define smp_alt_once 1
#endif
35
Jan Beulich8b5a10f2009-08-19 08:40:48 +010036static int __initdata_or_module debug_alternative;
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020037
Gerd Hoffmannd167a512006-06-26 13:56:16 +020038static int __init debug_alt(char *str)
39{
40 debug_alternative = 1;
41 return 1;
42}
Gerd Hoffmannd167a512006-06-26 13:56:16 +020043__setup("debug-alternative", debug_alt);
44
Jan Beulich09488162007-07-21 17:10:25 +020045static int noreplace_smp;
46
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020047static int __init setup_noreplace_smp(char *str)
48{
49 noreplace_smp = 1;
50 return 1;
51}
52__setup("noreplace-smp", setup_noreplace_smp);
53
#ifdef CONFIG_PARAVIRT
/* Non-zero makes apply_paravirt() leave every patch site untouched. */
static int __initdata_or_module noreplace_paravirt;

/* Handler for the "noreplace-paravirt" kernel parameter. */
static int __init setup_noreplace_paravirt(char *str)
{
	noreplace_paravirt = 1;

	return 1;
}
__setup("noreplace-paravirt", setup_noreplace_paravirt);
#endif
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020064
/*
 * Debug printk, emitted only when debug_alternative is set.
 *
 * The body is wrapped in do { } while (0) so the macro behaves as a single
 * statement: used as the body of an unbraced "if", a following "else" binds
 * to the caller's "if" rather than to the macro's internal one.  "##args"
 * additionally allows a format string with no further arguments.
 */
#define DPRINTK(fmt, args...)					\
	do {							\
		if (debug_alternative)				\
			printk(KERN_DEBUG fmt, ##args);		\
	} while (0)
67
#if defined(GENERIC_NOP1) && !defined(CONFIG_X86_64)
/*
 * The NOP encodings are only available from the headers as inline-assembly
 * strings, so the byte blob is emitted with a top-level asm statement and
 * then indexed from C.
 */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nintelnops: "
	GENERIC_NOP1 GENERIC_NOP2 GENERIC_NOP3 GENERIC_NOP4
	GENERIC_NOP5 GENERIC_NOP6 GENERIC_NOP7 GENERIC_NOP8
	"\t.previous");
extern const unsigned char intelnops[];

/*
 * intel_nops[n] points at the n-byte NOP inside the blob; slot 0 is unused.
 * Offsets are running sums of the preceding NOP lengths (1, 2, 3, ...).
 */
static const unsigned char *const __initconst_or_module
intel_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = intelnops,
	[2] = intelnops + 1,
	[3] = intelnops + 3,
	[4] = intelnops + 6,
	[5] = intelnops + 10,
	[6] = intelnops + 15,
	[7] = intelnops + 21,
	[8] = intelnops + 28,
};
#endif
90
#ifdef K8_NOP1
/* Blob of K8 NOP encodings, emitted back to back in increasing length. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk8nops: "
	K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4
	K8_NOP5 K8_NOP6 K8_NOP7 K8_NOP8
	"\t.previous");
extern const unsigned char k8nops[];

/*
 * k8_nops[n] points at the n-byte NOP inside the blob; slot 0 is unused.
 * Offsets are running sums of the preceding NOP lengths (1, 2, 3, ...).
 */
static const unsigned char *const __initconst_or_module
k8_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = k8nops,
	[2] = k8nops + 1,
	[3] = k8nops + 3,
	[4] = k8nops + 6,
	[5] = k8nops + 10,
	[6] = k8nops + 15,
	[7] = k8nops + 21,
	[8] = k8nops + 28,
};
#endif
110
#if defined(K7_NOP1) && !defined(CONFIG_X86_64)
/* Blob of K7 NOP encodings, emitted back to back in increasing length. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk7nops: "
	K7_NOP1 K7_NOP2 K7_NOP3 K7_NOP4
	K7_NOP5 K7_NOP6 K7_NOP7 K7_NOP8
	"\t.previous");
extern const unsigned char k7nops[];

/*
 * k7_nops[n] points at the n-byte NOP inside the blob; slot 0 is unused.
 * Offsets are running sums of the preceding NOP lengths (1, 2, 3, ...).
 */
static const unsigned char *const __initconst_or_module
k7_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = k7nops,
	[2] = k7nops + 1,
	[3] = k7nops + 3,
	[4] = k7nops + 6,
	[5] = k7nops + 10,
	[6] = k7nops + 15,
	[7] = k7nops + 21,
	[8] = k7nops + 28,
};
#endif
130
#ifdef P6_NOP1
/* Blob of P6 NOP encodings, emitted back to back in increasing length. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\np6nops: "
	P6_NOP1 P6_NOP2 P6_NOP3 P6_NOP4
	P6_NOP5 P6_NOP6 P6_NOP7 P6_NOP8
	"\t.previous");
extern const unsigned char p6nops[];

/*
 * p6_nops[n] points at the n-byte NOP inside the blob; slot 0 is unused.
 * Offsets are running sums of the preceding NOP lengths (1, 2, 3, ...).
 */
static const unsigned char *const __initconst_or_module
p6_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = p6nops,
	[2] = p6nops + 1,
	[3] = p6nops + 3,
	[4] = p6nops + 6,
	[5] = p6nops + 10,
	[6] = p6nops + 15,
	[7] = p6nops + 21,
	[8] = p6nops + 28,
};
#endif
150
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200151#ifdef CONFIG_X86_64
152
153extern char __vsyscall_0;
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100154static const unsigned char *const *__init_or_module find_nop_table(void)
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200155{
H. Peter Anvinf31d7312008-08-18 17:50:33 -0700156 if (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL &&
157 boot_cpu_has(X86_FEATURE_NOPL))
158 return p6_nops;
159 else
160 return k8_nops;
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200161}
162
163#else /* CONFIG_X86_64 */
164
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100165static const unsigned char *const *__init_or_module find_nop_table(void)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800166{
H. Peter Anvinf31d7312008-08-18 17:50:33 -0700167 if (boot_cpu_has(X86_FEATURE_K8))
168 return k8_nops;
169 else if (boot_cpu_has(X86_FEATURE_K7))
170 return k7_nops;
171 else if (boot_cpu_has(X86_FEATURE_NOPL))
172 return p6_nops;
173 else
174 return intel_nops;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800175}
176
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200177#endif /* CONFIG_X86_64 */
178
Andi Kleenab144f52007-08-10 22:31:03 +0200179/* Use this to add nops to a buffer, then text_poke the whole buffer. */
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100180static void __init_or_module add_nops(void *insns, unsigned int len)
Rusty Russell139ec7c2006-12-07 02:14:08 +0100181{
Jan Beulich121d7bf2007-10-17 18:04:37 +0200182 const unsigned char *const *noptable = find_nop_table();
Rusty Russell139ec7c2006-12-07 02:14:08 +0100183
184 while (len > 0) {
185 unsigned int noplen = len;
186 if (noplen > ASM_NOP_MAX)
187 noplen = ASM_NOP_MAX;
Andi Kleenab144f52007-08-10 22:31:03 +0200188 memcpy(insns, noptable[noplen], noplen);
Rusty Russell139ec7c2006-12-07 02:14:08 +0100189 insns += noplen;
190 len -= noplen;
191 }
192}
193
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200194extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200195extern u8 *__smp_locks[], *__smp_locks_end[];
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100196static void *text_poke_early(void *addr, const void *opcode, size_t len);
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200197
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800198/* Replace instructions with better alternatives for this CPU type.
199 This runs before SMP is initialized to avoid SMP problems with
200 self modifying code. This implies that assymetric systems where
201 APs have less capabilities than the boot processor are not handled.
202 Tough. Make sure you disable such features by hand. */
203
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100204void __init_or_module apply_alternatives(struct alt_instr *start,
205 struct alt_instr *end)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800206{
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800207 struct alt_instr *a;
Jan Beulich1b1d9252009-12-18 16:12:56 +0000208 u8 insnbuf[MAX_PATCH_LEN];
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800209
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800210 DPRINTK("%s: alt table %p -> %p\n", __func__, start, end);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800211 for (a = start; a < end; a++) {
Andi Kleenab144f52007-08-10 22:31:03 +0200212 u8 *instr = a->instr;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800213 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleenab144f52007-08-10 22:31:03 +0200214 BUG_ON(a->instrlen > sizeof(insnbuf));
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800215 if (!boot_cpu_has(a->cpuid))
216 continue;
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200217#ifdef CONFIG_X86_64
218 /* vsyscall code is not mapped yet. resolve it manually. */
219 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END) {
220 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
221 DPRINTK("%s: vsyscall fixup: %p => %p\n",
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800222 __func__, a->instr, instr);
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200223 }
224#endif
Andi Kleenab144f52007-08-10 22:31:03 +0200225 memcpy(insnbuf, a->replacement, a->replacementlen);
Jan Beulich1b1d9252009-12-18 16:12:56 +0000226 if (*insnbuf == 0xe8 && a->replacementlen == 5)
227 *(s32 *)(insnbuf + 1) += a->replacement - a->instr;
Andi Kleenab144f52007-08-10 22:31:03 +0200228 add_nops(insnbuf + a->replacementlen,
229 a->instrlen - a->replacementlen);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500230 text_poke_early(instr, insnbuf, a->instrlen);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800231 }
232}
233
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700234#ifdef CONFIG_SMP
235
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800236static void alternatives_smp_lock(u8 **start, u8 **end, u8 *text, u8 *text_end)
237{
238 u8 **ptr;
239
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500240 mutex_lock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800241 for (ptr = start; ptr < end; ptr++) {
242 if (*ptr < text)
243 continue;
244 if (*ptr > text_end)
245 continue;
Mathieu Desnoyersf88f07e2008-08-14 16:58:15 -0400246 /* turn DS segment override prefix into lock prefix */
247 text_poke(*ptr, ((unsigned char []){0xf0}), 1);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800248 };
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500249 mutex_unlock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800250}
251
252static void alternatives_smp_unlock(u8 **start, u8 **end, u8 *text, u8 *text_end)
253{
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800254 u8 **ptr;
255
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200256 if (noreplace_smp)
257 return;
258
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500259 mutex_lock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800260 for (ptr = start; ptr < end; ptr++) {
261 if (*ptr < text)
262 continue;
263 if (*ptr > text_end)
264 continue;
Mathieu Desnoyersf88f07e2008-08-14 16:58:15 -0400265 /* turn lock prefix into DS segment override prefix */
266 text_poke(*ptr, ((unsigned char []){0x3E}), 1);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800267 };
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500268 mutex_unlock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800269}
270
271struct smp_alt_module {
272 /* what is this ??? */
273 struct module *mod;
274 char *name;
275
276 /* ptrs to lock prefixes */
277 u8 **locks;
278 u8 **locks_end;
279
280 /* .text segment, needed to avoid patching init code ;) */
281 u8 *text;
282 u8 *text_end;
283
284 struct list_head next;
285};
286static LIST_HEAD(smp_alt_modules);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200287static DEFINE_MUTEX(smp_alt);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100288static int smp_mode = 1; /* protected by smp_alt */
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800289
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100290void __init_or_module alternatives_smp_module_add(struct module *mod,
291 char *name,
292 void *locks, void *locks_end,
293 void *text, void *text_end)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800294{
295 struct smp_alt_module *smp;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800296
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200297 if (noreplace_smp)
298 return;
299
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800300 if (smp_alt_once) {
301 if (boot_cpu_has(X86_FEATURE_UP))
302 alternatives_smp_unlock(locks, locks_end,
303 text, text_end);
304 return;
305 }
306
307 smp = kzalloc(sizeof(*smp), GFP_KERNEL);
308 if (NULL == smp)
309 return; /* we'll run the (safe but slow) SMP code then ... */
310
311 smp->mod = mod;
312 smp->name = name;
313 smp->locks = locks;
314 smp->locks_end = locks_end;
315 smp->text = text;
316 smp->text_end = text_end;
317 DPRINTK("%s: locks %p -> %p, text %p -> %p, name %s\n",
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800318 __func__, smp->locks, smp->locks_end,
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800319 smp->text, smp->text_end, smp->name);
320
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200321 mutex_lock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800322 list_add_tail(&smp->next, &smp_alt_modules);
323 if (boot_cpu_has(X86_FEATURE_UP))
324 alternatives_smp_unlock(smp->locks, smp->locks_end,
325 smp->text, smp->text_end);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200326 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800327}
328
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100329void __init_or_module alternatives_smp_module_del(struct module *mod)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800330{
331 struct smp_alt_module *item;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800332
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200333 if (smp_alt_once || noreplace_smp)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800334 return;
335
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200336 mutex_lock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800337 list_for_each_entry(item, &smp_alt_modules, next) {
338 if (mod != item->mod)
339 continue;
340 list_del(&item->next);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200341 mutex_unlock(&smp_alt);
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800342 DPRINTK("%s: %s\n", __func__, item->name);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800343 kfree(item);
344 return;
345 }
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200346 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800347}
348
349void alternatives_smp_switch(int smp)
350{
351 struct smp_alt_module *mod;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800352
Ingo Molnar3047e992006-07-03 00:24:57 -0700353#ifdef CONFIG_LOCKDEP
354 /*
Ingo Molnar17abecf2008-01-30 13:33:24 +0100355 * Older binutils section handling bug prevented
356 * alternatives-replacement from working reliably.
357 *
358 * If this still occurs then you should see a hang
359 * or crash shortly after this line:
Ingo Molnar3047e992006-07-03 00:24:57 -0700360 */
Ingo Molnar17abecf2008-01-30 13:33:24 +0100361 printk("lockdep: fixing up alternatives.\n");
Ingo Molnar3047e992006-07-03 00:24:57 -0700362#endif
363
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200364 if (noreplace_smp || smp_alt_once)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800365 return;
366 BUG_ON(!smp && (num_online_cpus() > 1));
367
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200368 mutex_lock(&smp_alt);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100369
370 /*
371 * Avoid unnecessary switches because it forces JIT based VMs to
372 * throw away all cached translations, which can be quite costly.
373 */
374 if (smp == smp_mode) {
375 /* nothing */
376 } else if (smp) {
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800377 printk(KERN_INFO "SMP alternatives: switching to SMP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100378 clear_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
379 clear_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800380 list_for_each_entry(mod, &smp_alt_modules, next)
381 alternatives_smp_lock(mod->locks, mod->locks_end,
382 mod->text, mod->text_end);
383 } else {
384 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100385 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
386 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800387 list_for_each_entry(mod, &smp_alt_modules, next)
388 alternatives_smp_unlock(mod->locks, mod->locks_end,
389 mod->text, mod->text_end);
390 }
Andi Kleenca74a6f2008-01-30 13:33:17 +0100391 smp_mode = smp;
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200392 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800393}
394
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700395#endif
396
Rusty Russell139ec7c2006-12-07 02:14:08 +0100397#ifdef CONFIG_PARAVIRT
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100398void __init_or_module apply_paravirt(struct paravirt_patch_site *start,
399 struct paravirt_patch_site *end)
Rusty Russell139ec7c2006-12-07 02:14:08 +0100400{
Jeremy Fitzhardinge98de0322007-05-02 19:27:14 +0200401 struct paravirt_patch_site *p;
Andi Kleenab144f52007-08-10 22:31:03 +0200402 char insnbuf[MAX_PATCH_LEN];
Rusty Russell139ec7c2006-12-07 02:14:08 +0100403
Jeremy Fitzhardinge959b4fd2007-05-02 19:27:16 +0200404 if (noreplace_paravirt)
405 return;
406
Rusty Russell139ec7c2006-12-07 02:14:08 +0100407 for (p = start; p < end; p++) {
408 unsigned int used;
409
Andi Kleenab144f52007-08-10 22:31:03 +0200410 BUG_ON(p->len > MAX_PATCH_LEN);
Chris Wrightd34fda42007-08-18 14:31:41 -0700411 /* prep the buffer with the original instructions */
412 memcpy(insnbuf, p->instr, p->len);
Jeremy Fitzhardinge93b1eab2007-10-16 11:51:29 -0700413 used = pv_init_ops.patch(p->instrtype, p->clobbers, insnbuf,
414 (unsigned long)p->instr, p->len);
Jeremy Fitzhardinge7f63c412007-05-02 19:27:13 +0200415
Jeremy Fitzhardinge63f70272007-05-02 19:27:14 +0200416 BUG_ON(used > p->len);
417
Rusty Russell139ec7c2006-12-07 02:14:08 +0100418 /* Pad the rest with nops */
Andi Kleenab144f52007-08-10 22:31:03 +0200419 add_nops(insnbuf + used, p->len - used);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500420 text_poke_early(p->instr, insnbuf, p->len);
Rusty Russell139ec7c2006-12-07 02:14:08 +0100421 }
Rusty Russell139ec7c2006-12-07 02:14:08 +0100422}
Jeremy Fitzhardinge98de0322007-05-02 19:27:14 +0200423extern struct paravirt_patch_site __start_parainstructions[],
Rusty Russell139ec7c2006-12-07 02:14:08 +0100424 __stop_parainstructions[];
425#endif /* CONFIG_PARAVIRT */
426
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800427void __init alternative_instructions(void)
428{
Andi Kleen8f4e9562007-07-22 11:12:32 +0200429 /* The patching is not fully atomic, so try to avoid local interruptions
430 that might execute the to be patched code.
431 Other CPUs are not running. */
432 stop_nmi();
Andi Kleen123aa762009-02-12 13:39:27 +0100433
434 /*
435 * Don't stop machine check exceptions while patching.
436 * MCEs only happen when something got corrupted and in this
437 * case we must do something about the corruption.
438 * Ignoring it is worse than a unlikely patching race.
439 * Also machine checks tend to be broadcast and if one CPU
440 * goes into machine check the others follow quickly, so we don't
441 * expect a machine check to cause undue problems during to code
442 * patching.
443 */
Andi Kleen8f4e9562007-07-22 11:12:32 +0200444
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800445 apply_alternatives(__alt_instructions, __alt_instructions_end);
446
447 /* switch to patch-once-at-boottime-only mode and free the
448 * tables in case we know the number of CPUs will never ever
449 * change */
450#ifdef CONFIG_HOTPLUG_CPU
451 if (num_possible_cpus() < 2)
452 smp_alt_once = 1;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800453#endif
454
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700455#ifdef CONFIG_SMP
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800456 if (smp_alt_once) {
457 if (1 == num_possible_cpus()) {
458 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100459 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
460 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
461
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800462 alternatives_smp_unlock(__smp_locks, __smp_locks_end,
463 _text, _etext);
464 }
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800465 } else {
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800466 alternatives_smp_module_add(NULL, "core kernel",
467 __smp_locks, __smp_locks_end,
468 _text, _etext);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100469
470 /* Only switch to UP mode if we don't immediately boot others */
Thomas Gleixner649c6652008-10-05 16:52:24 +0200471 if (num_present_cpus() == 1 || setup_max_cpus <= 1)
Andi Kleenca74a6f2008-01-30 13:33:17 +0100472 alternatives_smp_switch(0);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800473 }
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700474#endif
Jeremy Fitzhardinge441d40d2007-05-02 19:27:16 +0200475 apply_paravirt(__parainstructions, __parainstructions_end);
Andi Kleen8f4e9562007-07-22 11:12:32 +0200476
Fengguang Wuf68fd5f2007-10-17 18:04:34 +0200477 if (smp_alt_once)
478 free_init_pages("SMP alternatives",
479 (unsigned long)__smp_locks,
480 (unsigned long)__smp_locks_end);
481
Andi Kleen8f4e9562007-07-22 11:12:32 +0200482 restart_nmi();
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800483}
Andi Kleen19d36cc2007-07-22 11:12:31 +0200484
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500485/**
486 * text_poke_early - Update instructions on a live kernel at boot time
487 * @addr: address to modify
488 * @opcode: source of the copy
489 * @len: length to copy
490 *
Andi Kleen19d36cc2007-07-22 11:12:31 +0200491 * When you use this code to patch more than one byte of an instruction
492 * you need to make sure that other CPUs cannot execute this code in parallel.
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500493 * Also no thread must be currently preempted in the middle of these
494 * instructions. And on the local CPU you need to be protected again NMI or MCE
495 * handlers seeing an inconsistent instruction while you patch.
Andi Kleen19d36cc2007-07-22 11:12:31 +0200496 */
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100497static void *__init_or_module text_poke_early(void *addr, const void *opcode,
498 size_t len)
Andi Kleen19d36cc2007-07-22 11:12:31 +0200499{
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500500 unsigned long flags;
501 local_irq_save(flags);
Andi Kleen19d36cc2007-07-22 11:12:31 +0200502 memcpy(addr, opcode, len);
503 sync_core();
Ben Hutchings5367b682009-09-10 02:53:50 +0100504 local_irq_restore(flags);
Andi Kleena534b672007-09-06 16:59:52 +0200505 /* Could also do a CLFLUSH here to speed up CPU recovery; but
506 that causes hangs on some VIA CPUs. */
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500507 return addr;
508}
509
510/**
511 * text_poke - Update instructions on a live kernel
512 * @addr: address to modify
513 * @opcode: source of the copy
514 * @len: length to copy
515 *
516 * Only atomic text poke/set should be allowed when not doing early patching.
517 * It means the size must be writable atomically and the address must be aligned
518 * in a way that permits an atomic write. It also makes sure we fit on a single
519 * page.
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500520 *
521 * Note: Must be called under text_mutex.
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500522 */
523void *__kprobes text_poke(void *addr, const void *opcode, size_t len)
524{
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500525 unsigned long flags;
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500526 char *vaddr;
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400527 struct page *pages[2];
528 int i;
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500529
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400530 if (!core_kernel_text((unsigned long)addr)) {
531 pages[0] = vmalloc_to_page(addr);
532 pages[1] = vmalloc_to_page(addr + PAGE_SIZE);
Mathieu Desnoyers15a601e2008-03-12 11:54:16 -0400533 } else {
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400534 pages[0] = virt_to_page(addr);
Ingo Molnar00c6b2d2008-04-25 17:07:03 +0200535 WARN_ON(!PageReserved(pages[0]));
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400536 pages[1] = virt_to_page(addr + PAGE_SIZE);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500537 }
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400538 BUG_ON(!pages[0]);
Masami Hiramatsu7cf49422009-03-09 12:40:40 -0400539 local_irq_save(flags);
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500540 set_fixmap(FIX_TEXT_POKE0, page_to_phys(pages[0]));
541 if (pages[1])
542 set_fixmap(FIX_TEXT_POKE1, page_to_phys(pages[1]));
543 vaddr = (char *)fix_to_virt(FIX_TEXT_POKE0);
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400544 memcpy(&vaddr[(unsigned long)addr & ~PAGE_MASK], opcode, len);
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500545 clear_fixmap(FIX_TEXT_POKE0);
546 if (pages[1])
547 clear_fixmap(FIX_TEXT_POKE1);
548 local_flush_tlb();
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500549 sync_core();
550 /* Could also do a CLFLUSH here to speed up CPU recovery; but
551 that causes hangs on some VIA CPUs. */
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400552 for (i = 0; i < len; i++)
553 BUG_ON(((char *)addr)[i] != ((char *)opcode)[i]);
Masami Hiramatsu7cf49422009-03-09 12:40:40 -0400554 local_irq_restore(flags);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500555 return addr;
Andi Kleen19d36cc2007-07-22 11:12:31 +0200556}