blob: 3a4bf35c179b7e54b8d1902d22d734cdc4cc4b89 [file] [log] [blame]
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -08001#include <linux/module.h>
Al Virof6a57032006-10-18 01:47:25 -04002#include <linux/sched.h>
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +02003#include <linux/mutex.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -08004#include <linux/list.h>
Jan Beulich8b5a10f2009-08-19 08:40:48 +01005#include <linux/stringify.h>
Andi Kleen19d36cc2007-07-22 11:12:31 +02006#include <linux/kprobes.h>
7#include <linux/mm.h>
8#include <linux/vmalloc.h>
Masami Hiramatsu3945dab2009-03-06 10:37:22 -05009#include <linux/memory.h>
Masami Hiramatsu3d55cc82010-02-25 08:34:38 -050010#include <linux/stop_machine.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -080011#include <asm/alternative.h>
12#include <asm/sections.h>
Andi Kleen19d36cc2007-07-22 11:12:31 +020013#include <asm/pgtable.h>
Andi Kleen8f4e9562007-07-22 11:12:32 +020014#include <asm/mce.h>
15#include <asm/nmi.h>
Dave Jonesb0979762007-10-14 22:57:45 +020016#include <asm/vsyscall.h>
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -050017#include <asm/cacheflush.h>
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -050018#include <asm/tlbflush.h>
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -050019#include <asm/io.h>
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -050020#include <asm/fixmap.h>
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -080021
/* Size in bytes of the on-stack buffers in which patches are assembled. */
#define MAX_PATCH_LEN	(255 - 1)
23
#ifndef CONFIG_HOTPLUG_CPU
/* Without CPU hotplug the SMP lock prefixes are always patched just once. */
#define smp_alt_once 1
#else
/*
 * Non-zero when the SMP lock prefixes are patched only once, at boot.
 * Set by the "smp-alt-boot" parameter below, and by
 * alternative_instructions() when fewer than two CPUs are possible.
 */
static int smp_alt_once;

/* Handler for the "smp-alt-boot" boot parameter; @str is not examined. */
static int __init bootonly(char *str)
{
	smp_alt_once = 1;
	return 1;
}
__setup("smp-alt-boot", bootonly);
#endif
36
Jan Beulich8b5a10f2009-08-19 08:40:48 +010037static int __initdata_or_module debug_alternative;
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020038
Gerd Hoffmannd167a512006-06-26 13:56:16 +020039static int __init debug_alt(char *str)
40{
41 debug_alternative = 1;
42 return 1;
43}
Gerd Hoffmannd167a512006-06-26 13:56:16 +020044__setup("debug-alternative", debug_alt);
45
Jan Beulich09488162007-07-21 17:10:25 +020046static int noreplace_smp;
47
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020048static int __init setup_noreplace_smp(char *str)
49{
50 noreplace_smp = 1;
51 return 1;
52}
53__setup("noreplace-smp", setup_noreplace_smp);
54
#ifdef CONFIG_PARAVIRT
/* When non-zero, apply_paravirt() returns without patching anything. */
static int __initdata_or_module noreplace_paravirt;

/* Handler for the "noreplace-paravirt" boot parameter; @str is not examined. */
static int __init setup_noreplace_paravirt(char *str)
{
	noreplace_paravirt = 1;

	return 1;
}
__setup("noreplace-paravirt", setup_noreplace_paravirt);
#endif
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +020065
/*
 * Print a KERN_DEBUG message, but only when debug_alternative is set.
 *
 * The body is wrapped in do { } while (0) so that the macro behaves as a
 * single statement: a bare "if" here would capture the "else" of a caller's
 * surrounding if/else.  "##args" drops the trailing comma when the format
 * string is the only argument.
 */
#define DPRINTK(fmt, args...)					\
	do {							\
		if (debug_alternative)				\
			printk(KERN_DEBUG fmt, ##args);		\
	} while (0)
68
#if defined(GENERIC_NOP1) && !defined(CONFIG_X86_64)
/*
 * The nops are defined as inline-assembly strings in the include files and
 * cannot easily be turned into C strings, so they are emitted with a
 * top-level asm statement, back to back, starting at the label intelnops.
 */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nintelnops: "
	GENERIC_NOP1 GENERIC_NOP2 GENERIC_NOP3 GENERIC_NOP4
	GENERIC_NOP5 GENERIC_NOP6 GENERIC_NOP7 GENERIC_NOP8
	"\t.previous");
extern const unsigned char intelnops[];

/*
 * intel_nops[n] points at the n-byte nop, which starts right after all the
 * shorter ones (offset 1 + 2 + ... + (n - 1)).  Slot 0 is unused.
 */
static const unsigned char *const __initconst_or_module
intel_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = intelnops,
	[2] = intelnops + 1,
	[3] = intelnops + 1 + 2,
	[4] = intelnops + 1 + 2 + 3,
	[5] = intelnops + 1 + 2 + 3 + 4,
	[6] = intelnops + 1 + 2 + 3 + 4 + 5,
	[7] = intelnops + 1 + 2 + 3 + 4 + 5 + 6,
	[8] = intelnops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
};
#endif
91
#ifdef K8_NOP1
/* The K8 nops, emitted back to back starting at the label k8nops. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk8nops: "
	K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4
	K8_NOP5 K8_NOP6 K8_NOP7 K8_NOP8
	"\t.previous");
extern const unsigned char k8nops[];

/*
 * k8_nops[n] points at the n-byte nop, which starts right after all the
 * shorter ones (offset 1 + 2 + ... + (n - 1)).  Slot 0 is unused.
 */
static const unsigned char *const __initconst_or_module
k8_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = k8nops,
	[2] = k8nops + 1,
	[3] = k8nops + 1 + 2,
	[4] = k8nops + 1 + 2 + 3,
	[5] = k8nops + 1 + 2 + 3 + 4,
	[6] = k8nops + 1 + 2 + 3 + 4 + 5,
	[7] = k8nops + 1 + 2 + 3 + 4 + 5 + 6,
	[8] = k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
};
#endif
111
#if defined(K7_NOP1) && !defined(CONFIG_X86_64)
/* The K7 nops, emitted back to back starting at the label k7nops. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk7nops: "
	K7_NOP1 K7_NOP2 K7_NOP3 K7_NOP4
	K7_NOP5 K7_NOP6 K7_NOP7 K7_NOP8
	"\t.previous");
extern const unsigned char k7nops[];

/*
 * k7_nops[n] points at the n-byte nop, which starts right after all the
 * shorter ones (offset 1 + 2 + ... + (n - 1)).  Slot 0 is unused.
 */
static const unsigned char *const __initconst_or_module
k7_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = k7nops,
	[2] = k7nops + 1,
	[3] = k7nops + 1 + 2,
	[4] = k7nops + 1 + 2 + 3,
	[5] = k7nops + 1 + 2 + 3 + 4,
	[6] = k7nops + 1 + 2 + 3 + 4 + 5,
	[7] = k7nops + 1 + 2 + 3 + 4 + 5 + 6,
	[8] = k7nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
};
#endif
131
#ifdef P6_NOP1
/* The P6 nops, emitted back to back starting at the label p6nops. */
asm("\t" __stringify(__INITRODATA_OR_MODULE) "\np6nops: "
	P6_NOP1 P6_NOP2 P6_NOP3 P6_NOP4
	P6_NOP5 P6_NOP6 P6_NOP7 P6_NOP8
	"\t.previous");
extern const unsigned char p6nops[];

/*
 * p6_nops[n] points at the n-byte nop, which starts right after all the
 * shorter ones (offset 1 + 2 + ... + (n - 1)).  Slot 0 is unused.
 */
static const unsigned char *const __initconst_or_module
p6_nops[ASM_NOP_MAX+1] = {
	[0] = NULL,
	[1] = p6nops,
	[2] = p6nops + 1,
	[3] = p6nops + 1 + 2,
	[4] = p6nops + 1 + 2 + 3,
	[5] = p6nops + 1 + 2 + 3 + 4,
	[6] = p6nops + 1 + 2 + 3 + 4 + 5,
	[7] = p6nops + 1 + 2 + 3 + 4 + 5 + 6,
	[8] = p6nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
};
#endif
151
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200152#ifdef CONFIG_X86_64
153
154extern char __vsyscall_0;
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100155static const unsigned char *const *__init_or_module find_nop_table(void)
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200156{
H. Peter Anvinf31d7312008-08-18 17:50:33 -0700157 if (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL &&
158 boot_cpu_has(X86_FEATURE_NOPL))
159 return p6_nops;
160 else
161 return k8_nops;
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200162}
163
164#else /* CONFIG_X86_64 */
165
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100166static const unsigned char *const *__init_or_module find_nop_table(void)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800167{
H. Peter Anvinf31d7312008-08-18 17:50:33 -0700168 if (boot_cpu_has(X86_FEATURE_K8))
169 return k8_nops;
170 else if (boot_cpu_has(X86_FEATURE_K7))
171 return k7_nops;
172 else if (boot_cpu_has(X86_FEATURE_NOPL))
173 return p6_nops;
174 else
175 return intel_nops;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800176}
177
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200178#endif /* CONFIG_X86_64 */
179
Andi Kleenab144f52007-08-10 22:31:03 +0200180/* Use this to add nops to a buffer, then text_poke the whole buffer. */
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100181static void __init_or_module add_nops(void *insns, unsigned int len)
Rusty Russell139ec7c2006-12-07 02:14:08 +0100182{
Jan Beulich121d7bf2007-10-17 18:04:37 +0200183 const unsigned char *const *noptable = find_nop_table();
Rusty Russell139ec7c2006-12-07 02:14:08 +0100184
185 while (len > 0) {
186 unsigned int noplen = len;
187 if (noplen > ASM_NOP_MAX)
188 noplen = ASM_NOP_MAX;
Andi Kleenab144f52007-08-10 22:31:03 +0200189 memcpy(insns, noptable[noplen], noplen);
Rusty Russell139ec7c2006-12-07 02:14:08 +0100190 insns += noplen;
191 len -= noplen;
192 }
193}
194
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200195extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200196extern u8 *__smp_locks[], *__smp_locks_end[];
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100197static void *text_poke_early(void *addr, const void *opcode, size_t len);
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200198
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800199/* Replace instructions with better alternatives for this CPU type.
200 This runs before SMP is initialized to avoid SMP problems with
201 self modifying code. This implies that assymetric systems where
202 APs have less capabilities than the boot processor are not handled.
203 Tough. Make sure you disable such features by hand. */
204
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100205void __init_or_module apply_alternatives(struct alt_instr *start,
206 struct alt_instr *end)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800207{
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800208 struct alt_instr *a;
Jan Beulich1b1d9252009-12-18 16:12:56 +0000209 u8 insnbuf[MAX_PATCH_LEN];
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800210
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800211 DPRINTK("%s: alt table %p -> %p\n", __func__, start, end);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800212 for (a = start; a < end; a++) {
Andi Kleenab144f52007-08-10 22:31:03 +0200213 u8 *instr = a->instr;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800214 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleenab144f52007-08-10 22:31:03 +0200215 BUG_ON(a->instrlen > sizeof(insnbuf));
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800216 if (!boot_cpu_has(a->cpuid))
217 continue;
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200218#ifdef CONFIG_X86_64
219 /* vsyscall code is not mapped yet. resolve it manually. */
220 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END) {
221 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
222 DPRINTK("%s: vsyscall fixup: %p => %p\n",
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800223 __func__, a->instr, instr);
Gerd Hoffmannd167a512006-06-26 13:56:16 +0200224 }
225#endif
Andi Kleenab144f52007-08-10 22:31:03 +0200226 memcpy(insnbuf, a->replacement, a->replacementlen);
Jan Beulich1b1d9252009-12-18 16:12:56 +0000227 if (*insnbuf == 0xe8 && a->replacementlen == 5)
228 *(s32 *)(insnbuf + 1) += a->replacement - a->instr;
Andi Kleenab144f52007-08-10 22:31:03 +0200229 add_nops(insnbuf + a->replacementlen,
230 a->instrlen - a->replacementlen);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500231 text_poke_early(instr, insnbuf, a->instrlen);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800232 }
233}
234
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700235#ifdef CONFIG_SMP
236
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800237static void alternatives_smp_lock(u8 **start, u8 **end, u8 *text, u8 *text_end)
238{
239 u8 **ptr;
240
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500241 mutex_lock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800242 for (ptr = start; ptr < end; ptr++) {
243 if (*ptr < text)
244 continue;
245 if (*ptr > text_end)
246 continue;
Mathieu Desnoyersf88f07e2008-08-14 16:58:15 -0400247 /* turn DS segment override prefix into lock prefix */
248 text_poke(*ptr, ((unsigned char []){0xf0}), 1);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800249 };
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500250 mutex_unlock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800251}
252
253static void alternatives_smp_unlock(u8 **start, u8 **end, u8 *text, u8 *text_end)
254{
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800255 u8 **ptr;
256
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200257 if (noreplace_smp)
258 return;
259
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500260 mutex_lock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800261 for (ptr = start; ptr < end; ptr++) {
262 if (*ptr < text)
263 continue;
264 if (*ptr > text_end)
265 continue;
Mathieu Desnoyersf88f07e2008-08-14 16:58:15 -0400266 /* turn lock prefix into DS segment override prefix */
267 text_poke(*ptr, ((unsigned char []){0x3E}), 1);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800268 };
Masami Hiramatsu3945dab2009-03-06 10:37:22 -0500269 mutex_unlock(&text_mutex);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800270}
271
272struct smp_alt_module {
273 /* what is this ??? */
274 struct module *mod;
275 char *name;
276
277 /* ptrs to lock prefixes */
278 u8 **locks;
279 u8 **locks_end;
280
281 /* .text segment, needed to avoid patching init code ;) */
282 u8 *text;
283 u8 *text_end;
284
285 struct list_head next;
286};
287static LIST_HEAD(smp_alt_modules);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200288static DEFINE_MUTEX(smp_alt);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100289static int smp_mode = 1; /* protected by smp_alt */
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800290
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100291void __init_or_module alternatives_smp_module_add(struct module *mod,
292 char *name,
293 void *locks, void *locks_end,
294 void *text, void *text_end)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800295{
296 struct smp_alt_module *smp;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800297
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200298 if (noreplace_smp)
299 return;
300
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800301 if (smp_alt_once) {
302 if (boot_cpu_has(X86_FEATURE_UP))
303 alternatives_smp_unlock(locks, locks_end,
304 text, text_end);
305 return;
306 }
307
308 smp = kzalloc(sizeof(*smp), GFP_KERNEL);
309 if (NULL == smp)
310 return; /* we'll run the (safe but slow) SMP code then ... */
311
312 smp->mod = mod;
313 smp->name = name;
314 smp->locks = locks;
315 smp->locks_end = locks_end;
316 smp->text = text;
317 smp->text_end = text_end;
318 DPRINTK("%s: locks %p -> %p, text %p -> %p, name %s\n",
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800319 __func__, smp->locks, smp->locks_end,
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800320 smp->text, smp->text_end, smp->name);
321
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200322 mutex_lock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800323 list_add_tail(&smp->next, &smp_alt_modules);
324 if (boot_cpu_has(X86_FEATURE_UP))
325 alternatives_smp_unlock(smp->locks, smp->locks_end,
326 smp->text, smp->text_end);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200327 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800328}
329
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100330void __init_or_module alternatives_smp_module_del(struct module *mod)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800331{
332 struct smp_alt_module *item;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800333
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200334 if (smp_alt_once || noreplace_smp)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800335 return;
336
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200337 mutex_lock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800338 list_for_each_entry(item, &smp_alt_modules, next) {
339 if (mod != item->mod)
340 continue;
341 list_del(&item->next);
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200342 mutex_unlock(&smp_alt);
Harvey Harrison77bf90e2008-03-03 11:37:23 -0800343 DPRINTK("%s: %s\n", __func__, item->name);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800344 kfree(item);
345 return;
346 }
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200347 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800348}
349
350void alternatives_smp_switch(int smp)
351{
352 struct smp_alt_module *mod;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800353
Ingo Molnar3047e992006-07-03 00:24:57 -0700354#ifdef CONFIG_LOCKDEP
355 /*
Ingo Molnar17abecf2008-01-30 13:33:24 +0100356 * Older binutils section handling bug prevented
357 * alternatives-replacement from working reliably.
358 *
359 * If this still occurs then you should see a hang
360 * or crash shortly after this line:
Ingo Molnar3047e992006-07-03 00:24:57 -0700361 */
Ingo Molnar17abecf2008-01-30 13:33:24 +0100362 printk("lockdep: fixing up alternatives.\n");
Ingo Molnar3047e992006-07-03 00:24:57 -0700363#endif
364
Jeremy Fitzhardingeb7fb4af2007-05-02 19:27:13 +0200365 if (noreplace_smp || smp_alt_once)
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800366 return;
367 BUG_ON(!smp && (num_online_cpus() > 1));
368
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200369 mutex_lock(&smp_alt);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100370
371 /*
372 * Avoid unnecessary switches because it forces JIT based VMs to
373 * throw away all cached translations, which can be quite costly.
374 */
375 if (smp == smp_mode) {
376 /* nothing */
377 } else if (smp) {
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800378 printk(KERN_INFO "SMP alternatives: switching to SMP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100379 clear_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
380 clear_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800381 list_for_each_entry(mod, &smp_alt_modules, next)
382 alternatives_smp_lock(mod->locks, mod->locks_end,
383 mod->text, mod->text_end);
384 } else {
385 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100386 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
387 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800388 list_for_each_entry(mod, &smp_alt_modules, next)
389 alternatives_smp_unlock(mod->locks, mod->locks_end,
390 mod->text, mod->text_end);
391 }
Andi Kleenca74a6f2008-01-30 13:33:17 +0100392 smp_mode = smp;
Pekka Paalanen2f1dafe2008-05-12 21:21:01 +0200393 mutex_unlock(&smp_alt);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800394}
395
Masami Hiramatsu2cfa1972010-02-02 16:49:11 -0500396/* Return 1 if the address range is reserved for smp-alternatives */
397int alternatives_text_reserved(void *start, void *end)
398{
399 struct smp_alt_module *mod;
400 u8 **ptr;
Masami Hiramatsu076dc4a2010-02-05 12:16:47 -0500401 u8 *text_start = start;
402 u8 *text_end = end;
Masami Hiramatsu2cfa1972010-02-02 16:49:11 -0500403
404 list_for_each_entry(mod, &smp_alt_modules, next) {
Masami Hiramatsu076dc4a2010-02-05 12:16:47 -0500405 if (mod->text > text_end || mod->text_end < text_start)
Masami Hiramatsu2cfa1972010-02-02 16:49:11 -0500406 continue;
407 for (ptr = mod->locks; ptr < mod->locks_end; ptr++)
Masami Hiramatsu076dc4a2010-02-05 12:16:47 -0500408 if (text_start <= *ptr && text_end >= *ptr)
Masami Hiramatsu2cfa1972010-02-02 16:49:11 -0500409 return 1;
410 }
411
412 return 0;
413}
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700414#endif
415
#ifdef CONFIG_PARAVIRT
/*
 * Patch every paravirt site in [@start, @end).  For each site the original
 * bytes are copied into a scratch buffer, pv_init_ops.patch() rewrites the
 * buffer and reports how many bytes it used, the rest is padded with nops,
 * and the buffer is written back over the site.  Does nothing when
 * noreplace_paravirt is set.
 */
void __init_or_module apply_paravirt(struct paravirt_patch_site *start,
				     struct paravirt_patch_site *end)
{
	struct paravirt_patch_site *site;
	char insnbuf[MAX_PATCH_LEN];

	if (noreplace_paravirt)
		return;

	for (site = start; site < end; site++) {
		unsigned int patched;

		BUG_ON(site->len > MAX_PATCH_LEN);
		/* prep the buffer with the original instructions */
		memcpy(insnbuf, site->instr, site->len);
		patched = pv_init_ops.patch(site->instrtype, site->clobbers,
					    insnbuf,
					    (unsigned long)site->instr,
					    site->len);

		/* The patcher must not use more room than the site has. */
		BUG_ON(patched > site->len);

		/* Pad the rest with nops */
		add_nops(insnbuf + patched, site->len - patched);
		text_poke_early(site->instr, insnbuf, site->len);
	}
}
extern struct paravirt_patch_site __start_parainstructions[];
extern struct paravirt_patch_site __stop_parainstructions[];
#endif	/* CONFIG_PARAVIRT */
445
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800446void __init alternative_instructions(void)
447{
Andi Kleen8f4e9562007-07-22 11:12:32 +0200448 /* The patching is not fully atomic, so try to avoid local interruptions
449 that might execute the to be patched code.
450 Other CPUs are not running. */
451 stop_nmi();
Andi Kleen123aa762009-02-12 13:39:27 +0100452
453 /*
454 * Don't stop machine check exceptions while patching.
455 * MCEs only happen when something got corrupted and in this
456 * case we must do something about the corruption.
457 * Ignoring it is worse than a unlikely patching race.
458 * Also machine checks tend to be broadcast and if one CPU
459 * goes into machine check the others follow quickly, so we don't
460 * expect a machine check to cause undue problems during to code
461 * patching.
462 */
Andi Kleen8f4e9562007-07-22 11:12:32 +0200463
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800464 apply_alternatives(__alt_instructions, __alt_instructions_end);
465
466 /* switch to patch-once-at-boottime-only mode and free the
467 * tables in case we know the number of CPUs will never ever
468 * change */
469#ifdef CONFIG_HOTPLUG_CPU
470 if (num_possible_cpus() < 2)
471 smp_alt_once = 1;
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800472#endif
473
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700474#ifdef CONFIG_SMP
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800475 if (smp_alt_once) {
476 if (1 == num_possible_cpus()) {
477 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
Jeremy Fitzhardinge53756d32008-01-30 13:30:55 +0100478 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
479 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
480
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800481 alternatives_smp_unlock(__smp_locks, __smp_locks_end,
482 _text, _etext);
483 }
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800484 } else {
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800485 alternatives_smp_module_add(NULL, "core kernel",
486 __smp_locks, __smp_locks_end,
487 _text, _etext);
Andi Kleenca74a6f2008-01-30 13:33:17 +0100488
489 /* Only switch to UP mode if we don't immediately boot others */
Thomas Gleixner649c6652008-10-05 16:52:24 +0200490 if (num_present_cpus() == 1 || setup_max_cpus <= 1)
Andi Kleenca74a6f2008-01-30 13:33:17 +0100491 alternatives_smp_switch(0);
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800492 }
Gerd Hoffmann8ec4d412006-07-01 04:36:18 -0700493#endif
Jeremy Fitzhardinge441d40d2007-05-02 19:27:16 +0200494 apply_paravirt(__parainstructions, __parainstructions_end);
Andi Kleen8f4e9562007-07-22 11:12:32 +0200495
Fengguang Wuf68fd5f2007-10-17 18:04:34 +0200496 if (smp_alt_once)
497 free_init_pages("SMP alternatives",
498 (unsigned long)__smp_locks,
499 (unsigned long)__smp_locks_end);
500
Andi Kleen8f4e9562007-07-22 11:12:32 +0200501 restart_nmi();
Gerd Hoffmann9a0b5812006-03-23 02:59:32 -0800502}
Andi Kleen19d36cc2007-07-22 11:12:31 +0200503
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500504/**
505 * text_poke_early - Update instructions on a live kernel at boot time
506 * @addr: address to modify
507 * @opcode: source of the copy
508 * @len: length to copy
509 *
Andi Kleen19d36cc2007-07-22 11:12:31 +0200510 * When you use this code to patch more than one byte of an instruction
511 * you need to make sure that other CPUs cannot execute this code in parallel.
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500512 * Also no thread must be currently preempted in the middle of these
513 * instructions. And on the local CPU you need to be protected again NMI or MCE
514 * handlers seeing an inconsistent instruction while you patch.
Andi Kleen19d36cc2007-07-22 11:12:31 +0200515 */
Jan Beulich8b5a10f2009-08-19 08:40:48 +0100516static void *__init_or_module text_poke_early(void *addr, const void *opcode,
517 size_t len)
Andi Kleen19d36cc2007-07-22 11:12:31 +0200518{
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500519 unsigned long flags;
520 local_irq_save(flags);
Andi Kleen19d36cc2007-07-22 11:12:31 +0200521 memcpy(addr, opcode, len);
522 sync_core();
Ben Hutchings5367b682009-09-10 02:53:50 +0100523 local_irq_restore(flags);
Andi Kleena534b672007-09-06 16:59:52 +0200524 /* Could also do a CLFLUSH here to speed up CPU recovery; but
525 that causes hangs on some VIA CPUs. */
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500526 return addr;
527}
528
529/**
530 * text_poke - Update instructions on a live kernel
531 * @addr: address to modify
532 * @opcode: source of the copy
533 * @len: length to copy
534 *
535 * Only atomic text poke/set should be allowed when not doing early patching.
536 * It means the size must be writable atomically and the address must be aligned
537 * in a way that permits an atomic write. It also makes sure we fit on a single
538 * page.
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500539 *
540 * Note: Must be called under text_mutex.
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500541 */
542void *__kprobes text_poke(void *addr, const void *opcode, size_t len)
543{
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500544 unsigned long flags;
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500545 char *vaddr;
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400546 struct page *pages[2];
547 int i;
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500548
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400549 if (!core_kernel_text((unsigned long)addr)) {
550 pages[0] = vmalloc_to_page(addr);
551 pages[1] = vmalloc_to_page(addr + PAGE_SIZE);
Mathieu Desnoyers15a601e2008-03-12 11:54:16 -0400552 } else {
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400553 pages[0] = virt_to_page(addr);
Ingo Molnar00c6b2d2008-04-25 17:07:03 +0200554 WARN_ON(!PageReserved(pages[0]));
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400555 pages[1] = virt_to_page(addr + PAGE_SIZE);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500556 }
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400557 BUG_ON(!pages[0]);
Masami Hiramatsu7cf49422009-03-09 12:40:40 -0400558 local_irq_save(flags);
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500559 set_fixmap(FIX_TEXT_POKE0, page_to_phys(pages[0]));
560 if (pages[1])
561 set_fixmap(FIX_TEXT_POKE1, page_to_phys(pages[1]));
562 vaddr = (char *)fix_to_virt(FIX_TEXT_POKE0);
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400563 memcpy(&vaddr[(unsigned long)addr & ~PAGE_MASK], opcode, len);
Masami Hiramatsu78ff7fa2009-03-06 10:37:54 -0500564 clear_fixmap(FIX_TEXT_POKE0);
565 if (pages[1])
566 clear_fixmap(FIX_TEXT_POKE1);
567 local_flush_tlb();
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500568 sync_core();
569 /* Could also do a CLFLUSH here to speed up CPU recovery; but
570 that causes hangs on some VIA CPUs. */
Mathieu Desnoyersb7b66ba2008-04-24 11:03:33 -0400571 for (i = 0; i < len; i++)
572 BUG_ON(((char *)addr)[i] != ((char *)opcode)[i]);
Masami Hiramatsu7cf49422009-03-09 12:40:40 -0400573 local_irq_restore(flags);
Mathieu Desnoyerse587cad2008-03-06 08:48:49 -0500574 return addr;
Andi Kleen19d36cc2007-07-22 11:12:31 +0200575}
Masami Hiramatsu3d55cc82010-02-25 08:34:38 -0500576
577/*
578 * Cross-modifying kernel text with stop_machine().
579 * This code originally comes from immediate value.
580 */
581static atomic_t stop_machine_first;
582static int wrote_text;
583
584struct text_poke_params {
585 void *addr;
586 const void *opcode;
587 size_t len;
588};
589
590static int __kprobes stop_machine_text_poke(void *data)
591{
592 struct text_poke_params *tpp = data;
593
594 if (atomic_dec_and_test(&stop_machine_first)) {
595 text_poke(tpp->addr, tpp->opcode, tpp->len);
596 smp_wmb(); /* Make sure other cpus see that this has run */
597 wrote_text = 1;
598 } else {
599 while (!wrote_text)
Masami Hiramatsue5a11012010-03-03 22:38:50 -0500600 cpu_relax();
601 smp_mb(); /* Load wrote_text before following execution */
Masami Hiramatsu3d55cc82010-02-25 08:34:38 -0500602 }
603
604 flush_icache_range((unsigned long)tpp->addr,
605 (unsigned long)tpp->addr + tpp->len);
606 return 0;
607}
608
609/**
610 * text_poke_smp - Update instructions on a live kernel on SMP
611 * @addr: address to modify
612 * @opcode: source of the copy
613 * @len: length to copy
614 *
615 * Modify multi-byte instruction by using stop_machine() on SMP. This allows
616 * user to poke/set multi-byte text on SMP. Only non-NMI/MCE code modifying
617 * should be allowed, since stop_machine() does _not_ protect code against
618 * NMI and MCE.
619 *
620 * Note: Must be called under get_online_cpus() and text_mutex.
621 */
622void *__kprobes text_poke_smp(void *addr, const void *opcode, size_t len)
623{
624 struct text_poke_params tpp;
625
626 tpp.addr = addr;
627 tpp.opcode = opcode;
628 tpp.len = len;
629 atomic_set(&stop_machine_first, 1);
630 wrote_text = 0;
631 stop_machine(stop_machine_text_poke, (void *)&tpp, NULL);
632 return addr;
633}
634