perf probe: Correct probe syntax on command line help
[deliverable/linux.git] / arch / x86 / kernel / alternative.c
CommitLineData
9a0b5817 1#include <linux/module.h>
f6a57033 2#include <linux/sched.h>
2f1dafe5 3#include <linux/mutex.h>
9a0b5817 4#include <linux/list.h>
8b5a10fc 5#include <linux/stringify.h>
19d36ccd
AK
6#include <linux/kprobes.h>
7#include <linux/mm.h>
8#include <linux/vmalloc.h>
3945dab4 9#include <linux/memory.h>
3d55cc8a 10#include <linux/stop_machine.h>
9a0b5817
GH
11#include <asm/alternative.h>
12#include <asm/sections.h>
19d36ccd 13#include <asm/pgtable.h>
8f4e956b
AK
14#include <asm/mce.h>
15#include <asm/nmi.h>
b097976e 16#include <asm/vsyscall.h>
e587cadd 17#include <asm/cacheflush.h>
78ff7fae 18#include <asm/tlbflush.h>
e587cadd 19#include <asm/io.h>
78ff7fae 20#include <asm/fixmap.h>
9a0b5817 21
ab144f5e
AK
22#define MAX_PATCH_LEN (255-1)
23
09488165
JB
24#ifdef CONFIG_HOTPLUG_CPU
25static int smp_alt_once;
9a0b5817 26
d167a518
GH
27static int __init bootonly(char *str)
28{
29 smp_alt_once = 1;
30 return 1;
31}
b7fb4af0 32__setup("smp-alt-boot", bootonly);
09488165
JB
33#else
34#define smp_alt_once 1
35#endif
36
8b5a10fc 37static int __initdata_or_module debug_alternative;
b7fb4af0 38
d167a518
GH
39static int __init debug_alt(char *str)
40{
41 debug_alternative = 1;
42 return 1;
43}
d167a518
GH
44__setup("debug-alternative", debug_alt);
45
09488165
JB
46static int noreplace_smp;
47
b7fb4af0
JF
48static int __init setup_noreplace_smp(char *str)
49{
50 noreplace_smp = 1;
51 return 1;
52}
53__setup("noreplace-smp", setup_noreplace_smp);
54
959b4fdf 55#ifdef CONFIG_PARAVIRT
8b5a10fc 56static int __initdata_or_module noreplace_paravirt = 0;
959b4fdf
JF
57
58static int __init setup_noreplace_paravirt(char *str)
59{
60 noreplace_paravirt = 1;
61 return 1;
62}
63__setup("noreplace-paravirt", setup_noreplace_paravirt);
64#endif
b7fb4af0 65
d167a518
GH
66#define DPRINTK(fmt, args...) if (debug_alternative) \
67 printk(KERN_DEBUG fmt, args)
68
8b5a10fc 69#if defined(GENERIC_NOP1) && !defined(CONFIG_X86_64)
9a0b5817
GH
70/* Use inline assembly to define this because the nops are defined
71 as inline assembly strings in the include files and we cannot
72 get them easily into strings. */
8b5a10fc 73asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nintelnops: "
9a0b5817 74 GENERIC_NOP1 GENERIC_NOP2 GENERIC_NOP3 GENERIC_NOP4 GENERIC_NOP5 GENERIC_NOP6
f4be31ec
SR
75 GENERIC_NOP7 GENERIC_NOP8
76 "\t.previous");
121d7bf5 77extern const unsigned char intelnops[];
8b5a10fc
JB
78static const unsigned char *const __initconst_or_module
79intel_nops[ASM_NOP_MAX+1] = {
9a0b5817
GH
80 NULL,
81 intelnops,
82 intelnops + 1,
83 intelnops + 1 + 2,
84 intelnops + 1 + 2 + 3,
85 intelnops + 1 + 2 + 3 + 4,
86 intelnops + 1 + 2 + 3 + 4 + 5,
87 intelnops + 1 + 2 + 3 + 4 + 5 + 6,
88 intelnops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
89};
d167a518
GH
90#endif
91
92#ifdef K8_NOP1
8b5a10fc 93asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk8nops: "
d167a518 94 K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
f4be31ec
SR
95 K8_NOP7 K8_NOP8
96 "\t.previous");
121d7bf5 97extern const unsigned char k8nops[];
8b5a10fc
JB
98static const unsigned char *const __initconst_or_module
99k8_nops[ASM_NOP_MAX+1] = {
9a0b5817
GH
100 NULL,
101 k8nops,
102 k8nops + 1,
103 k8nops + 1 + 2,
104 k8nops + 1 + 2 + 3,
105 k8nops + 1 + 2 + 3 + 4,
106 k8nops + 1 + 2 + 3 + 4 + 5,
107 k8nops + 1 + 2 + 3 + 4 + 5 + 6,
108 k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
109};
d167a518
GH
110#endif
111
8b5a10fc
JB
112#if defined(K7_NOP1) && !defined(CONFIG_X86_64)
113asm("\t" __stringify(__INITRODATA_OR_MODULE) "\nk7nops: "
d167a518 114 K7_NOP1 K7_NOP2 K7_NOP3 K7_NOP4 K7_NOP5 K7_NOP6
f4be31ec
SR
115 K7_NOP7 K7_NOP8
116 "\t.previous");
121d7bf5 117extern const unsigned char k7nops[];
8b5a10fc
JB
118static const unsigned char *const __initconst_or_module
119k7_nops[ASM_NOP_MAX+1] = {
9a0b5817
GH
120 NULL,
121 k7nops,
122 k7nops + 1,
123 k7nops + 1 + 2,
124 k7nops + 1 + 2 + 3,
125 k7nops + 1 + 2 + 3 + 4,
126 k7nops + 1 + 2 + 3 + 4 + 5,
127 k7nops + 1 + 2 + 3 + 4 + 5 + 6,
128 k7nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
129};
d167a518
GH
130#endif
131
32c464f5 132#ifdef P6_NOP1
8b5a10fc 133asm("\t" __stringify(__INITRODATA_OR_MODULE) "\np6nops: "
32c464f5 134 P6_NOP1 P6_NOP2 P6_NOP3 P6_NOP4 P6_NOP5 P6_NOP6
f4be31ec
SR
135 P6_NOP7 P6_NOP8
136 "\t.previous");
32c464f5 137extern const unsigned char p6nops[];
8b5a10fc
JB
138static const unsigned char *const __initconst_or_module
139p6_nops[ASM_NOP_MAX+1] = {
32c464f5
JB
140 NULL,
141 p6nops,
142 p6nops + 1,
143 p6nops + 1 + 2,
144 p6nops + 1 + 2 + 3,
145 p6nops + 1 + 2 + 3 + 4,
146 p6nops + 1 + 2 + 3 + 4 + 5,
147 p6nops + 1 + 2 + 3 + 4 + 5 + 6,
148 p6nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
149};
150#endif
151
d167a518
GH
152#ifdef CONFIG_X86_64
153
154extern char __vsyscall_0;
8b5a10fc 155static const unsigned char *const *__init_or_module find_nop_table(void)
d167a518 156{
f31d731e
PA
157 if (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL &&
158 boot_cpu_has(X86_FEATURE_NOPL))
159 return p6_nops;
160 else
161 return k8_nops;
d167a518
GH
162}
163
164#else /* CONFIG_X86_64 */
165
8b5a10fc 166static const unsigned char *const *__init_or_module find_nop_table(void)
9a0b5817 167{
f31d731e
PA
168 if (boot_cpu_has(X86_FEATURE_K8))
169 return k8_nops;
170 else if (boot_cpu_has(X86_FEATURE_K7))
171 return k7_nops;
172 else if (boot_cpu_has(X86_FEATURE_NOPL))
173 return p6_nops;
174 else
175 return intel_nops;
9a0b5817
GH
176}
177
d167a518
GH
178#endif /* CONFIG_X86_64 */
179
ab144f5e 180/* Use this to add nops to a buffer, then text_poke the whole buffer. */
8b5a10fc 181static void __init_or_module add_nops(void *insns, unsigned int len)
139ec7c4 182{
121d7bf5 183 const unsigned char *const *noptable = find_nop_table();
139ec7c4
RR
184
185 while (len > 0) {
186 unsigned int noplen = len;
187 if (noplen > ASM_NOP_MAX)
188 noplen = ASM_NOP_MAX;
ab144f5e 189 memcpy(insns, noptable[noplen], noplen);
139ec7c4
RR
190 insns += noplen;
191 len -= noplen;
192 }
193}
194
d167a518 195extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
d167a518 196extern u8 *__smp_locks[], *__smp_locks_end[];
8b5a10fc 197static void *text_poke_early(void *addr, const void *opcode, size_t len);
d167a518 198
9a0b5817
GH
199/* Replace instructions with better alternatives for this CPU type.
200 This runs before SMP is initialized to avoid SMP problems with
201 self modifying code. This implies that assymetric systems where
202 APs have less capabilities than the boot processor are not handled.
203 Tough. Make sure you disable such features by hand. */
204
8b5a10fc
JB
205void __init_or_module apply_alternatives(struct alt_instr *start,
206 struct alt_instr *end)
9a0b5817 207{
9a0b5817 208 struct alt_instr *a;
ab144f5e 209 char insnbuf[MAX_PATCH_LEN];
9a0b5817 210
77bf90ed 211 DPRINTK("%s: alt table %p -> %p\n", __func__, start, end);
9a0b5817 212 for (a = start; a < end; a++) {
ab144f5e 213 u8 *instr = a->instr;
9a0b5817 214 BUG_ON(a->replacementlen > a->instrlen);
ab144f5e 215 BUG_ON(a->instrlen > sizeof(insnbuf));
9a0b5817
GH
216 if (!boot_cpu_has(a->cpuid))
217 continue;
d167a518
GH
218#ifdef CONFIG_X86_64
219 /* vsyscall code is not mapped yet. resolve it manually. */
220 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END) {
221 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
222 DPRINTK("%s: vsyscall fixup: %p => %p\n",
77bf90ed 223 __func__, a->instr, instr);
d167a518
GH
224 }
225#endif
ab144f5e
AK
226 memcpy(insnbuf, a->replacement, a->replacementlen);
227 add_nops(insnbuf + a->replacementlen,
228 a->instrlen - a->replacementlen);
e587cadd 229 text_poke_early(instr, insnbuf, a->instrlen);
9a0b5817
GH
230 }
231}
232
8ec4d41f
GH
233#ifdef CONFIG_SMP
234
9a0b5817
GH
235static void alternatives_smp_lock(u8 **start, u8 **end, u8 *text, u8 *text_end)
236{
237 u8 **ptr;
238
3945dab4 239 mutex_lock(&text_mutex);
9a0b5817
GH
240 for (ptr = start; ptr < end; ptr++) {
241 if (*ptr < text)
242 continue;
243 if (*ptr > text_end)
244 continue;
f88f07e0
MD
245 /* turn DS segment override prefix into lock prefix */
246 text_poke(*ptr, ((unsigned char []){0xf0}), 1);
9a0b5817 247 };
3945dab4 248 mutex_unlock(&text_mutex);
9a0b5817
GH
249}
250
251static void alternatives_smp_unlock(u8 **start, u8 **end, u8 *text, u8 *text_end)
252{
9a0b5817
GH
253 u8 **ptr;
254
b7fb4af0
JF
255 if (noreplace_smp)
256 return;
257
3945dab4 258 mutex_lock(&text_mutex);
9a0b5817
GH
259 for (ptr = start; ptr < end; ptr++) {
260 if (*ptr < text)
261 continue;
262 if (*ptr > text_end)
263 continue;
f88f07e0
MD
264 /* turn lock prefix into DS segment override prefix */
265 text_poke(*ptr, ((unsigned char []){0x3E}), 1);
9a0b5817 266 };
3945dab4 267 mutex_unlock(&text_mutex);
9a0b5817
GH
268}
269
270struct smp_alt_module {
271 /* what is this ??? */
272 struct module *mod;
273 char *name;
274
275 /* ptrs to lock prefixes */
276 u8 **locks;
277 u8 **locks_end;
278
279 /* .text segment, needed to avoid patching init code ;) */
280 u8 *text;
281 u8 *text_end;
282
283 struct list_head next;
284};
285static LIST_HEAD(smp_alt_modules);
2f1dafe5 286static DEFINE_MUTEX(smp_alt);
ca74a6f8 287static int smp_mode = 1; /* protected by smp_alt */
9a0b5817 288
8b5a10fc
JB
289void __init_or_module alternatives_smp_module_add(struct module *mod,
290 char *name,
291 void *locks, void *locks_end,
292 void *text, void *text_end)
9a0b5817
GH
293{
294 struct smp_alt_module *smp;
9a0b5817 295
b7fb4af0
JF
296 if (noreplace_smp)
297 return;
298
9a0b5817
GH
299 if (smp_alt_once) {
300 if (boot_cpu_has(X86_FEATURE_UP))
301 alternatives_smp_unlock(locks, locks_end,
302 text, text_end);
303 return;
304 }
305
306 smp = kzalloc(sizeof(*smp), GFP_KERNEL);
307 if (NULL == smp)
308 return; /* we'll run the (safe but slow) SMP code then ... */
309
310 smp->mod = mod;
311 smp->name = name;
312 smp->locks = locks;
313 smp->locks_end = locks_end;
314 smp->text = text;
315 smp->text_end = text_end;
316 DPRINTK("%s: locks %p -> %p, text %p -> %p, name %s\n",
77bf90ed 317 __func__, smp->locks, smp->locks_end,
9a0b5817
GH
318 smp->text, smp->text_end, smp->name);
319
2f1dafe5 320 mutex_lock(&smp_alt);
9a0b5817
GH
321 list_add_tail(&smp->next, &smp_alt_modules);
322 if (boot_cpu_has(X86_FEATURE_UP))
323 alternatives_smp_unlock(smp->locks, smp->locks_end,
324 smp->text, smp->text_end);
2f1dafe5 325 mutex_unlock(&smp_alt);
9a0b5817
GH
326}
327
8b5a10fc 328void __init_or_module alternatives_smp_module_del(struct module *mod)
9a0b5817
GH
329{
330 struct smp_alt_module *item;
9a0b5817 331
b7fb4af0 332 if (smp_alt_once || noreplace_smp)
9a0b5817
GH
333 return;
334
2f1dafe5 335 mutex_lock(&smp_alt);
9a0b5817
GH
336 list_for_each_entry(item, &smp_alt_modules, next) {
337 if (mod != item->mod)
338 continue;
339 list_del(&item->next);
2f1dafe5 340 mutex_unlock(&smp_alt);
77bf90ed 341 DPRINTK("%s: %s\n", __func__, item->name);
9a0b5817
GH
342 kfree(item);
343 return;
344 }
2f1dafe5 345 mutex_unlock(&smp_alt);
9a0b5817
GH
346}
347
348void alternatives_smp_switch(int smp)
349{
350 struct smp_alt_module *mod;
9a0b5817 351
3047e99e
IM
352#ifdef CONFIG_LOCKDEP
353 /*
17abecfe
IM
354 * Older binutils section handling bug prevented
355 * alternatives-replacement from working reliably.
356 *
357 * If this still occurs then you should see a hang
358 * or crash shortly after this line:
3047e99e 359 */
17abecfe 360 printk("lockdep: fixing up alternatives.\n");
3047e99e
IM
361#endif
362
b7fb4af0 363 if (noreplace_smp || smp_alt_once)
9a0b5817
GH
364 return;
365 BUG_ON(!smp && (num_online_cpus() > 1));
366
2f1dafe5 367 mutex_lock(&smp_alt);
ca74a6f8
AK
368
369 /*
370 * Avoid unnecessary switches because it forces JIT based VMs to
371 * throw away all cached translations, which can be quite costly.
372 */
373 if (smp == smp_mode) {
374 /* nothing */
375 } else if (smp) {
9a0b5817 376 printk(KERN_INFO "SMP alternatives: switching to SMP code\n");
53756d37
JF
377 clear_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
378 clear_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
9a0b5817
GH
379 list_for_each_entry(mod, &smp_alt_modules, next)
380 alternatives_smp_lock(mod->locks, mod->locks_end,
381 mod->text, mod->text_end);
382 } else {
383 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
53756d37
JF
384 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
385 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
9a0b5817
GH
386 list_for_each_entry(mod, &smp_alt_modules, next)
387 alternatives_smp_unlock(mod->locks, mod->locks_end,
388 mod->text, mod->text_end);
389 }
ca74a6f8 390 smp_mode = smp;
2f1dafe5 391 mutex_unlock(&smp_alt);
9a0b5817
GH
392}
393
2cfa1978
MH
394/* Return 1 if the address range is reserved for smp-alternatives */
395int alternatives_text_reserved(void *start, void *end)
396{
397 struct smp_alt_module *mod;
398 u8 **ptr;
076dc4a6
MH
399 u8 *text_start = start;
400 u8 *text_end = end;
2cfa1978
MH
401
402 list_for_each_entry(mod, &smp_alt_modules, next) {
076dc4a6 403 if (mod->text > text_end || mod->text_end < text_start)
2cfa1978
MH
404 continue;
405 for (ptr = mod->locks; ptr < mod->locks_end; ptr++)
076dc4a6 406 if (text_start <= *ptr && text_end >= *ptr)
2cfa1978
MH
407 return 1;
408 }
409
410 return 0;
411}
8ec4d41f
GH
412#endif
413
139ec7c4 414#ifdef CONFIG_PARAVIRT
8b5a10fc
JB
415void __init_or_module apply_paravirt(struct paravirt_patch_site *start,
416 struct paravirt_patch_site *end)
139ec7c4 417{
98de032b 418 struct paravirt_patch_site *p;
ab144f5e 419 char insnbuf[MAX_PATCH_LEN];
139ec7c4 420
959b4fdf
JF
421 if (noreplace_paravirt)
422 return;
423
139ec7c4
RR
424 for (p = start; p < end; p++) {
425 unsigned int used;
426
ab144f5e 427 BUG_ON(p->len > MAX_PATCH_LEN);
d34fda4a
CW
428 /* prep the buffer with the original instructions */
429 memcpy(insnbuf, p->instr, p->len);
93b1eab3
JF
430 used = pv_init_ops.patch(p->instrtype, p->clobbers, insnbuf,
431 (unsigned long)p->instr, p->len);
7f63c41c 432
63f70270
JF
433 BUG_ON(used > p->len);
434
139ec7c4 435 /* Pad the rest with nops */
ab144f5e 436 add_nops(insnbuf + used, p->len - used);
e587cadd 437 text_poke_early(p->instr, insnbuf, p->len);
139ec7c4 438 }
139ec7c4 439}
98de032b 440extern struct paravirt_patch_site __start_parainstructions[],
139ec7c4
RR
441 __stop_parainstructions[];
442#endif /* CONFIG_PARAVIRT */
443
9a0b5817
GH
444void __init alternative_instructions(void)
445{
8f4e956b
AK
446 /* The patching is not fully atomic, so try to avoid local interruptions
447 that might execute the to be patched code.
448 Other CPUs are not running. */
449 stop_nmi();
123aa76e
AK
450
451 /*
452 * Don't stop machine check exceptions while patching.
453 * MCEs only happen when something got corrupted and in this
454 * case we must do something about the corruption.
455 * Ignoring it is worse than a unlikely patching race.
456 * Also machine checks tend to be broadcast and if one CPU
457 * goes into machine check the others follow quickly, so we don't
458 * expect a machine check to cause undue problems during to code
459 * patching.
460 */
8f4e956b 461
9a0b5817
GH
462 apply_alternatives(__alt_instructions, __alt_instructions_end);
463
464 /* switch to patch-once-at-boottime-only mode and free the
465 * tables in case we know the number of CPUs will never ever
466 * change */
467#ifdef CONFIG_HOTPLUG_CPU
468 if (num_possible_cpus() < 2)
469 smp_alt_once = 1;
9a0b5817
GH
470#endif
471
8ec4d41f 472#ifdef CONFIG_SMP
9a0b5817
GH
473 if (smp_alt_once) {
474 if (1 == num_possible_cpus()) {
475 printk(KERN_INFO "SMP alternatives: switching to UP code\n");
53756d37
JF
476 set_cpu_cap(&boot_cpu_data, X86_FEATURE_UP);
477 set_cpu_cap(&cpu_data(0), X86_FEATURE_UP);
478
9a0b5817
GH
479 alternatives_smp_unlock(__smp_locks, __smp_locks_end,
480 _text, _etext);
481 }
9a0b5817 482 } else {
9a0b5817
GH
483 alternatives_smp_module_add(NULL, "core kernel",
484 __smp_locks, __smp_locks_end,
485 _text, _etext);
ca74a6f8
AK
486
487 /* Only switch to UP mode if we don't immediately boot others */
649c6653 488 if (num_present_cpus() == 1 || setup_max_cpus <= 1)
ca74a6f8 489 alternatives_smp_switch(0);
9a0b5817 490 }
8ec4d41f 491#endif
441d40dc 492 apply_paravirt(__parainstructions, __parainstructions_end);
8f4e956b 493
f68fd5f4
FW
494 if (smp_alt_once)
495 free_init_pages("SMP alternatives",
496 (unsigned long)__smp_locks,
497 (unsigned long)__smp_locks_end);
498
8f4e956b 499 restart_nmi();
9a0b5817 500}
19d36ccd 501
e587cadd
MD
502/**
503 * text_poke_early - Update instructions on a live kernel at boot time
504 * @addr: address to modify
505 * @opcode: source of the copy
506 * @len: length to copy
507 *
19d36ccd
AK
508 * When you use this code to patch more than one byte of an instruction
509 * you need to make sure that other CPUs cannot execute this code in parallel.
e587cadd
MD
510 * Also no thread must be currently preempted in the middle of these
511 * instructions. And on the local CPU you need to be protected again NMI or MCE
512 * handlers seeing an inconsistent instruction while you patch.
19d36ccd 513 */
8b5a10fc
JB
514static void *__init_or_module text_poke_early(void *addr, const void *opcode,
515 size_t len)
19d36ccd 516{
e587cadd
MD
517 unsigned long flags;
518 local_irq_save(flags);
19d36ccd 519 memcpy(addr, opcode, len);
e587cadd 520 sync_core();
5367b688 521 local_irq_restore(flags);
e587cadd
MD
522 /* Could also do a CLFLUSH here to speed up CPU recovery; but
523 that causes hangs on some VIA CPUs. */
524 return addr;
525}
526
527/**
528 * text_poke - Update instructions on a live kernel
529 * @addr: address to modify
530 * @opcode: source of the copy
531 * @len: length to copy
532 *
533 * Only atomic text poke/set should be allowed when not doing early patching.
534 * It means the size must be writable atomically and the address must be aligned
535 * in a way that permits an atomic write. It also makes sure we fit on a single
536 * page.
78ff7fae
MH
537 *
538 * Note: Must be called under text_mutex.
e587cadd
MD
539 */
540void *__kprobes text_poke(void *addr, const void *opcode, size_t len)
541{
78ff7fae 542 unsigned long flags;
e587cadd 543 char *vaddr;
b7b66baa
MD
544 struct page *pages[2];
545 int i;
e587cadd 546
b7b66baa
MD
547 if (!core_kernel_text((unsigned long)addr)) {
548 pages[0] = vmalloc_to_page(addr);
549 pages[1] = vmalloc_to_page(addr + PAGE_SIZE);
15a601eb 550 } else {
b7b66baa 551 pages[0] = virt_to_page(addr);
00c6b2d5 552 WARN_ON(!PageReserved(pages[0]));
b7b66baa 553 pages[1] = virt_to_page(addr + PAGE_SIZE);
e587cadd 554 }
b7b66baa 555 BUG_ON(!pages[0]);
7cf49427 556 local_irq_save(flags);
78ff7fae
MH
557 set_fixmap(FIX_TEXT_POKE0, page_to_phys(pages[0]));
558 if (pages[1])
559 set_fixmap(FIX_TEXT_POKE1, page_to_phys(pages[1]));
560 vaddr = (char *)fix_to_virt(FIX_TEXT_POKE0);
b7b66baa 561 memcpy(&vaddr[(unsigned long)addr & ~PAGE_MASK], opcode, len);
78ff7fae
MH
562 clear_fixmap(FIX_TEXT_POKE0);
563 if (pages[1])
564 clear_fixmap(FIX_TEXT_POKE1);
565 local_flush_tlb();
19d36ccd 566 sync_core();
a534b679
AK
567 /* Could also do a CLFLUSH here to speed up CPU recovery; but
568 that causes hangs on some VIA CPUs. */
b7b66baa
MD
569 for (i = 0; i < len; i++)
570 BUG_ON(((char *)addr)[i] != ((char *)opcode)[i]);
7cf49427 571 local_irq_restore(flags);
e587cadd 572 return addr;
19d36ccd 573}
3d55cc8a
MH
574
575/*
576 * Cross-modifying kernel text with stop_machine().
577 * This code originally comes from immediate value.
578 */
579static atomic_t stop_machine_first;
580static int wrote_text;
581
582struct text_poke_params {
583 void *addr;
584 const void *opcode;
585 size_t len;
586};
587
588static int __kprobes stop_machine_text_poke(void *data)
589{
590 struct text_poke_params *tpp = data;
591
592 if (atomic_dec_and_test(&stop_machine_first)) {
593 text_poke(tpp->addr, tpp->opcode, tpp->len);
594 smp_wmb(); /* Make sure other cpus see that this has run */
595 wrote_text = 1;
596 } else {
597 while (!wrote_text)
598 smp_rmb();
599 sync_core();
600 }
601
602 flush_icache_range((unsigned long)tpp->addr,
603 (unsigned long)tpp->addr + tpp->len);
604 return 0;
605}
606
607/**
608 * text_poke_smp - Update instructions on a live kernel on SMP
609 * @addr: address to modify
610 * @opcode: source of the copy
611 * @len: length to copy
612 *
613 * Modify multi-byte instruction by using stop_machine() on SMP. This allows
614 * user to poke/set multi-byte text on SMP. Only non-NMI/MCE code modifying
615 * should be allowed, since stop_machine() does _not_ protect code against
616 * NMI and MCE.
617 *
618 * Note: Must be called under get_online_cpus() and text_mutex.
619 */
620void *__kprobes text_poke_smp(void *addr, const void *opcode, size_t len)
621{
622 struct text_poke_params tpp;
623
624 tpp.addr = addr;
625 tpp.opcode = opcode;
626 tpp.len = len;
627 atomic_set(&stop_machine_first, 1);
628 wrote_text = 0;
629 stop_machine(stop_machine_text_poke, (void *)&tpp, NULL);
630 return addr;
631}
632
This page took 0.520943 seconds and 5 git commands to generate.