blob: 226882fe85a6581876a06721147dcaa90619eb73 [file] [log] [blame]
Alexander Graf2a342ed2010-07-29 14:47:48 +02001/*
2 * Copyright (C) 2010 SUSE Linux Products GmbH. All rights reserved.
3 *
4 * Authors:
5 * Alexander Graf <agraf@suse.de>
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License, version 2, as
9 * published by the Free Software Foundation.
10 *
11 * This program is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 * GNU General Public License for more details.
15 *
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
19 */
20
21#include <linux/kvm_host.h>
22#include <linux/init.h>
23#include <linux/kvm_para.h>
24#include <linux/slab.h>
25#include <linux/of.h>
26
27#include <asm/reg.h>
Alexander Graf2a342ed2010-07-29 14:47:48 +020028#include <asm/sections.h>
29#include <asm/cacheflush.h>
30#include <asm/disassemble.h>
31
/*
 * Effective address at which the guest asks the host to map the shared
 * "magic page" (see kvm_map_magic_page()).
 */
#define KVM_MAGIC_PAGE		(-4096L)

/*
 * Address of field x of struct kvm_vcpu_arch_shared inside the magic page.
 * The expansion is fully parenthesized so that it can be used safely inside
 * larger expressions.
 */
#define magic_var(x)		(KVM_MAGIC_PAGE + \
				 offsetof(struct kvm_vcpu_arch_shared, x))

/*
 * Instruction templates used when rewriting guest code. The register and
 * displacement fields are OR-ed in by the kvm_patch_ins_*() helpers.
 */
#define KVM_INST_LWZ		0x80000000
#define KVM_INST_STW		0x90000000
#define KVM_INST_LD		0xe8000000
#define KVM_INST_STD		0xf8000000
#define KVM_INST_NOP		0x60000000
#define KVM_INST_B		0x48000000
/* Bits of a "b" instruction that carry the branch displacement */
#define KVM_INST_B_MASK		0x03ffffff
/* Largest displacement accepted when generating a "b" instruction */
#define KVM_INST_B_MAX		0x01ffffff

/* Bits of an instruction word that hold the RT/RS register field */
#define KVM_MASK_RT		0x03e00000

/* Instructions (with the register field cleared) that get replaced by loads */
#define KVM_INST_MFMSR		0x7c0000a6
#define KVM_INST_MFSPR_SPRG0	0x7c1042a6
#define KVM_INST_MFSPR_SPRG1	0x7c1142a6
#define KVM_INST_MFSPR_SPRG2	0x7c1242a6
#define KVM_INST_MFSPR_SPRG3	0x7c1342a6
#define KVM_INST_MFSPR_SRR0	0x7c1a02a6
#define KVM_INST_MFSPR_SRR1	0x7c1b02a6
#define KVM_INST_MFSPR_DAR	0x7c1302a6
#define KVM_INST_MFSPR_DSISR	0x7c1202a6

/* Instructions (with the register field cleared) that get replaced by stores */
#define KVM_INST_MTSPR_SPRG0	0x7c1043a6
#define KVM_INST_MTSPR_SPRG1	0x7c1143a6
#define KVM_INST_MTSPR_SPRG2	0x7c1243a6
#define KVM_INST_MTSPR_SPRG3	0x7c1343a6
#define KVM_INST_MTSPR_SRR0	0x7c1a03a6
#define KVM_INST_MTSPR_SRR1	0x7c1b03a6
#define KVM_INST_MTSPR_DAR	0x7c1303a6
#define KVM_INST_MTSPR_DSISR	0x7c1203a6

/* Instructions that are replaced by a nop or by an emulation trampoline */
#define KVM_INST_TLBSYNC	0x7c00046c
#define KVM_INST_MTMSRD_L0	0x7c000164
#define KVM_INST_MTMSRD_L1	0x7c010164
#define KVM_INST_MTMSR		0x7c000124

/* Matched against the complete instruction word (see kvm_check_ins()) */
#define KVM_INST_WRTEEI_0	0x7c000146
#define KVM_INST_WRTEEI_1	0x7c008146

/* Cleared as soon as any patching step fails; reported once at the end */
static bool kvm_patching_worked = true;
/* Scratch space that kvm_alloc() hands out for emulation trampolines */
static char kvm_tmp[1024 * 1024];
/* Number of bytes of kvm_tmp already handed out */
static int kvm_tmp_index;
Alexander Graf73a18102010-07-29 14:47:58 +020075
76static inline void kvm_patch_ins(u32 *inst, u32 new_inst)
77{
78 *inst = new_inst;
79 flush_icache_range((ulong)inst, (ulong)inst + 4);
80}
81
Alexander Grafd1293c92010-07-29 14:47:59 +020082static void kvm_patch_ins_ld(u32 *inst, long addr, u32 rt)
83{
84#ifdef CONFIG_64BIT
85 kvm_patch_ins(inst, KVM_INST_LD | rt | (addr & 0x0000fffc));
86#else
87 kvm_patch_ins(inst, KVM_INST_LWZ | rt | ((addr + 4) & 0x0000fffc));
88#endif
89}
90
91static void kvm_patch_ins_lwz(u32 *inst, long addr, u32 rt)
92{
93 kvm_patch_ins(inst, KVM_INST_LWZ | rt | (addr & 0x0000ffff));
94}
95
96static void kvm_patch_ins_std(u32 *inst, long addr, u32 rt)
97{
98#ifdef CONFIG_64BIT
99 kvm_patch_ins(inst, KVM_INST_STD | rt | (addr & 0x0000fffc));
100#else
101 kvm_patch_ins(inst, KVM_INST_STW | rt | ((addr + 4) & 0x0000fffc));
102#endif
103}
104
105static void kvm_patch_ins_stw(u32 *inst, long addr, u32 rt)
106{
107 kvm_patch_ins(inst, KVM_INST_STW | rt | (addr & 0x0000fffc));
108}
109
Alexander Grafd1290b152010-07-29 14:48:00 +0200110static void kvm_patch_ins_nop(u32 *inst)
111{
112 kvm_patch_ins(inst, KVM_INST_NOP);
113}
114
Alexander Graf71ee8e32010-07-29 14:48:02 +0200115static void kvm_patch_ins_b(u32 *inst, int addr)
116{
117#ifdef CONFIG_RELOCATABLE
118 /* On relocatable kernels interrupts handlers and our code
119 can be in different regions, so we don't patch them */
120
121 extern u32 __end_interrupts;
122 if ((ulong)inst < (ulong)&__end_interrupts)
123 return;
124#endif
125
126 kvm_patch_ins(inst, KVM_INST_B | (addr & KVM_INST_B_MASK));
127}
128
Alexander Graf2d4f5672010-07-29 14:48:01 +0200129static u32 *kvm_alloc(int len)
130{
131 u32 *p;
132
133 if ((kvm_tmp_index + len) > ARRAY_SIZE(kvm_tmp)) {
134 printk(KERN_ERR "KVM: No more space (%d + %d)\n",
135 kvm_tmp_index, len);
136 kvm_patching_worked = false;
137 return NULL;
138 }
139
140 p = (void*)&kvm_tmp[kvm_tmp_index];
141 kvm_tmp_index += len;
142
143 return p;
144}
145
Alexander Graf819a63d2010-07-29 14:48:04 +0200146extern u32 kvm_emulate_mtmsrd_branch_offs;
147extern u32 kvm_emulate_mtmsrd_reg_offs;
148extern u32 kvm_emulate_mtmsrd_len;
149extern u32 kvm_emulate_mtmsrd[];
150
151static void kvm_patch_ins_mtmsrd(u32 *inst, u32 rt)
152{
153 u32 *p;
154 int distance_start;
155 int distance_end;
156 ulong next_inst;
157
158 p = kvm_alloc(kvm_emulate_mtmsrd_len * 4);
159 if (!p)
160 return;
161
162 /* Find out where we are and put everything there */
163 distance_start = (ulong)p - (ulong)inst;
164 next_inst = ((ulong)inst + 4);
165 distance_end = next_inst - (ulong)&p[kvm_emulate_mtmsrd_branch_offs];
166
167 /* Make sure we only write valid b instructions */
168 if (distance_start > KVM_INST_B_MAX) {
169 kvm_patching_worked = false;
170 return;
171 }
172
173 /* Modify the chunk to fit the invocation */
174 memcpy(p, kvm_emulate_mtmsrd, kvm_emulate_mtmsrd_len * 4);
175 p[kvm_emulate_mtmsrd_branch_offs] |= distance_end & KVM_INST_B_MASK;
176 p[kvm_emulate_mtmsrd_reg_offs] |= rt;
177 flush_icache_range((ulong)p, (ulong)p + kvm_emulate_mtmsrd_len * 4);
178
179 /* Patch the invocation */
180 kvm_patch_ins_b(inst, distance_start);
181}
182
Alexander Graf78109272010-07-29 14:48:05 +0200183extern u32 kvm_emulate_mtmsr_branch_offs;
184extern u32 kvm_emulate_mtmsr_reg1_offs;
185extern u32 kvm_emulate_mtmsr_reg2_offs;
186extern u32 kvm_emulate_mtmsr_reg3_offs;
187extern u32 kvm_emulate_mtmsr_orig_ins_offs;
188extern u32 kvm_emulate_mtmsr_len;
189extern u32 kvm_emulate_mtmsr[];
190
191static void kvm_patch_ins_mtmsr(u32 *inst, u32 rt)
192{
193 u32 *p;
194 int distance_start;
195 int distance_end;
196 ulong next_inst;
197
198 p = kvm_alloc(kvm_emulate_mtmsr_len * 4);
199 if (!p)
200 return;
201
202 /* Find out where we are and put everything there */
203 distance_start = (ulong)p - (ulong)inst;
204 next_inst = ((ulong)inst + 4);
205 distance_end = next_inst - (ulong)&p[kvm_emulate_mtmsr_branch_offs];
206
207 /* Make sure we only write valid b instructions */
208 if (distance_start > KVM_INST_B_MAX) {
209 kvm_patching_worked = false;
210 return;
211 }
212
213 /* Modify the chunk to fit the invocation */
214 memcpy(p, kvm_emulate_mtmsr, kvm_emulate_mtmsr_len * 4);
215 p[kvm_emulate_mtmsr_branch_offs] |= distance_end & KVM_INST_B_MASK;
216 p[kvm_emulate_mtmsr_reg1_offs] |= rt;
217 p[kvm_emulate_mtmsr_reg2_offs] |= rt;
218 p[kvm_emulate_mtmsr_reg3_offs] |= rt;
219 p[kvm_emulate_mtmsr_orig_ins_offs] = *inst;
220 flush_icache_range((ulong)p, (ulong)p + kvm_emulate_mtmsr_len * 4);
221
222 /* Patch the invocation */
223 kvm_patch_ins_b(inst, distance_start);
224}
225
#ifdef CONFIG_BOOKE

extern u32 kvm_emulate_wrteei_branch_offs;
extern u32 kvm_emulate_wrteei_ee_offs;
extern u32 kvm_emulate_wrteei_len;
extern u32 kvm_emulate_wrteei[];

/*
 * Redirect the wrteei at @inst to a private copy of the kvm_emulate_wrteei
 * template.
 *
 * The copy is placed in kvm_tmp, its return branch is fixed up to land on
 * the instruction following @inst, the MSR_EE bit of the original
 * instruction word is merged into the template's "ee" slot, and finally
 * @inst itself is replaced by a branch to the copy.
 *
 * On any failure kvm_patching_worked is cleared and @inst is left alone.
 */
static void kvm_patch_ins_wrteei(u32 *inst)
{
	u32 *p;
	long distance_start;
	long distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_wrteei_len * 4);
	if (!p)
		return;

	/*
	 * Find out where we are and put everything there. The distances are
	 * kept as long so that nothing is truncated before the range check.
	 */
	distance_start = (long)((ulong)p - (ulong)inst);
	next_inst = ((ulong)inst + 4);
	distance_end = (long)(next_inst -
			      (ulong)&p[kvm_emulate_wrteei_branch_offs]);

	/*
	 * Make sure we only write valid b instructions: both the branch into
	 * the trampoline and the branch back must fit the signed displacement
	 * field, in either direction.
	 */
	if (distance_start > KVM_INST_B_MAX ||
	    distance_start < -(KVM_INST_B_MAX + 1L) ||
	    distance_end > KVM_INST_B_MAX ||
	    distance_end < -(KVM_INST_B_MAX + 1L)) {
		kvm_patching_worked = false;
		return;
	}

	/* Modify the chunk to fit the invocation */
	memcpy(p, kvm_emulate_wrteei, kvm_emulate_wrteei_len * 4);
	p[kvm_emulate_wrteei_branch_offs] |= distance_end & KVM_INST_B_MASK;
	p[kvm_emulate_wrteei_ee_offs] |= (*inst & MSR_EE);
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_wrteei_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}

#endif
266
Alexander Graf73a18102010-07-29 14:47:58 +0200267static void kvm_map_magic_page(void *data)
268{
Alexander Graf7508e162010-08-03 11:32:56 +0200269 u32 *features = data;
270
271 ulong in[8];
272 ulong out[8];
273
274 in[0] = KVM_MAGIC_PAGE;
275 in[1] = KVM_MAGIC_PAGE;
276
277 kvm_hypercall(in, out, HC_VENDOR_KVM | KVM_HC_PPC_MAP_MAGIC_PAGE);
278
279 *features = out[0];
Alexander Graf73a18102010-07-29 14:47:58 +0200280}
281
Alexander Graf7508e162010-08-03 11:32:56 +0200282static void kvm_check_ins(u32 *inst, u32 features)
Alexander Graf73a18102010-07-29 14:47:58 +0200283{
284 u32 _inst = *inst;
285 u32 inst_no_rt = _inst & ~KVM_MASK_RT;
286 u32 inst_rt = _inst & KVM_MASK_RT;
287
288 switch (inst_no_rt) {
Alexander Grafd1293c92010-07-29 14:47:59 +0200289 /* Loads */
290 case KVM_INST_MFMSR:
291 kvm_patch_ins_ld(inst, magic_var(msr), inst_rt);
292 break;
293 case KVM_INST_MFSPR_SPRG0:
294 kvm_patch_ins_ld(inst, magic_var(sprg0), inst_rt);
295 break;
296 case KVM_INST_MFSPR_SPRG1:
297 kvm_patch_ins_ld(inst, magic_var(sprg1), inst_rt);
298 break;
299 case KVM_INST_MFSPR_SPRG2:
300 kvm_patch_ins_ld(inst, magic_var(sprg2), inst_rt);
301 break;
302 case KVM_INST_MFSPR_SPRG3:
303 kvm_patch_ins_ld(inst, magic_var(sprg3), inst_rt);
304 break;
305 case KVM_INST_MFSPR_SRR0:
306 kvm_patch_ins_ld(inst, magic_var(srr0), inst_rt);
307 break;
308 case KVM_INST_MFSPR_SRR1:
309 kvm_patch_ins_ld(inst, magic_var(srr1), inst_rt);
310 break;
311 case KVM_INST_MFSPR_DAR:
312 kvm_patch_ins_ld(inst, magic_var(dar), inst_rt);
313 break;
314 case KVM_INST_MFSPR_DSISR:
315 kvm_patch_ins_lwz(inst, magic_var(dsisr), inst_rt);
316 break;
317
318 /* Stores */
319 case KVM_INST_MTSPR_SPRG0:
320 kvm_patch_ins_std(inst, magic_var(sprg0), inst_rt);
321 break;
322 case KVM_INST_MTSPR_SPRG1:
323 kvm_patch_ins_std(inst, magic_var(sprg1), inst_rt);
324 break;
325 case KVM_INST_MTSPR_SPRG2:
326 kvm_patch_ins_std(inst, magic_var(sprg2), inst_rt);
327 break;
328 case KVM_INST_MTSPR_SPRG3:
329 kvm_patch_ins_std(inst, magic_var(sprg3), inst_rt);
330 break;
331 case KVM_INST_MTSPR_SRR0:
332 kvm_patch_ins_std(inst, magic_var(srr0), inst_rt);
333 break;
334 case KVM_INST_MTSPR_SRR1:
335 kvm_patch_ins_std(inst, magic_var(srr1), inst_rt);
336 break;
337 case KVM_INST_MTSPR_DAR:
338 kvm_patch_ins_std(inst, magic_var(dar), inst_rt);
339 break;
340 case KVM_INST_MTSPR_DSISR:
341 kvm_patch_ins_stw(inst, magic_var(dsisr), inst_rt);
342 break;
Alexander Grafd1290b152010-07-29 14:48:00 +0200343
344 /* Nops */
345 case KVM_INST_TLBSYNC:
346 kvm_patch_ins_nop(inst);
347 break;
Alexander Graf819a63d2010-07-29 14:48:04 +0200348
349 /* Rewrites */
350 case KVM_INST_MTMSRD_L1:
351 /* We use r30 and r31 during the hook */
352 if (get_rt(inst_rt) < 30)
353 kvm_patch_ins_mtmsrd(inst, inst_rt);
354 break;
Alexander Graf78109272010-07-29 14:48:05 +0200355 case KVM_INST_MTMSR:
356 case KVM_INST_MTMSRD_L0:
357 /* We use r30 and r31 during the hook */
358 if (get_rt(inst_rt) < 30)
359 kvm_patch_ins_mtmsr(inst, inst_rt);
360 break;
Alexander Graf73a18102010-07-29 14:47:58 +0200361 }
362
363 switch (_inst) {
Alexander Graf644bfa02010-07-29 14:48:06 +0200364#ifdef CONFIG_BOOKE
365 case KVM_INST_WRTEEI_0:
366 case KVM_INST_WRTEEI_1:
367 kvm_patch_ins_wrteei(inst);
368 break;
369#endif
Alexander Graf73a18102010-07-29 14:47:58 +0200370 }
371}
372
373static void kvm_use_magic_page(void)
374{
375 u32 *p;
376 u32 *start, *end;
377 u32 tmp;
Alexander Graf7508e162010-08-03 11:32:56 +0200378 u32 features;
Alexander Graf73a18102010-07-29 14:47:58 +0200379
380 /* Tell the host to map the magic page to -4096 on all CPUs */
Alexander Graf7508e162010-08-03 11:32:56 +0200381 on_each_cpu(kvm_map_magic_page, &features, 1);
Alexander Graf73a18102010-07-29 14:47:58 +0200382
383 /* Quick self-test to see if the mapping works */
384 if (__get_user(tmp, (u32*)KVM_MAGIC_PAGE)) {
385 kvm_patching_worked = false;
386 return;
387 }
388
389 /* Now loop through all code and find instructions */
390 start = (void*)_stext;
391 end = (void*)_etext;
392
393 for (p = start; p < end; p++)
Alexander Graf7508e162010-08-03 11:32:56 +0200394 kvm_check_ins(p, features);
Alexander Graf73a18102010-07-29 14:47:58 +0200395
396 printk(KERN_INFO "KVM: Live patching for a fast VM %s\n",
397 kvm_patching_worked ? "worked" : "failed");
398}
399
Alexander Graf2a342ed2010-07-29 14:47:48 +0200400unsigned long kvm_hypercall(unsigned long *in,
401 unsigned long *out,
402 unsigned long nr)
403{
404 unsigned long register r0 asm("r0");
405 unsigned long register r3 asm("r3") = in[0];
406 unsigned long register r4 asm("r4") = in[1];
407 unsigned long register r5 asm("r5") = in[2];
408 unsigned long register r6 asm("r6") = in[3];
409 unsigned long register r7 asm("r7") = in[4];
410 unsigned long register r8 asm("r8") = in[5];
411 unsigned long register r9 asm("r9") = in[6];
412 unsigned long register r10 asm("r10") = in[7];
413 unsigned long register r11 asm("r11") = nr;
414 unsigned long register r12 asm("r12");
415
416 asm volatile("bl kvm_hypercall_start"
417 : "=r"(r0), "=r"(r3), "=r"(r4), "=r"(r5), "=r"(r6),
418 "=r"(r7), "=r"(r8), "=r"(r9), "=r"(r10), "=r"(r11),
419 "=r"(r12)
420 : "r"(r3), "r"(r4), "r"(r5), "r"(r6), "r"(r7), "r"(r8),
421 "r"(r9), "r"(r10), "r"(r11)
422 : "memory", "cc", "xer", "ctr", "lr");
423
424 out[0] = r4;
425 out[1] = r5;
426 out[2] = r6;
427 out[3] = r7;
428 out[4] = r8;
429 out[5] = r9;
430 out[6] = r10;
431 out[7] = r11;
432
433 return r3;
434}
435EXPORT_SYMBOL_GPL(kvm_hypercall);
Alexander Graf73a18102010-07-29 14:47:58 +0200436
437static int kvm_para_setup(void)
438{
439 extern u32 kvm_hypercall_start;
440 struct device_node *hyper_node;
441 u32 *insts;
442 int len, i;
443
444 hyper_node = of_find_node_by_path("/hypervisor");
445 if (!hyper_node)
446 return -1;
447
448 insts = (u32*)of_get_property(hyper_node, "hcall-instructions", &len);
449 if (len % 4)
450 return -1;
451 if (len > (4 * 4))
452 return -1;
453
454 for (i = 0; i < (len / 4); i++)
455 kvm_patch_ins(&(&kvm_hypercall_start)[i], insts[i]);
456
457 return 0;
458}
459
Alexander Graf2d4f5672010-07-29 14:48:01 +0200460static __init void kvm_free_tmp(void)
461{
462 unsigned long start, end;
463
464 start = (ulong)&kvm_tmp[kvm_tmp_index + (PAGE_SIZE - 1)] & PAGE_MASK;
465 end = (ulong)&kvm_tmp[ARRAY_SIZE(kvm_tmp)] & PAGE_MASK;
466
467 /* Free the tmp space we don't need */
468 for (; start < end; start += PAGE_SIZE) {
469 ClearPageReserved(virt_to_page(start));
470 init_page_count(virt_to_page(start));
471 free_page(start);
472 totalram_pages++;
473 }
474}
475
Alexander Graf73a18102010-07-29 14:47:58 +0200476static int __init kvm_guest_init(void)
477{
478 if (!kvm_para_available())
Alexander Graf2d4f5672010-07-29 14:48:01 +0200479 goto free_tmp;
Alexander Graf73a18102010-07-29 14:47:58 +0200480
481 if (kvm_para_setup())
Alexander Graf2d4f5672010-07-29 14:48:01 +0200482 goto free_tmp;
Alexander Graf73a18102010-07-29 14:47:58 +0200483
484 if (kvm_para_has_feature(KVM_FEATURE_MAGIC_PAGE))
485 kvm_use_magic_page();
486
Alexander Graf2d4f5672010-07-29 14:48:01 +0200487free_tmp:
488 kvm_free_tmp();
489
Alexander Graf73a18102010-07-29 14:47:58 +0200490 return 0;
491}
492
493postcore_initcall(kvm_guest_init);