/*
 * Copyright (C) 2010 SUSE Linux Products GmbH. All rights reserved.
 * Copyright 2010-2011 Freescale Semiconductor, Inc.
 *
 * Authors:
 *     Alexander Graf <agraf@suse.de>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License, version 2, as
 * published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 */
#include <linux/kvm_host.h>
#include <linux/init.h>
#include <linux/export.h>
#include <linux/kvm_para.h>
#include <linux/slab.h>
#include <linux/of.h>

#include <asm/reg.h>
#include <asm/sections.h>
#include <asm/cacheflush.h>
#include <asm/disassemble.h>
#include <asm/ppc-opcode.h>
#define KVM_MAGIC_PAGE		(-4096L)
#define magic_var(x) KVM_MAGIC_PAGE + offsetof(struct kvm_vcpu_arch_shared, x)

#define KVM_INST_LWZ		0x80000000
#define KVM_INST_STW		0x90000000
#define KVM_INST_LD		0xe8000000
#define KVM_INST_STD		0xf8000000
#define KVM_INST_NOP		0x60000000
#define KVM_INST_B		0x48000000
#define KVM_INST_B_MASK		0x03ffffff
#define KVM_INST_B_MAX		0x01ffffff
#define KVM_INST_LI		0x38000000

#define KVM_MASK_RT		0x03e00000
#define KVM_RT_30		0x03c00000
#define KVM_MASK_RB		0x0000f800
#define KVM_INST_MFMSR		0x7c0000a6
#define KVM_INST_MFSPR_SPRG0	0x7c1042a6
#define KVM_INST_MFSPR_SPRG1	0x7c1142a6
#define KVM_INST_MFSPR_SPRG2	0x7c1242a6
#define KVM_INST_MFSPR_SPRG3	0x7c1342a6
#define KVM_INST_MFSPR_SRR0	0x7c1a02a6
#define KVM_INST_MFSPR_SRR1	0x7c1b02a6
#define KVM_INST_MFSPR_DAR	0x7c1302a6
#define KVM_INST_MFSPR_DSISR	0x7c1202a6

#define KVM_INST_MTSPR_SPRG0	0x7c1043a6
#define KVM_INST_MTSPR_SPRG1	0x7c1143a6
#define KVM_INST_MTSPR_SPRG2	0x7c1243a6
#define KVM_INST_MTSPR_SPRG3	0x7c1343a6
#define KVM_INST_MTSPR_SRR0	0x7c1a03a6
#define KVM_INST_MTSPR_SRR1	0x7c1b03a6
#define KVM_INST_MTSPR_DAR	0x7c1303a6
#define KVM_INST_MTSPR_DSISR	0x7c1203a6

#define KVM_INST_TLBSYNC	0x7c00046c
#define KVM_INST_MTMSRD_L0	0x7c000164
#define KVM_INST_MTMSRD_L1	0x7c010164
#define KVM_INST_MTMSR		0x7c000124

#define KVM_INST_WRTEE		0x7c000106
#define KVM_INST_WRTEEI_0	0x7c000146
#define KVM_INST_WRTEEI_1	0x7c008146

#define KVM_INST_MTSRIN		0x7c0001e4
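
/*
 * Scratch buffer that holds the generated out-of-line emulation code.
 * Whatever is left unused is handed back to the page allocator by
 * kvm_free_tmp() at the end of init.
 */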
static bool kvm_patching_worked = true;
static char kvm_tmp[1024 * 1024];
static int kvm_tmp_index;
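
/* Replace a single kernel instruction and make sure it gets refetched. */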
static inline void kvm_patch_ins(u32 *inst, u32 new_inst)
{
	*inst = new_inst;
	flush_icache_range((ulong)inst, (ulong)inst + 4);
}
static void kvm_patch_ins_ll(u32 *inst, long addr, u32 rt)
{
#ifdef CONFIG_64BIT
	kvm_patch_ins(inst, KVM_INST_LD | rt | (addr & 0x0000fffc));
#else
	kvm_patch_ins(inst, KVM_INST_LWZ | rt | (addr & 0x0000fffc));
#endif
}
static void kvm_patch_ins_ld(u32 *inst, long addr, u32 rt)
{
#ifdef CONFIG_64BIT
	kvm_patch_ins(inst, KVM_INST_LD | rt | (addr & 0x0000fffc));
#else
	kvm_patch_ins(inst, KVM_INST_LWZ | rt | ((addr + 4) & 0x0000fffc));
#endif
}
static void kvm_patch_ins_lwz(u32 *inst, long addr, u32 rt)
{
	kvm_patch_ins(inst, KVM_INST_LWZ | rt | (addr & 0x0000ffff));
}
static void kvm_patch_ins_std(u32 *inst, long addr, u32 rt)
{
#ifdef CONFIG_64BIT
	kvm_patch_ins(inst, KVM_INST_STD | rt | (addr & 0x0000fffc));
#else
	kvm_patch_ins(inst, KVM_INST_STW | rt | ((addr + 4) & 0x0000fffc));
#endif
}
static void kvm_patch_ins_stw(u32 *inst, long addr, u32 rt)
{
	kvm_patch_ins(inst, KVM_INST_STW | rt | (addr & 0x0000fffc));
}
static void kvm_patch_ins_nop(u32 *inst)
{
	kvm_patch_ins(inst, KVM_INST_NOP);
}
static void kvm_patch_ins_b(u32 *inst, int addr)
{
#if defined(CONFIG_RELOCATABLE) && defined(CONFIG_PPC_BOOK3S)
	/* On relocatable kernels interrupt handlers and our code
	   can be in different regions, so we don't patch them */
	if ((ulong)inst < (ulong)&__end_interrupts)
		return;
#endif

	kvm_patch_ins(inst, KVM_INST_B | (addr & KVM_INST_B_MASK));
}
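
/* Carve len bytes out of kvm_tmp for a generated emulation stub. */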
static u32 *kvm_alloc(int len)
{
	u32 *p;

	if ((kvm_tmp_index + len) > ARRAY_SIZE(kvm_tmp)) {
		printk(KERN_ERR "KVM: No more space (%d + %d)\n",
				kvm_tmp_index, len);
		kvm_patching_worked = false;
		return NULL;
	}

	p = (void*)&kvm_tmp[kvm_tmp_index];
	kvm_tmp_index += len;

	return p;
}
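
/*
 * The kvm_emulate_* arrays and their *_offs/*_len symbols are assembly
 * templates provided outside this file.  Each patcher below copies a
 * template into kvm_tmp, fixes up the marked instruction slots for the
 * concrete register and return address, and finally replaces the trapping
 * instruction with a branch into the copy.
 */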
extern u32 kvm_emulate_mtmsrd_branch_offs;
extern u32 kvm_emulate_mtmsrd_reg_offs;
extern u32 kvm_emulate_mtmsrd_orig_ins_offs;
extern u32 kvm_emulate_mtmsrd_len;
extern u32 kvm_emulate_mtmsrd[];
static void kvm_patch_ins_mtmsrd(u32 *inst, u32 rt)
{
	u32 *p;
	int distance_start;
	int distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_mtmsrd_len * 4);
	if (!p)
		return;

	/* Find out where we are and put everything there */
	distance_start = (ulong)p - (ulong)inst;
	next_inst = ((ulong)inst + 4);
	distance_end = next_inst - (ulong)&p[kvm_emulate_mtmsrd_branch_offs];

	/* Make sure we only write valid b instructions */
	if (distance_start > KVM_INST_B_MAX) {
		kvm_patching_worked = false;
		return;
	}

	/* Modify the chunk to fit the invocation */
	memcpy(p, kvm_emulate_mtmsrd, kvm_emulate_mtmsrd_len * 4);
	p[kvm_emulate_mtmsrd_branch_offs] |= distance_end & KVM_INST_B_MASK;
	switch (get_rt(rt)) {
	case 30:
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsrd_reg_offs],
				 magic_var(scratch2), KVM_RT_30);
		break;
	case 31:
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsrd_reg_offs],
				 magic_var(scratch1), KVM_RT_30);
		break;
	default:
		p[kvm_emulate_mtmsrd_reg_offs] |= rt;
		break;
	}

	p[kvm_emulate_mtmsrd_orig_ins_offs] = *inst;
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_mtmsrd_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}
extern u32 kvm_emulate_mtmsr_branch_offs;
extern u32 kvm_emulate_mtmsr_reg1_offs;
extern u32 kvm_emulate_mtmsr_reg2_offs;
extern u32 kvm_emulate_mtmsr_orig_ins_offs;
extern u32 kvm_emulate_mtmsr_len;
extern u32 kvm_emulate_mtmsr[];
static void kvm_patch_ins_mtmsr(u32 *inst, u32 rt)
{
	u32 *p;
	int distance_start;
	int distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_mtmsr_len * 4);
	if (!p)
		return;

	/* Find out where we are and put everything there */
	distance_start = (ulong)p - (ulong)inst;
	next_inst = ((ulong)inst + 4);
	distance_end = next_inst - (ulong)&p[kvm_emulate_mtmsr_branch_offs];

	/* Make sure we only write valid b instructions */
	if (distance_start > KVM_INST_B_MAX) {
		kvm_patching_worked = false;
		return;
	}

	/* Modify the chunk to fit the invocation */
	memcpy(p, kvm_emulate_mtmsr, kvm_emulate_mtmsr_len * 4);
	p[kvm_emulate_mtmsr_branch_offs] |= distance_end & KVM_INST_B_MASK;

	/* Make clobbered registers work too */
	switch (get_rt(rt)) {
	case 30:
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsr_reg1_offs],
				 magic_var(scratch2), KVM_RT_30);
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsr_reg2_offs],
				 magic_var(scratch2), KVM_RT_30);
		break;
	case 31:
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsr_reg1_offs],
				 magic_var(scratch1), KVM_RT_30);
		kvm_patch_ins_ll(&p[kvm_emulate_mtmsr_reg2_offs],
				 magic_var(scratch1), KVM_RT_30);
		break;
	default:
		p[kvm_emulate_mtmsr_reg1_offs] |= rt;
		p[kvm_emulate_mtmsr_reg2_offs] |= rt;
		break;
	}

	p[kvm_emulate_mtmsr_orig_ins_offs] = *inst;
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_mtmsr_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}
extern u32 kvm_emulate_wrtee_branch_offs;
extern u32 kvm_emulate_wrtee_reg_offs;
extern u32 kvm_emulate_wrtee_orig_ins_offs;
extern u32 kvm_emulate_wrtee_len;
extern u32 kvm_emulate_wrtee[];
static void kvm_patch_ins_wrtee(u32 *inst, u32 rt, int imm_one)
{
	u32 *p;
	int distance_start;
	int distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_wrtee_len * 4);
	if (!p)
		return;

	/* Find out where we are and put everything there */
	distance_start = (ulong)p - (ulong)inst;
	next_inst = ((ulong)inst + 4);
	distance_end = next_inst - (ulong)&p[kvm_emulate_wrtee_branch_offs];

	/* Make sure we only write valid b instructions */
	if (distance_start > KVM_INST_B_MAX) {
		kvm_patching_worked = false;
		return;
	}

	/* Modify the chunk to fit the invocation */
	memcpy(p, kvm_emulate_wrtee, kvm_emulate_wrtee_len * 4);
	p[kvm_emulate_wrtee_branch_offs] |= distance_end & KVM_INST_B_MASK;

	if (imm_one) {
		p[kvm_emulate_wrtee_reg_offs] =
			KVM_INST_LI | __PPC_RT(30) | MSR_EE;
	} else {
		/* Make clobbered registers work too */
		switch (get_rt(rt)) {
		case 30:
			kvm_patch_ins_ll(&p[kvm_emulate_wrtee_reg_offs],
					 magic_var(scratch2), KVM_RT_30);
			break;
		case 31:
			kvm_patch_ins_ll(&p[kvm_emulate_wrtee_reg_offs],
					 magic_var(scratch1), KVM_RT_30);
			break;
		default:
			p[kvm_emulate_wrtee_reg_offs] |= rt;
			break;
		}
	}

	p[kvm_emulate_wrtee_orig_ins_offs] = *inst;
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_wrtee_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}
extern u32 kvm_emulate_wrteei_0_branch_offs;
extern u32 kvm_emulate_wrteei_0_len;
extern u32 kvm_emulate_wrteei_0[];
static void kvm_patch_ins_wrteei_0(u32 *inst)
{
	u32 *p;
	int distance_start;
	int distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_wrteei_0_len * 4);
	if (!p)
		return;

	/* Find out where we are and put everything there */
	distance_start = (ulong)p - (ulong)inst;
	next_inst = ((ulong)inst + 4);
	distance_end = next_inst - (ulong)&p[kvm_emulate_wrteei_0_branch_offs];

	/* Make sure we only write valid b instructions */
	if (distance_start > KVM_INST_B_MAX) {
		kvm_patching_worked = false;
		return;
	}

	memcpy(p, kvm_emulate_wrteei_0, kvm_emulate_wrteei_0_len * 4);
	p[kvm_emulate_wrteei_0_branch_offs] |= distance_end & KVM_INST_B_MASK;
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_wrteei_0_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}
#ifdef CONFIG_PPC_BOOK3S_32

extern u32 kvm_emulate_mtsrin_branch_offs;
extern u32 kvm_emulate_mtsrin_reg1_offs;
extern u32 kvm_emulate_mtsrin_reg2_offs;
extern u32 kvm_emulate_mtsrin_orig_ins_offs;
extern u32 kvm_emulate_mtsrin_len;
extern u32 kvm_emulate_mtsrin[];
static void kvm_patch_ins_mtsrin(u32 *inst, u32 rt, u32 rb)
{
	u32 *p;
	int distance_start;
	int distance_end;
	ulong next_inst;

	p = kvm_alloc(kvm_emulate_mtsrin_len * 4);
	if (!p)
		return;

	/* Find out where we are and put everything there */
	distance_start = (ulong)p - (ulong)inst;
	next_inst = ((ulong)inst + 4);
	distance_end = next_inst - (ulong)&p[kvm_emulate_mtsrin_branch_offs];

	/* Make sure we only write valid b instructions */
	if (distance_start > KVM_INST_B_MAX) {
		kvm_patching_worked = false;
		return;
	}

	/* Modify the chunk to fit the invocation */
	memcpy(p, kvm_emulate_mtsrin, kvm_emulate_mtsrin_len * 4);
	p[kvm_emulate_mtsrin_branch_offs] |= distance_end & KVM_INST_B_MASK;
	p[kvm_emulate_mtsrin_reg1_offs] |= (rb << 10);
	p[kvm_emulate_mtsrin_reg2_offs] |= rt;
	p[kvm_emulate_mtsrin_orig_ins_offs] = *inst;
	flush_icache_range((ulong)p, (ulong)p + kvm_emulate_mtsrin_len * 4);

	/* Patch the invocation */
	kvm_patch_ins_b(inst, distance_start);
}

#endif
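
/*
 * Ask the host to map the shared magic page at effective address -4096 on
 * the calling CPU; the first output word reports the magic-page features
 * the host supports.
 */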
static void kvm_map_magic_page(void *data)
{
	u32 *features = data;

	ulong in[8];
	ulong out[8];

	in[0] = KVM_MAGIC_PAGE;
	in[1] = KVM_MAGIC_PAGE;

	kvm_hypercall(in, out, HC_VENDOR_KVM | KVM_HC_PPC_MAP_MAGIC_PAGE);

	*features = out[0];
}
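
/*
 * Look at one kernel instruction and, if it is a privileged instruction we
 * know how to handle, patch it to use the magic page or an emulation stub
 * instead of trapping into the hypervisor.
 */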
static void kvm_check_ins(u32 *inst, u32 features)
{
	u32 _inst = *inst;
	u32 inst_no_rt = _inst & ~KVM_MASK_RT;
	u32 inst_rt = _inst & KVM_MASK_RT;

	switch (inst_no_rt) {
	/* Loads */
	case KVM_INST_MFMSR:
		kvm_patch_ins_ld(inst, magic_var(msr), inst_rt);
		break;
	case KVM_INST_MFSPR_SPRG0:
		kvm_patch_ins_ld(inst, magic_var(sprg0), inst_rt);
		break;
	case KVM_INST_MFSPR_SPRG1:
		kvm_patch_ins_ld(inst, magic_var(sprg1), inst_rt);
		break;
	case KVM_INST_MFSPR_SPRG2:
		kvm_patch_ins_ld(inst, magic_var(sprg2), inst_rt);
		break;
	case KVM_INST_MFSPR_SPRG3:
		kvm_patch_ins_ld(inst, magic_var(sprg3), inst_rt);
		break;
	case KVM_INST_MFSPR_SRR0:
		kvm_patch_ins_ld(inst, magic_var(srr0), inst_rt);
		break;
	case KVM_INST_MFSPR_SRR1:
		kvm_patch_ins_ld(inst, magic_var(srr1), inst_rt);
		break;
	case KVM_INST_MFSPR_DAR:
		kvm_patch_ins_ld(inst, magic_var(dar), inst_rt);
		break;
	case KVM_INST_MFSPR_DSISR:
		kvm_patch_ins_lwz(inst, magic_var(dsisr), inst_rt);
		break;

	/* Stores */
	case KVM_INST_MTSPR_SPRG0:
		kvm_patch_ins_std(inst, magic_var(sprg0), inst_rt);
		break;
	case KVM_INST_MTSPR_SPRG1:
		kvm_patch_ins_std(inst, magic_var(sprg1), inst_rt);
		break;
	case KVM_INST_MTSPR_SPRG2:
		kvm_patch_ins_std(inst, magic_var(sprg2), inst_rt);
		break;
	case KVM_INST_MTSPR_SPRG3:
		kvm_patch_ins_std(inst, magic_var(sprg3), inst_rt);
		break;
	case KVM_INST_MTSPR_SRR0:
		kvm_patch_ins_std(inst, magic_var(srr0), inst_rt);
		break;
	case KVM_INST_MTSPR_SRR1:
		kvm_patch_ins_std(inst, magic_var(srr1), inst_rt);
		break;
	case KVM_INST_MTSPR_DAR:
		kvm_patch_ins_std(inst, magic_var(dar), inst_rt);
		break;
	case KVM_INST_MTSPR_DSISR:
		kvm_patch_ins_stw(inst, magic_var(dsisr), inst_rt);
		break;

	/* Nops */
	case KVM_INST_TLBSYNC:
		kvm_patch_ins_nop(inst);
		break;

	/* Rewrites */
	case KVM_INST_MTMSRD_L1:
		kvm_patch_ins_mtmsrd(inst, inst_rt);
		break;
	case KVM_INST_MTMSR:
	case KVM_INST_MTMSRD_L0:
		kvm_patch_ins_mtmsr(inst, inst_rt);
		break;
#ifdef CONFIG_BOOKE
	case KVM_INST_WRTEE:
		kvm_patch_ins_wrtee(inst, inst_rt, 0);
		break;
#endif
	}

	switch (inst_no_rt & ~KVM_MASK_RB) {
#ifdef CONFIG_PPC_BOOK3S_32
	case KVM_INST_MTSRIN:
		if (features & KVM_MAGIC_FEAT_SR) {
			u32 inst_rb = _inst & KVM_MASK_RB;
			kvm_patch_ins_mtsrin(inst, inst_rt, inst_rb);
		}
		break;
#endif
	}

	switch (_inst) {
#ifdef CONFIG_BOOKE
	case KVM_INST_WRTEEI_0:
		kvm_patch_ins_wrteei_0(inst);
		break;

	case KVM_INST_WRTEEI_1:
		kvm_patch_ins_wrtee(inst, 0, 1);
		break;
#endif
	}
}
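
/* Map the magic page on every CPU, then patch the entire kernel text. */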
static void kvm_use_magic_page(void)
{
	u32 *p;
	u32 *start, *end;
	u32 tmp;
	u32 features;

	/* Tell the host to map the magic page to -4096 on all CPUs */
	on_each_cpu(kvm_map_magic_page, &features, 1);

	/* Quick self-test to see if the mapping works */
	if (__get_user(tmp, (u32*)KVM_MAGIC_PAGE)) {
		kvm_patching_worked = false;
		return;
	}

	/* Now loop through all code and find instructions */
	start = (void*)_stext;
	end = (void*)_etext;

	for (p = start; p < end; p++)
		kvm_check_ins(p, features);

	printk(KERN_INFO "KVM: Live patching for a fast VM %s\n",
			 kvm_patching_worked ? "worked" : "failed");
}
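
/*
 * Issue a KVM hypercall: the eight input words go in r3-r10 and the
 * hypercall number in r11; the eight output words come back in r4-r11 and
 * r3 carries the return code.
 */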
unsigned long kvm_hypercall(unsigned long *in,
			    unsigned long *out,
			    unsigned long nr)
{
	unsigned long register r0 asm("r0");
	unsigned long register r3 asm("r3") = in[0];
	unsigned long register r4 asm("r4") = in[1];
	unsigned long register r5 asm("r5") = in[2];
	unsigned long register r6 asm("r6") = in[3];
	unsigned long register r7 asm("r7") = in[4];
	unsigned long register r8 asm("r8") = in[5];
	unsigned long register r9 asm("r9") = in[6];
	unsigned long register r10 asm("r10") = in[7];
	unsigned long register r11 asm("r11") = nr;
	unsigned long register r12 asm("r12");

	asm volatile("bl	kvm_hypercall_start"
		     : "=r"(r0), "=r"(r3), "=r"(r4), "=r"(r5), "=r"(r6),
		       "=r"(r7), "=r"(r8), "=r"(r9), "=r"(r10), "=r"(r11),
		       "=r"(r12)
		     : "r"(r3), "r"(r4), "r"(r5), "r"(r6), "r"(r7), "r"(r8),
		       "r"(r9), "r"(r10), "r"(r11)
		     : "memory", "cc", "xer", "ctr", "lr");

	out[0] = r4;
	out[1] = r5;
	out[2] = r6;
	out[3] = r7;
	out[4] = r8;
	out[5] = r9;
	out[6] = r10;
	out[7] = r11;

	return r3;
}
EXPORT_SYMBOL_GPL(kvm_hypercall);
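
/*
 * Fetch the hypercall instruction sequence the host advertises in the
 * device tree (/hypervisor, "hcall-instructions") and patch it into
 * kvm_hypercall_start.
 */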
static int kvm_para_setup(void)
{
	extern u32 kvm_hypercall_start;
	struct device_node *hyper_node;
	u32 *insts;
	int len, i;

	hyper_node = of_find_node_by_path("/hypervisor");
	if (!hyper_node)
		return -1;

	insts = (u32*)of_get_property(hyper_node, "hcall-instructions", &len);
	if (len % 4)
		return -1;
	if (len > (4 * 4))
		return -1;

	for (i = 0; i < (len / 4); i++)
		kvm_patch_ins(&(&kvm_hypercall_start)[i], insts[i]);

	return 0;
}
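
/* Return the unused tail of kvm_tmp to the page allocator. */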
static __init void kvm_free_tmp(void)
{
	unsigned long start, end;

	start = (ulong)&kvm_tmp[kvm_tmp_index + (PAGE_SIZE - 1)] & PAGE_MASK;
	end = (ulong)&kvm_tmp[ARRAY_SIZE(kvm_tmp)] & PAGE_MASK;

	/* Free the tmp space we don't need */
	for (; start < end; start += PAGE_SIZE) {
		ClearPageReserved(virt_to_page(start));
		init_page_count(virt_to_page(start));
		free_page(start);
		totalram_pages++;
	}
}
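
/* Guest-side KVM setup, run as a postcore initcall. */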
static int __init kvm_guest_init(void)
{
	if (!kvm_para_available())
		goto free_tmp;

	if (kvm_para_setup())
		goto free_tmp;

	if (kvm_para_has_feature(KVM_FEATURE_MAGIC_PAGE))
		kvm_use_magic_page();

#ifdef CONFIG_PPC_BOOK3S_64
	/* Enable napping */
	powersave_nap = 1;
#endif

free_tmp:
	kvm_free_tmp();

	return 0;
}
postcore_initcall(kvm_guest_init);