2 * This program is free software; you can redistribute it and/or modify
3 * it under the terms of the GNU General Public License, version 2, as
4 * published by the Free Software Foundation.
6 * This program is distributed in the hope that it will be useful,
7 * but WITHOUT ANY WARRANTY; without even the implied warranty of
8 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
9 * GNU General Public License for more details.
11 * You should have received a copy of the GNU General Public License
12 * along with this program; if not, write to the Free Software
13 * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
15 * Copyright IBM Corp. 2007
17 * Authors: Hollis Blanchard <hollisb@us.ibm.com>
20 #ifndef __POWERPC_KVM_HOST_H__
21 #define __POWERPC_KVM_HOST_H__
23 #include <linux/mutex.h>
24 #include <linux/hrtimer.h>
25 #include <linux/interrupt.h>
26 #include <linux/types.h>
27 #include <linux/kvm_types.h>
28 #include <linux/threads.h>
29 #include <linux/spinlock.h>
30 #include <linux/kvm_para.h>
31 #include <linux/list.h>
32 #include <linux/atomic.h>
33 #include <asm/kvm_asm.h>
34 #include <asm/processor.h>
36 #include <asm/cacheflush.h>
37 #include <asm/hvcall.h>
39 #define KVM_MAX_VCPUS NR_CPUS
40 #define KVM_MAX_VCORES NR_CPUS
41 #define KVM_USER_MEM_SLOTS 512
43 #ifdef CONFIG_KVM_MMIO
44 #define KVM_COALESCED_MMIO_PAGE_OFFSET 1
46 #define KVM_HALT_POLL_NS_DEFAULT 500000
48 /* These values are internal and can be increased later */
49 #define KVM_NR_IRQCHIPS 1
50 #define KVM_IRQCHIP_NUM_PINS 256
52 /* PPC-specific vcpu->requests bit members */
53 #define KVM_REQ_WATCHDOG 8
54 #define KVM_REQ_EPR_EXIT 9
56 #include <linux/mmu_notifier.h>
58 #define KVM_ARCH_WANT_MMU_NOTIFIER
/*
 * Prototypes for the hva-based hooks that accompany
 * KVM_ARCH_WANT_MMU_NOTIFIER. Only declarations appear here; the
 * definitions live elsewhere.
 * Each takes a struct kvm plus either a single hva or a start/end pair.
 * NOTE(review): whether `end` is inclusive or exclusive, and the meaning of
 * the int return values, cannot be determined from these declarations --
 * confirm against the definitions.
 */
60 extern int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
61 extern int kvm_unmap_hva_range(struct kvm *kvm,
62 unsigned long start, unsigned long end);
63 extern int kvm_age_hva(struct kvm *kvm, unsigned long start, unsigned long end);
64 extern int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
65 extern void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
67 static inline void kvm_arch_mmu_notifier_invalidate_page(struct kvm *kvm,
68 unsigned long address)
/*
 * HPTEG sizing constants. Each HPTEG_HASH_NUM_xxx is derived from the
 * matching HPTEG_HASH_BITS_xxx as (1 << bits), so changing a BITS value
 * automatically resizes the corresponding NUM value.
 */
72 #define HPTEG_CACHE_NUM (1 << 15) /* 32768 */
73 #define HPTEG_HASH_BITS_PTE 13
74 #define HPTEG_HASH_BITS_PTE_LONG 12
75 #define HPTEG_HASH_BITS_VPTE 13
76 #define HPTEG_HASH_BITS_VPTE_LONG 5
77 #define HPTEG_HASH_BITS_VPTE_64K 11
78 #define HPTEG_HASH_NUM_PTE (1 << HPTEG_HASH_BITS_PTE) /* 8192 */
79 #define HPTEG_HASH_NUM_PTE_LONG (1 << HPTEG_HASH_BITS_PTE_LONG) /* 4096 */
80 #define HPTEG_HASH_NUM_VPTE (1 << HPTEG_HASH_BITS_VPTE) /* 8192 */
81 #define HPTEG_HASH_NUM_VPTE_LONG (1 << HPTEG_HASH_BITS_VPTE_LONG) /* 32 */
82 #define HPTEG_HASH_NUM_VPTE_64K (1 << HPTEG_HASH_BITS_VPTE_64K) /* 2048 */
84 /* Physical Address Mask - allowed range of real mode RAM access */
85 #define KVM_PAM 0x0fffffffffffffffULL
91 struct kvmppc_vcpu_book3s;
92 struct kvmppc_book3s_shadow_vcpu;
98 struct kvm_vcpu_stat {
103 /* Account for special types of light exits: */
104 u32 itlb_real_miss_exits;
105 u32 itlb_virt_miss_exits;
106 u32 dtlb_real_miss_exits;
107 u32 dtlb_virt_miss_exits;
111 u32 emulated_inst_exits;
114 u32 halt_successful_poll;
115 u32 halt_attempted_poll;
121 #ifdef CONFIG_PPC_BOOK3S
132 enum kvm_exit_types {
135 ITLB_REAL_MISS_EXITS,
136 ITLB_VIRT_MISS_EXITS,
137 DTLB_REAL_MISS_EXITS,
138 DTLB_VIRT_MISS_EXITS,
143 EMULATED_MTMSRWE_EXITS,
144 EMULATED_WRTEE_EXITS,
145 EMULATED_MTSPR_EXITS,
146 EMULATED_MFSPR_EXITS,
147 EMULATED_MTMSR_EXITS,
148 EMULATED_MFMSR_EXITS,
149 EMULATED_TLBSX_EXITS,
150 EMULATED_TLBWE_EXITS,
163 __NUMBER_OF_KVM_EXIT_TYPES
166 /* allow access to big endian 32bit upper/lower parts and 64bit var */
167 struct kvmppc_exit_timing {
176 struct kvmppc_pginfo {
181 struct kvmppc_spapr_tce_table {
182 struct list_head list;
186 struct page *pages[0];
189 /* XICS components, defined in book3s_xics.c */
194 * The reverse mapping array has one entry for each HPTE,
195 * which stores the guest's view of the second word of the HPTE
196 * (including the guest physical address of the mapping),
197 * plus forward and backward pointers in a doubly-linked ring
198 * of HPTEs that map the same host page. The pointers in this
199 * ring are 32-bit HPTE indexes, to save space.
201 struct revmap_entry {
202 unsigned long guest_rpte;
203 unsigned int forw, back;
207 * We use the top bit of each memslot->arch.rmap entry as a lock bit,
208 * and bit 32 as a present flag. The bottom 32 bits are the
209 * index in the guest HPT of a HPTE that points to the page.
/*
 * Field positions and masks within one memslot->arch.rmap entry.
 * LOCK_BIT is a bit number; the SHIFT values are shift counts; the
 * remaining macros are masks that can be applied to the entry directly.
 */
211 #define KVMPPC_RMAP_LOCK_BIT 63 /* bit number of the lock bit (top bit) */
212 #define KVMPPC_RMAP_RC_SHIFT 32 /* shift applied to HPTE_R_R / HPTE_R_C below */
213 #define KVMPPC_RMAP_CHG_SHIFT 48 /* shift applied to the CHG_ORDER field */
214 #define KVMPPC_RMAP_REFERENCED (HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
215 #define KVMPPC_RMAP_CHANGED (HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
216 #define KVMPPC_RMAP_CHG_ORDER (0x3ful << KVMPPC_RMAP_CHG_SHIFT) /* 6-bit field, bits 48-53 */
217 #define KVMPPC_RMAP_PRESENT 0x100000000ul /* bit 32: present flag */
218 #define KVMPPC_RMAP_INDEX 0xfffffffful /* bottom 32 bits: index of an HPTE in the guest HPT */
220 struct kvm_arch_memory_slot {
221 #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
223 #endif /* CONFIG_KVM_BOOK3S_HV_POSSIBLE */
228 #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
229 unsigned long hpt_virt;
230 struct revmap_entry *revmap;
231 unsigned int host_lpid;
232 unsigned long host_lpcr;
234 unsigned long host_sdr1;
237 unsigned long vrma_slb_v;
240 atomic_t vcpus_running;
242 unsigned long hpt_npte;
243 unsigned long hpt_mask;
244 atomic_t hpte_mod_interest;
245 cpumask_t need_tlb_flush;
247 struct dentry *debugfs_dir;
248 struct dentry *htab_dentry;
249 #endif /* CONFIG_KVM_BOOK3S_HV_POSSIBLE */
250 #ifdef CONFIG_KVM_BOOK3S_PR_POSSIBLE
251 struct mutex hpt_mutex;
253 #ifdef CONFIG_PPC_BOOK3S_64
254 struct list_head spapr_tce_tables;
255 struct list_head rtas_tokens;
256 DECLARE_BITMAP(enabled_hcalls, MAX_HCALL_OPCODE/4 + 1);
258 #ifdef CONFIG_KVM_MPIC
259 struct openpic *mpic;
261 #ifdef CONFIG_KVM_XICS
262 struct kvmppc_xics *xics;
264 struct kvmppc_ops *kvm_ops;
265 #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
266 /* This array can grow quite large, keep it at the end */
267 struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
272 * Struct for a virtual core.
273 * Note: entry_exit_map combines a bitmap of threads that have entered
274 * in the bottom 8 bits and a bitmap of threads that have exited in the
275 * next 8 bits. This is so that we can atomically set the entry bit
276 * iff the exit map is 0 without taking a lock.
278 struct kvmppc_vcore {
288 struct kvmppc_vcore *master_vcore;
289 struct list_head runnable_threads;
290 struct list_head preempt_list;
292 wait_queue_head_t wq;
293 spinlock_t stoltb_lock; /* protects stolen_tb and preempt_tb */
296 struct kvm_vcpu *runner;
298 u64 tb_offset; /* guest timebase - host timebase */
302 ulong dpdes; /* doorbell state (POWER8) */
303 ulong conferring_threads;
/*
 * Accessors for the two thread bitmaps packed into vc->entry_exit_map.
 * Each macro evaluates `vc` exactly once.
 *
 * VCORE_EXIT_MAP shifts without masking, so it yields every bit at or above
 * bit 8, not just the 8-bit exit bitmap.
 * NOTE(review): if VCORE_EXIT_REQ (bit 16) is stored in entry_exit_map, it
 * survives the shift as 0x100 and therefore also makes VCORE_IS_EXITING
 * true -- confirm that this is the intended behaviour.
 */
306 #define VCORE_ENTRY_MAP(vc) ((vc)->entry_exit_map & 0xff) /* low 8 bits: threads that have entered */
307 #define VCORE_EXIT_MAP(vc) ((vc)->entry_exit_map >> 8) /* bits 8 and up: threads that have exited */
308 #define VCORE_IS_EXITING(vc) (VCORE_EXIT_MAP(vc) != 0) /* true if any bit at or above bit 8 is set */
310 /* This bit is used when a vcore exit is triggered from outside the vcore */
311 #define VCORE_EXIT_REQ 0x10000 /* bit 16 */
314 * Values for vcore_state.
315 * Note that these are arranged such that lower values
316 * (< VCORE_SLEEPING) don't require stolen time accounting
317 * on load/unload, and higher values do.
/*
 * The numeric order matters: code may compare a state against
 * VCORE_SLEEPING to decide whether stolen time accounting is needed, so new
 * values must be inserted on the correct side of VCORE_SLEEPING.
 */
319 #define VCORE_INACTIVE 0 /* below VCORE_SLEEPING: no stolen time accounting */
320 #define VCORE_PREEMPT 1 /* below VCORE_SLEEPING: no stolen time accounting */
321 #define VCORE_PIGGYBACK 2 /* below VCORE_SLEEPING: no stolen time accounting */
322 #define VCORE_SLEEPING 3 /* the threshold value itself */
323 #define VCORE_RUNNING 4 /* above VCORE_SLEEPING: stolen time accounting needed */
324 #define VCORE_EXITING 5 /* above VCORE_SLEEPING: stolen time accounting needed */
327 * Struct used to manage memory for a virtual processor area
328 * registered by a PAPR guest. There are three types of area
329 * that a guest can register.
332 unsigned long gpa; /* Current guest phys addr */
333 void *pinned_addr; /* Address in kernel linear mapping */
334 void *pinned_end; /* End of region */
335 unsigned long next_gpa; /* Guest phys addr for update */
336 unsigned long len; /* Number of bytes required */
337 u8 update_pending; /* 1 => update pinned_addr from next_gpa */
338 bool dirty; /* true => area has been modified by kernel */
347 bool may_execute : 1;
348 u8 page_size; /* MMU_PAGE_xxx */
353 void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
354 u64 (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
355 u64 (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
356 void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
357 void (*slbia)(struct kvm_vcpu *vcpu);
359 void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
360 u32 (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
361 int (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr,
362 struct kvmppc_pte *pte, bool data, bool iswrite);
363 void (*reset_msr)(struct kvm_vcpu *vcpu);
364 void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
365 int (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
366 u64 (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
367 bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
379 bool large : 1; /* PTEs are 16MB */
380 bool tb : 1; /* 1TB segment */
382 u8 base_page_size; /* MMU_PAGE_xxx */
385 /* Struct used to accumulate timing information in HV real mode code */
386 struct kvmhv_tb_accumulator {
387 u64 seqcount; /* used to synchronize access, also count * 2 */
388 u64 tb_total; /* total time in timebase ticks */
389 u64 tb_min; /* min time */
390 u64 tb_max; /* max time */
393 # ifdef CONFIG_PPC_FSL_BOOK3E
394 #define KVMPPC_BOOKE_IAC_NUM 2
395 #define KVMPPC_BOOKE_DAC_NUM 2
397 #define KVMPPC_BOOKE_IAC_NUM 4
398 #define KVMPPC_BOOKE_DAC_NUM 2
400 #define KVMPPC_BOOKE_MAX_IAC 4
401 #define KVMPPC_BOOKE_MAX_DAC 2
403 /* KVMPPC_EPR_USER takes precedence over KVMPPC_EPR_KERNEL */
404 #define KVMPPC_EPR_NONE 0 /* EPR not supported */
405 #define KVMPPC_EPR_USER 1 /* exit to userspace to fill EPR */
406 #define KVMPPC_EPR_KERNEL 2 /* in-kernel irqchip */
/*
 * Interrupt controller selector values.
 * NOTE(review): presumably the values held in kvm_vcpu_arch.irq_type --
 * confirm against the code that sets that field.
 */
408 #define KVMPPC_IRQ_DEFAULT 0
409 #define KVMPPC_IRQ_MPIC 1
410 #define KVMPPC_IRQ_XICS 2
414 struct kvm_vcpu_arch {
417 #ifdef CONFIG_PPC_BOOK3S
418 struct kvmppc_slb slb[64];
419 int slb_max; /* 1 + index of last valid entry in slb[] */
420 int slb_nr; /* total number of entries in SLB */
421 struct kvmppc_mmu mmu;
422 struct kvmppc_vcpu_book3s *book3s;
424 #ifdef CONFIG_PPC_BOOK3S_32
425 struct kvmppc_book3s_shadow_vcpu *shadow_vcpu;
430 struct thread_fp_state fp;
438 #ifdef CONFIG_ALTIVEC
439 struct thread_vr_state vr;
442 #ifdef CONFIG_KVM_BOOKE_HV
452 #if defined(CONFIG_BOOKE)
453 #if defined(CONFIG_KVM_BOOKE_HV) || defined(CONFIG_64BIT)
458 #ifdef CONFIG_PPC_BOOK3S
459 /* For Gekko paired singles */
466 #ifdef CONFIG_PPC_BOOK3S
473 #ifdef CONFIG_PPC_BOOK3S
475 ulong guest_owned_ext;
505 u32 vrsave; /* also USPRG0 */
507 /* shadow_msr is unused for BookE HV */
520 /* Time base value when we entered the guest */
525 ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
545 #ifdef CONFIG_PPC_TRANSACTIONAL_MEM
560 struct thread_fp_state fp_tm;
562 struct thread_vr_state vr_tm;
563 u32 vrsave_tm; /* also USPRG0 */
567 #ifdef CONFIG_KVM_EXIT_TIMING
568 struct mutex exit_timing_lock;
569 struct kvmppc_exit_timing timing_exit;
570 struct kvmppc_exit_timing timing_last_enter;
572 u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
573 u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
574 u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
575 u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
576 u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
577 u64 timing_last_exit;
578 struct dentry *debugfs_exit_timing;
581 #ifdef CONFIG_PPC_BOOK3S
584 unsigned long intr_msr;
593 struct timer_list wdt_timer;
602 /* guest debug registers */
603 struct debug_reg dbg_reg;
605 gpa_t paddr_accessed;
606 gva_t vaddr_accessed;
609 u8 io_gpr; /* GPR used as IO source/target */
610 u8 mmio_host_swabbed;
619 u8 epr_flags; /* KVMPPC_EPR_xxx */
622 u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */
624 struct hrtimer dec_timer;
627 unsigned long pending_exceptions;
632 wait_queue_head_t *wqp;
633 struct kvmppc_vcore *vcore;
640 wait_queue_head_t cpu_run;
642 struct kvm_vcpu_arch_shared *shared;
643 #if defined(CONFIG_PPC_BOOK3S_64) && defined(CONFIG_KVM_BOOK3S_PR_POSSIBLE)
644 bool shared_big_endian;
646 unsigned long magic_page_pa; /* phys addr to map the magic page to */
647 unsigned long magic_page_ea; /* effect. addr to map the magic page to */
648 bool disable_kernel_nx;
650 int irq_type; /* one of KVMPPC_IRQ_* */
652 struct openpic *mpic; /* KVMPPC_IRQ_MPIC */
653 #ifdef CONFIG_KVM_XICS
654 struct kvmppc_icp *icp; /* XICS presentation controller */
657 #ifdef CONFIG_KVM_BOOK3S_HV_POSSIBLE
658 struct kvm_vcpu_arch_shared shregs;
660 unsigned long pgfault_addr;
662 unsigned long pgfault_hpte[2];
664 struct list_head run_list;
665 struct task_struct *run_task;
666 struct kvm_run *kvm_run;
668 spinlock_t vpa_update_lock;
669 struct kvmppc_vpa vpa;
670 struct kvmppc_vpa dtl;
671 struct dtl_entry *dtl_ptr;
672 unsigned long dtl_index;
674 struct kvmppc_vpa slb_shadow;
676 spinlock_t tbacct_lock;
683 #ifdef CONFIG_KVM_BOOK3S_HV_EXIT_TIMING
684 struct kvmhv_tb_accumulator *cur_activity; /* What we're timing */
685 u64 cur_tb_start; /* when it started */
686 struct kvmhv_tb_accumulator rm_entry; /* real-mode entry code */
687 struct kvmhv_tb_accumulator rm_intr; /* real-mode intr handling */
688 struct kvmhv_tb_accumulator rm_exit; /* real-mode exit code */
689 struct kvmhv_tb_accumulator guest_time; /* guest execution */
690 struct kvmhv_tb_accumulator cede_time; /* time napping inside guest */
692 struct dentry *debugfs_dir;
693 struct dentry *debugfs_timings;
694 #endif /* CONFIG_KVM_BOOK3S_HV_EXIT_TIMING */
/*
 * Expands to element fpr[i][TS_FPROFFSET] of the vcpu's arch.fp state.
 * The expansion is a plain member/array access, so it can be read from or
 * assigned to. Each argument is evaluated once.
 */
697 #define VCPU_FPR(vcpu, i) (vcpu)->arch.fp.fpr[i][TS_FPROFFSET]
699 /* Values for vcpu->arch.state */
700 #define KVMPPC_VCPU_NOTREADY 0
701 #define KVMPPC_VCPU_RUNNABLE 1
702 #define KVMPPC_VCPU_BUSY_IN_HOST 2
704 /* Values for vcpu->arch.io_gpr */
/*
 * KVM_MMIO_REG_MASK selects bits 0-4 (values 0-31) and
 * KVM_MMIO_REG_EXT_MASK selects bits 5-15. The four KVM_MMIO_REG_xxx values
 * below all lie inside the EXT_MASK field and use only bits 5 and 6.
 * NOTE(review): io_gpr is declared u8 in struct kvm_vcpu_arch, so only
 * bits 5-7 of KVM_MMIO_REG_EXT_MASK can ever be set in it -- confirm the
 * wider mask is intentional.
 */
705 #define KVM_MMIO_REG_MASK 0x001f
706 #define KVM_MMIO_REG_EXT_MASK 0xffe0
707 #define KVM_MMIO_REG_GPR 0x0000 /* no EXT bits set */
708 #define KVM_MMIO_REG_FPR 0x0020 /* bit 5 */
709 #define KVM_MMIO_REG_QPR 0x0040 /* bit 6 */
710 #define KVM_MMIO_REG_FQPR 0x0060 /* bits 5 and 6 (FPR | QPR) */
712 #define __KVM_HAVE_ARCH_WQP
713 #define __KVM_HAVE_CREATE_DEVICE
/*
 * Arch hooks with nothing to do here: every function below has an empty
 * body and returns void, so calling any of them is a no-op and all
 * arguments are ignored.
 * NOTE(review): presumably these exist to satisfy hooks expected by generic
 * KVM code -- confirm against the callers.
 */
715 static inline void kvm_arch_hardware_disable(void) {}
716 static inline void kvm_arch_hardware_unsetup(void) {}
717 static inline void kvm_arch_sync_events(struct kvm *kvm) {}
718 static inline void kvm_arch_memslots_updated(struct kvm *kvm, struct kvm_memslots *slots) {}
719 static inline void kvm_arch_flush_shadow_all(struct kvm *kvm) {}
720 static inline void kvm_arch_sched_in(struct kvm_vcpu *vcpu, int cpu) {}
721 static inline void kvm_arch_exit(void) {}
722 static inline void kvm_arch_vcpu_blocking(struct kvm_vcpu *vcpu) {}
723 static inline void kvm_arch_vcpu_unblocking(struct kvm_vcpu *vcpu) {}
725 #endif /* __POWERPC_KVM_HOST_H__ */