1 /*
2  * This program is free software; you can redistribute it and/or modify
3  * it under the terms of the GNU General Public License, version 2, as
4  * published by the Free Software Foundation.
5  *
6  * This program is distributed in the hope that it will be useful,
7  * but WITHOUT ANY WARRANTY; without even the implied warranty of
8  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
9  * GNU General Public License for more details.
10  *
11  * You should have received a copy of the GNU General Public License
12  * along with this program; if not, write to the Free Software
13  * Foundation, 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
14  *
15  * Copyright IBM Corp. 2007
16  *
17  * Authors: Hollis Blanchard <hollisb@us.ibm.com>
18  */
19 
20 #ifndef __POWERPC_KVM_HOST_H__
21 #define __POWERPC_KVM_HOST_H__
22 
23 #include <linux/mutex.h>
24 #include <linux/hrtimer.h>
25 #include <linux/interrupt.h>
26 #include <linux/types.h>
27 #include <linux/kvm_types.h>
28 #include <linux/threads.h>
29 #include <linux/spinlock.h>
30 #include <linux/kvm_para.h>
31 #include <linux/list.h>
32 #include <linux/atomic.h>
33 #include <asm/kvm_asm.h>
34 #include <asm/processor.h>
35 #include <asm/page.h>
36 #include <asm/cacheflush.h>
37 
/*
 * Sizing limits.  Both the vcpu and the vcore limit are tied to NR_CPUS,
 * and KVM_MEM_SLOTS_NUM is simply an alias for the number of user memory
 * slots (nothing is added on top of KVM_USER_MEM_SLOTS here).
 */
38 #define KVM_MAX_VCPUS		NR_CPUS
39 #define KVM_MAX_VCORES		NR_CPUS
40 #define KVM_USER_MEM_SLOTS 32
41 #define KVM_MEM_SLOTS_NUM KVM_USER_MEM_SLOTS
42 
/*
 * Only defined when CONFIG_KVM_MMIO is set.
 * NOTE(review): presumably consumed by the generic KVM code to locate the
 * coalesced-MMIO page - confirm against the user of this macro.
 */
43 #ifdef CONFIG_KVM_MMIO
44 #define KVM_COALESCED_MMIO_PAGE_OFFSET 1
45 #endif
46 
47 /* These values are internal and can be increased later */
48 #define KVM_NR_IRQCHIPS          1
49 #define KVM_IRQCHIP_NUM_PINS     256
50 
/*
 * MMU notifier support: every configuration other than CONFIG_KVM_440
 * defines KVM_ARCH_WANT_MMU_NOTIFIER and declares the hva-based hooks
 * below.  Only the prototypes live in this header; the implementations
 * are provided elsewhere.
 */
51 #if !defined(CONFIG_KVM_440)
52 #include <linux/mmu_notifier.h>
53 
54 #define KVM_ARCH_WANT_MMU_NOTIFIER
55 
56 struct kvm;
57 extern int kvm_unmap_hva(struct kvm *kvm, unsigned long hva);
58 extern int kvm_unmap_hva_range(struct kvm *kvm,
59 			       unsigned long start, unsigned long end);
60 extern int kvm_age_hva(struct kvm *kvm, unsigned long hva);
61 extern int kvm_test_age_hva(struct kvm *kvm, unsigned long hva);
62 extern void kvm_set_spte_hva(struct kvm *kvm, unsigned long hva, pte_t pte);
63 
64 #endif
65 
66 /* We don't currently support large pages. */
/*
 * All three macros ignore their argument: there is a single page size,
 * the gfn shift is always 0 and KVM_PAGES_PER_HPAGE() always evaluates
 * to the constant 1UL << 31.
 */
67 #define KVM_HPAGE_GFN_SHIFT(x)	0
68 #define KVM_NR_PAGE_SIZES	1
69 #define KVM_PAGES_PER_HPAGE(x)	(1UL<<31)
70 
/* Number of entries in the HPTEG cache. */
#define HPTEG_CACHE_NUM			(1 << 15)

/*
 * Hash table geometry.  Each *_BITS constant is the width of a hash in
 * bits and the matching *_NUM constant is the resulting bucket count
 * (1 << bits).  Keep every pair in sync.
 */
#define HPTEG_HASH_BITS_PTE		13
#define HPTEG_HASH_NUM_PTE		(1 << HPTEG_HASH_BITS_PTE)

#define HPTEG_HASH_BITS_PTE_LONG	12
#define HPTEG_HASH_NUM_PTE_LONG		(1 << HPTEG_HASH_BITS_PTE_LONG)

#define HPTEG_HASH_BITS_VPTE		13
#define HPTEG_HASH_NUM_VPTE		(1 << HPTEG_HASH_BITS_VPTE)

#define HPTEG_HASH_BITS_VPTE_LONG	5
#define HPTEG_HASH_NUM_VPTE_LONG	(1 << HPTEG_HASH_BITS_VPTE_LONG)
80 
81 /* Physical Address Mask - allowed range of real mode RAM access */
/* The mask keeps the low 60 bits of an address and clears the top 4. */
82 #define KVM_PAM			0x0fffffffffffffffULL
83 
/*
 * Forward declarations: the structures below only hold pointers to these
 * types, so their full definitions are not needed in this header.
 */
84 struct kvm;
85 struct kvm_run;
86 struct kvm_vcpu;
87 
88 struct lppaca;
89 struct slb_shadow;
90 struct dtl_entry;
91 
/* Per-VM statistics counters; currently a single 32-bit counter. */
92 struct kvm_vm_stat {
93 	u32 remote_tlb_flush;
94 };
95 
/*
 * Per-vcpu statistics counters, all 32 bits wide.  The first group is
 * always present; the second group exists only when CONFIG_PPC_BOOK3S
 * is enabled, so the structure size depends on the configuration.
 */
96 struct kvm_vcpu_stat {
97 	u32 sum_exits;
98 	u32 mmio_exits;
99 	u32 dcr_exits;
100 	u32 signal_exits;
101 	u32 light_exits;
102 	/* Account for special types of light exits: */
103 	u32 itlb_real_miss_exits;
104 	u32 itlb_virt_miss_exits;
105 	u32 dtlb_real_miss_exits;
106 	u32 dtlb_virt_miss_exits;
107 	u32 syscall_exits;
108 	u32 isi_exits;
109 	u32 dsi_exits;
110 	u32 emulated_inst_exits;
111 	u32 dec_exits;
112 	u32 ext_intr_exits;
113 	u32 halt_wakeup;
114 	u32 dbell_exits;
115 	u32 gdbell_exits;
	/* Book3S-only counters */
116 #ifdef CONFIG_PPC_BOOK3S
117 	u32 pf_storage;
118 	u32 pf_instruc;
119 	u32 sp_storage;
120 	u32 sp_instruc;
121 	u32 queue_intr;
122 	u32 ld;
123 	u32 ld_slow;
124 	u32 st;
125 	u32 st_slow;
126 #endif
127 };
128 
/*
 * Exit categories.  The enumerators are implicitly numbered from 0 and
 * __NUMBER_OF_KVM_EXIT_TYPES is used as the array length of the timing_*
 * arrays in struct kvm_vcpu_arch (CONFIG_KVM_EXIT_TIMING), so it must
 * remain the last entry and no explicit values should be introduced.
 */
129 enum kvm_exit_types {
130 	MMIO_EXITS,
131 	DCR_EXITS,
132 	SIGNAL_EXITS,
133 	ITLB_REAL_MISS_EXITS,
134 	ITLB_VIRT_MISS_EXITS,
135 	DTLB_REAL_MISS_EXITS,
136 	DTLB_VIRT_MISS_EXITS,
137 	SYSCALL_EXITS,
138 	ISI_EXITS,
139 	DSI_EXITS,
140 	EMULATED_INST_EXITS,
141 	EMULATED_MTMSRWE_EXITS,
142 	EMULATED_WRTEE_EXITS,
143 	EMULATED_MTSPR_EXITS,
144 	EMULATED_MFSPR_EXITS,
145 	EMULATED_MTMSR_EXITS,
146 	EMULATED_MFMSR_EXITS,
147 	EMULATED_TLBSX_EXITS,
148 	EMULATED_TLBWE_EXITS,
149 	EMULATED_RFI_EXITS,
150 	EMULATED_RFCI_EXITS,
151 	DEC_EXITS,
152 	EXT_INTR_EXITS,
153 	HALT_WAKEUP,
154 	USR_PR_INST,
155 	FP_UNAVAIL,
156 	DEBUG_EXITS,
157 	TIMEINGUEST,
158 	DBELL_EXITS,
159 	GDBELL_EXITS,
	/* Count of the entries above; not an exit type itself. */
160 	__NUMBER_OF_KVM_EXIT_TYPES
161 };
162 
163 /* allow access to big endian 32bit upper/lower parts and 64bit var */
/*
 * tv64 and the {tbu, tbl} pair share the same 8 bytes.  tbu is declared
 * first, so it overlays the upper half of tv64 only on a big-endian
 * layout, as the comment above states.
 */
164 struct kvmppc_exit_timing {
165 	union {
166 		u64 tv64;
167 		struct {
168 			u32 tbu, tbl;
169 		} tv32;
170 	};
171 };
172 
/* A page frame number paired with an atomic reference count. */
173 struct kvmppc_pginfo {
174 	unsigned long pfn;
175 	atomic_t refcnt;
176 };
177 
178 struct kvmppc_spapr_tce_table {
179 	struct list_head list;
180 	struct kvm *kvm;
181 	u64 liobn;
182 	u32 window_size;
183 	struct page *pages[0];
184 };
185 
/*
 * Bookkeeping for one RMA region: an atomic use count plus the first
 * page frame number of the region.  struct kvm_arch holds a pointer to
 * one of these under CONFIG_KVM_BOOK3S_64_HV.
 */
186 struct kvm_rma_info {
187 	atomic_t use_count;
188 	unsigned long base_pfn;
189 };
190 
191 /* XICS components, defined in book3s_xics.c */
/* Opaque here: this header only stores pointers to them (CONFIG_KVM_XICS). */
192 struct kvmppc_xics;
193 struct kvmppc_icp;
194 
195 /*
196  * The reverse mapping array has one entry for each HPTE,
197  * which stores the guest's view of the second word of the HPTE
198  * (including the guest physical address of the mapping),
199  * plus forward and backward pointers in a doubly-linked ring
200  * of HPTEs that map the same host page.  The pointers in this
201  * ring are 32-bit HPTE indexes, to save space.
202  */
203 struct revmap_entry {
	/* Guest's view of the second HPTE word */
204 	unsigned long guest_rpte;
	/* Next / previous HPTE index in the ring of HPTEs for the same page */
205 	unsigned int forw, back;
206 };
207 
208 /*
209  * We use the top bit of each memslot->arch.rmap entry as a lock bit,
210  * and bit 32 as a present flag.  The bottom 32 bits are the
211  * index in the guest HPT of a HPTE that points to the page.
212  */
/*
 * In addition, the REFERENCED and CHANGED flags are the HPTE_R_R and
 * HPTE_R_C bits moved up by KVMPPC_RMAP_RC_SHIFT (32) so that they sit
 * above the 32-bit index.  HPTE_R_R / HPTE_R_C are not defined in this
 * header and must be provided by another include.
 */
213 #define KVMPPC_RMAP_LOCK_BIT	63
214 #define KVMPPC_RMAP_RC_SHIFT	32
215 #define KVMPPC_RMAP_REFERENCED	(HPTE_R_R << KVMPPC_RMAP_RC_SHIFT)
216 #define KVMPPC_RMAP_CHANGED	(HPTE_R_C << KVMPPC_RMAP_RC_SHIFT)
217 #define KVMPPC_RMAP_PRESENT	0x100000000ul
218 #define KVMPPC_RMAP_INDEX	0xfffffffful
219 
220 /* Low-order bits in memslot->arch.slot_phys[] */
/*
 * Bits 0-4 hold a page order; the cache-attribute flags reuse the HPTE_R_I
 * and HPTE_R_W bit values (0x20 / 0x40 per the inline notes) and 0x80 is
 * the GOT_PAGE flag.  HPTE_R_I / HPTE_R_W are defined outside this header.
 */
221 #define KVMPPC_PAGE_ORDER_MASK	0x1f
222 #define KVMPPC_PAGE_NO_CACHE	HPTE_R_I	/* 0x20 */
223 #define KVMPPC_PAGE_WRITETHRU	HPTE_R_W	/* 0x40 */
224 #define KVMPPC_GOT_PAGE		0x80
225 
/*
 * Architecture-specific part of a memory slot.  It is empty unless
 * CONFIG_KVM_BOOK3S_64_HV is enabled, in which case it carries the rmap
 * and slot_phys arrays whose entry encodings are described by the
 * KVMPPC_RMAP_* and KVMPPC_PAGE_* / KVMPPC_GOT_PAGE macros.
 */
226 struct kvm_arch_memory_slot {
227 #ifdef CONFIG_KVM_BOOK3S_64_HV
228 	unsigned long *rmap;
229 	unsigned long *slot_phys;
230 #endif /* CONFIG_KVM_BOOK3S_64_HV */
231 };
232 
/*
 * Architecture-specific per-VM state.  Only lpid is unconditional; every
 * other member is gated on a configuration option, so both the size and
 * the layout of this structure vary between builds.
 */
233 struct kvm_arch {
234 	unsigned int lpid;
	/* Book3S-64 HV state: hashed page table, host register copies, vcores */
235 #ifdef CONFIG_KVM_BOOK3S_64_HV
236 	unsigned long hpt_virt;
	/* Reverse-map array, one struct revmap_entry per HPTE */
237 	struct revmap_entry *revmap;
238 	unsigned int host_lpid;
239 	unsigned long host_lpcr;
240 	unsigned long sdr1;
241 	unsigned long host_sdr1;
242 	int tlbie_lock;
243 	unsigned long lpcr;
244 	unsigned long rmor;
245 	struct kvm_rma_info *rma;
246 	unsigned long vrma_slb_v;
247 	int rma_setup_done;
248 	int using_mmu_notifiers;
249 	u32 hpt_order;
250 	atomic_t vcpus_running;
251 	u32 online_vcores;
252 	unsigned long hpt_npte;
253 	unsigned long hpt_mask;
254 	atomic_t hpte_mod_interest;
255 	spinlock_t slot_phys_lock;
256 	cpumask_t need_tlb_flush;
	/* One slot per possible virtual core (KVM_MAX_VCORES == NR_CPUS) */
257 	struct kvmppc_vcore *vcores[KVM_MAX_VCORES];
258 	int hpt_cma_alloc;
259 #endif /* CONFIG_KVM_BOOK3S_64_HV */
260 #ifdef CONFIG_PPC_BOOK3S_64
	/* List heads; struct kvmppc_spapr_tce_table provides a list node */
261 	struct list_head spapr_tce_tables;
262 	struct list_head rtas_tokens;
263 #endif
	/* In-kernel interrupt controller state, one pointer per supported type */
264 #ifdef CONFIG_KVM_MPIC
265 	struct openpic *mpic;
266 #endif
267 #ifdef CONFIG_KVM_XICS
268 	struct kvmppc_xics *xics;
269 #endif
270 };
271 
272 /*
273  * Struct for a virtual core.
274  * Note: entry_exit_count combines an entry count in the bottom 8 bits
275  * and an exit count in the next 8 bits.  This is so that we can
276  * atomically increment the entry count iff the exit count is 0
277  * without taking the lock.
278  */
279 struct kvmppc_vcore {
280 	int n_runnable;
281 	int n_busy;
282 	int num_threads;
	/* Packed counters; decode with VCORE_ENTRY_COUNT() / VCORE_EXIT_COUNT() */
283 	int entry_exit_count;
284 	int n_woken;
285 	int nap_count;
286 	int napping_threads;
287 	u16 pcpu;
288 	u16 last_cpu;
	/* One of the VCORE_* state values */
289 	u8 vcore_state;
290 	u8 in_guest;
291 	struct list_head runnable_threads;
292 	spinlock_t lock;
293 	wait_queue_head_t wq;
294 	u64 stolen_tb;
295 	u64 preempt_tb;
296 	struct kvm_vcpu *runner;
297 };
298 
/*
 * Accessors for the two counters packed into kvmppc_vcore.entry_exit_count:
 * the entry count occupies the low 8 bits, the exit count the bits above.
 * 'vc' is a pointer to any object with an entry_exit_count member.
 */
#define VCORE_ENTRY_COUNT_MASK	0xff
#define VCORE_EXIT_COUNT_SHIFT	8

#define VCORE_ENTRY_COUNT(vc)	\
	((vc)->entry_exit_count & VCORE_ENTRY_COUNT_MASK)
#define VCORE_EXIT_COUNT(vc)	\
	((vc)->entry_exit_count >> VCORE_EXIT_COUNT_SHIFT)
301 
302 /* Values for vcore_state */
/* Small integers that fit the u8 vcore_state member of struct kvmppc_vcore. */
303 #define VCORE_INACTIVE	0
304 #define VCORE_SLEEPING	1
305 #define VCORE_STARTING	2
306 #define VCORE_RUNNING	3
307 #define VCORE_EXITING	4
308 
309 /*
310  * Struct used to manage memory for a virtual processor area
311  * registered by a PAPR guest.  There are three types of area
312  * that a guest can register.
313  */
/*
 * struct kvm_vcpu_arch embeds three instances of this structure
 * (vpa, dtl and slb_shadow) under CONFIG_KVM_BOOK3S_64_HV.
 */
314 struct kvmppc_vpa {
315 	unsigned long gpa;	/* Current guest phys addr */
316 	void *pinned_addr;	/* Address in kernel linear mapping */
317 	void *pinned_end;	/* End of region */
318 	unsigned long next_gpa;	/* Guest phys addr for update */
319 	unsigned long len;	/* Number of bytes required */
320 	u8 update_pending;	/* 1 => update pinned_addr from next_gpa */
321 	bool dirty;		/* true => area has been modified by kernel */
322 };
323 
/*
 * Result record for an address translation: it is passed by pointer to
 * the xlate() callback of struct kvmppc_mmu.  The three permissions are
 * single-bit bool bitfields.
 */
324 struct kvmppc_pte {
325 	ulong eaddr;
326 	u64 vpage;
327 	ulong raddr;
328 	bool may_read		: 1;
329 	bool may_write		: 1;
330 	bool may_execute	: 1;
331 };
332 
/*
 * Table of MMU callbacks.  One instance is embedded in struct
 * kvm_vcpu_arch (member 'mmu') on CONFIG_PPC_BOOK3S builds.  Every
 * callback takes the vcpu it operates on as its first argument.
 */
333 struct kvmppc_mmu {
334 	/* book3s_64 only */
335 	void (*slbmte)(struct kvm_vcpu *vcpu, u64 rb, u64 rs);
336 	u64  (*slbmfee)(struct kvm_vcpu *vcpu, u64 slb_nr);
337 	u64  (*slbmfev)(struct kvm_vcpu *vcpu, u64 slb_nr);
338 	void (*slbie)(struct kvm_vcpu *vcpu, u64 slb_nr);
339 	void (*slbia)(struct kvm_vcpu *vcpu);
340 	/* book3s */
341 	void (*mtsrin)(struct kvm_vcpu *vcpu, u32 srnum, ulong value);
342 	u32  (*mfsrin)(struct kvm_vcpu *vcpu, u32 srnum);
	/* Translates eaddr and fills *pte; 'data' selects data vs. other access */
343 	int  (*xlate)(struct kvm_vcpu *vcpu, gva_t eaddr, struct kvmppc_pte *pte, bool data);
344 	void (*reset_msr)(struct kvm_vcpu *vcpu);
345 	void (*tlbie)(struct kvm_vcpu *vcpu, ulong addr, bool large);
	/* Writes its result through *vsid; the int return is a status code */
346 	int  (*esid_to_vsid)(struct kvm_vcpu *vcpu, ulong esid, u64 *vsid);
347 	u64  (*ea_to_vp)(struct kvm_vcpu *vcpu, gva_t eaddr, bool data);
348 	bool (*is_dcbz32)(struct kvm_vcpu *vcpu);
349 };
350 
/*
 * One SLB entry.  struct kvm_vcpu_arch keeps an array of 64 of these on
 * CONFIG_PPC_BOOK3S builds.  The flags are single-bit bool bitfields.
 */
351 struct kvmppc_slb {
352 	u64 esid;
353 	u64 vsid;
	/* NOTE(review): presumably the original (unprocessed) esid/vsid words
	 * as written by the guest - confirm against the slbmte implementation */
354 	u64 orige;
355 	u64 origv;
356 	bool valid	: 1;
357 	bool Ks		: 1;
358 	bool Kp		: 1;
359 	bool nx		: 1;
360 	bool large	: 1;	/* PTEs are 16MB */
361 	bool tb		: 1;	/* 1TB segment */
362 	bool class	: 1;
363 };
364 
/*
 * Number of IAC / DAC debug registers.  The *_NUM values depend on the
 * platform (only the IAC count actually differs between the two branches),
 * while the *_MAX values are fixed and are what sizes the iac[] / dac[]
 * arrays in struct kvmppc_booke_debug_reg.
 */
365 # ifdef CONFIG_PPC_FSL_BOOK3E
366 #define KVMPPC_BOOKE_IAC_NUM	2
367 #define KVMPPC_BOOKE_DAC_NUM	2
368 # else
369 #define KVMPPC_BOOKE_IAC_NUM	4
370 #define KVMPPC_BOOKE_DAC_NUM	2
371 # endif
372 #define KVMPPC_BOOKE_MAX_IAC	4
373 #define KVMPPC_BOOKE_MAX_DAC	2
374 
/* Values for the epr_flags member of struct kvm_vcpu_arch. */
375 /* KVMPPC_EPR_USER takes precedence over KVMPPC_EPR_KERNEL */
376 #define KVMPPC_EPR_NONE		0 /* EPR not supported */
377 #define KVMPPC_EPR_USER		1 /* exit to userspace to fill EPR */
378 #define KVMPPC_EPR_KERNEL	2 /* in-kernel irqchip */
379 
/*
 * BookE debug register set: the debug control registers plus the
 * instruction (iac) and data (dac) address-compare values.  The arrays
 * are sized by the fixed KVMPPC_BOOKE_MAX_* limits, and dbcr4 exists
 * only on CONFIG_KVM_E500MC builds.
 */
380 struct kvmppc_booke_debug_reg {
381 	u32 dbcr0;
382 	u32 dbcr1;
383 	u32 dbcr2;
384 #ifdef CONFIG_KVM_E500MC
385 	u32 dbcr4;
386 #endif
387 	u64 iac[KVMPPC_BOOKE_MAX_IAC];
388 	u64 dac[KVMPPC_BOOKE_MAX_DAC];
389 };
390 
/* Values for the irq_type member of struct kvm_vcpu_arch. */
391 #define KVMPPC_IRQ_DEFAULT	0
392 #define KVMPPC_IRQ_MPIC		1
393 #define KVMPPC_IRQ_XICS		2
394 
/* Opaque here: only pointers to the MPIC state are stored in this header. */
395 struct openpic;
396 
/*
 * Architecture-specific per-vcpu state.
 *
 * Many members are gated on configuration options (Book3S, BookE, BookE
 * HV, Book3S-64 HV, SPE, AltiVec, VSX, exit timing, XICS), so the size
 * and layout of this structure differ from build to build.  Do not
 * reorder members without checking every user of the layout.
 */
397 struct kvm_vcpu_arch {
398 	ulong host_stack;
399 	u32 host_pid;
400 #ifdef CONFIG_PPC_BOOK3S
401 	struct kvmppc_slb slb[64];
402 	int slb_max;		/* 1 + index of last valid entry in slb[] */
403 	int slb_nr;		/* total number of entries in SLB */
404 	struct kvmppc_mmu mmu;
405 #endif
406 
	/* General-purpose and floating-point register file */
407 	ulong gpr[32];
408 
409 	u64 fpr[32];
410 	u64 fpscr;
411 
412 #ifdef CONFIG_SPE
413 	ulong evr[32];
414 	ulong spefscr;
415 	ulong host_spefscr;
416 	u64 acc;
417 #endif
418 #ifdef CONFIG_ALTIVEC
419 	vector128 vr[32];
420 	vector128 vscr;
421 #endif
422 
423 #ifdef CONFIG_VSX
424 	u64 vsr[64];
425 #endif
426 
427 #ifdef CONFIG_KVM_BOOKE_HV
428 	u32 host_mas4;
429 	u32 host_mas6;
430 	u32 shadow_epcr;
431 	u32 shadow_msrp;
432 	u32 eplc;
433 	u32 epsc;
434 	u32 oldpir;
435 #endif
436 
	/* epcr exists on BookE only, and then only for HV or 64-bit builds */
437 #if defined(CONFIG_BOOKE)
438 #if defined(CONFIG_KVM_BOOKE_HV) || defined(CONFIG_64BIT)
439 	u32 epcr;
440 #endif
441 #endif
442 
443 #ifdef CONFIG_PPC_BOOK3S
444 	/* For Gekko paired singles */
445 	u32 qpr[32];
446 #endif
447 
448 	ulong pc;
449 	ulong ctr;
450 	ulong lr;
451 
452 	ulong xer;
453 	u32 cr;
454 
455 #ifdef CONFIG_PPC_BOOK3S
456 	ulong hflags;
457 	ulong guest_owned_ext;
458 	ulong purr;
459 	ulong spurr;
460 	ulong dscr;
461 	ulong amr;
462 	ulong uamor;
463 	u32 ctrl;
464 	ulong dabr;
465 	ulong cfar;
466 #endif
467 	u32 vrsave; /* also USPRG0 */
468 	u32 mmucr;
469 	/* shadow_msr is unused for BookE HV */
470 	ulong shadow_msr;
471 	ulong csrr0;
472 	ulong csrr1;
473 	ulong dsrr0;
474 	ulong dsrr1;
475 	ulong mcsrr0;
476 	ulong mcsrr1;
477 	ulong mcsr;
478 	u32 dec;
479 #ifdef CONFIG_BOOKE
480 	u32 decar;
481 #endif
482 	u32 tbl;
483 	u32 tbu;
484 	u32 tcr;
485 	ulong tsr; /* we need to perform set/clr_bits() which requires ulong */
486 	u32 ivor[64];
487 	ulong ivpr;
488 	u32 pvr;
489 
490 	u32 shadow_pid;
491 	u32 shadow_pid1;
492 	u32 pid;
493 	u32 swap_pid;
494 
495 	u32 ccr0;
496 	u32 ccr1;
497 	u32 dbsr;
498 
499 	u64 mmcr[3];
500 	u32 pmc[8];
501 
	/*
	 * Exit-timing statistics.  Each array has one slot per
	 * enum kvm_exit_types value.
	 */
502 #ifdef CONFIG_KVM_EXIT_TIMING
503 	struct mutex exit_timing_lock;
504 	struct kvmppc_exit_timing timing_exit;
505 	struct kvmppc_exit_timing timing_last_enter;
506 	u32 last_exit_type;
507 	u32 timing_count_type[__NUMBER_OF_KVM_EXIT_TYPES];
508 	u64 timing_sum_duration[__NUMBER_OF_KVM_EXIT_TYPES];
509 	u64 timing_sum_quad_duration[__NUMBER_OF_KVM_EXIT_TYPES];
510 	u64 timing_min_duration[__NUMBER_OF_KVM_EXIT_TYPES];
511 	u64 timing_max_duration[__NUMBER_OF_KVM_EXIT_TYPES];
512 	u64 timing_last_exit;
513 	struct dentry *debugfs_exit_timing;
514 #endif
515 
516 #ifdef CONFIG_PPC_BOOK3S
517 	ulong fault_dar;
518 	u32 fault_dsisr;
519 #endif
520 
521 #ifdef CONFIG_BOOKE
522 	ulong fault_dear;
523 	ulong fault_esr;
524 	ulong queued_dear;
525 	ulong queued_esr;
526 	spinlock_t wdt_lock;
527 	struct timer_list wdt_timer;
528 	u32 tlbcfg[4];
529 	u32 tlbps[4];
530 	u32 mmucfg;
531 	u32 eptcfg;
532 	u32 epr;
533 	u32 crit_save;
534 	struct kvmppc_booke_debug_reg dbg_reg;
535 #endif
536 	gpa_t paddr_accessed;
537 	gva_t vaddr_accessed;
538 
	/* Byte-sized flags and selectors */
539 	u8 io_gpr; /* GPR used as IO source/target */
540 	u8 mmio_is_bigendian;
541 	u8 mmio_sign_extend;
542 	u8 dcr_needed;
543 	u8 dcr_is_write;
544 	u8 osi_needed;
545 	u8 osi_enabled;
546 	u8 papr_enabled;
547 	u8 watchdog_enabled;
548 	u8 sane;
549 	u8 cpu_type;
550 	u8 hcall_needed;
551 	u8 epr_flags; /* KVMPPC_EPR_xxx */
552 	u8 epr_needed;
553 
554 	u32 cpr0_cfgaddr; /* holds the last set cpr0_cfgaddr */
555 
556 	struct hrtimer dec_timer;
557 	struct tasklet_struct tasklet;
558 	u64 dec_jiffies;
559 	u64 dec_expires;
560 	unsigned long pending_exceptions;
561 	u8 ceded;
562 	u8 prodded;
563 	u32 last_inst;
564 
565 	wait_queue_head_t *wqp;
566 	struct kvmppc_vcore *vcore;
567 	int ret;
568 	int trap;
	/* One of the KVMPPC_VCPU_* values */
569 	int state;
570 	int ptid;
571 	bool timer_running;
572 	wait_queue_head_t cpu_run;
573 
574 	struct kvm_vcpu_arch_shared *shared;
575 	unsigned long magic_page_pa; /* phys addr to map the magic page to */
576 	unsigned long magic_page_ea; /* effect. addr to map the magic page to */
577 
578 	int irq_type;		/* one of KVMPPC_IRQ_* */
579 	int irq_cpu_id;
580 	struct openpic *mpic;	/* KVMPPC_IRQ_MPIC */
581 #ifdef CONFIG_KVM_XICS
582 	struct kvmppc_icp *icp; /* XICS presentation controller */
583 #endif
584 
585 #ifdef CONFIG_KVM_BOOK3S_64_HV
	/* NOTE(review): presumably the storage that 'shared' points at on
	 * HV builds - confirm against the vcpu creation code */
586 	struct kvm_vcpu_arch_shared shregs;
587 
588 	unsigned long pgfault_addr;
589 	long pgfault_index;
590 	unsigned long pgfault_hpte[2];
591 
592 	struct list_head run_list;
593 	struct task_struct *run_task;
594 	struct kvm_run *kvm_run;
595 	pgd_t *pgdir;
596 
	/* The three guest-registered areas, each tracked by a kvmppc_vpa */
597 	spinlock_t vpa_update_lock;
598 	struct kvmppc_vpa vpa;
599 	struct kvmppc_vpa dtl;
600 	struct dtl_entry *dtl_ptr;
601 	unsigned long dtl_index;
602 	u64 stolen_logged;
603 	struct kvmppc_vpa slb_shadow;
604 
605 	spinlock_t tbacct_lock;
606 	u64 busy_stolen;
607 	u64 busy_preempt;
608 #endif
609 };
610 
611 /* Values for vcpu->arch.state */
612 #define KVMPPC_VCPU_NOTREADY		0
613 #define KVMPPC_VCPU_RUNNABLE		1
614 #define KVMPPC_VCPU_BUSY_IN_HOST	2
615 
616 /* Values for vcpu->arch.io_gpr */
/*
 * The low 5 bits (KVM_MMIO_REG_MASK) select a register number 0-31; the
 * bits above select the register file (GPR, FPR, QPR or FQPR).
 * NOTE(review): io_gpr is declared as u8 in struct kvm_vcpu_arch, so of
 * the 16-bit KVM_MMIO_REG_EXT_MASK only bits 5-7 can ever be stored.  The
 * four register-file values defined here all fit; any new value above
 * 0x00e0 would require widening io_gpr.
 */
617 #define KVM_MMIO_REG_MASK	0x001f
618 #define KVM_MMIO_REG_EXT_MASK	0xffe0
619 #define KVM_MMIO_REG_GPR	0x0000
620 #define KVM_MMIO_REG_FPR	0x0020
621 #define KVM_MMIO_REG_QPR	0x0040
622 #define KVM_MMIO_REG_FQPR	0x0060
623 
/*
 * Feature flags defined with no value, so they can only be tested with
 * #ifdef / defined().
 * NOTE(review): presumably consumed by the generic KVM code; __KVM_HAVE_ARCH_WQP
 * looks related to the 'wqp' wait-queue pointer in struct kvm_vcpu_arch - confirm.
 */
624 #define __KVM_HAVE_ARCH_WQP
625 #define __KVM_HAVE_CREATE_DEVICE
626 
627 #endif /* __POWERPC_KVM_HOST_H__ */
628