1 /* 2 * This file is subject to the terms and conditions of the GNU General Public 3 * License. See the file "COPYING" in the main directory of this archive 4 * for more details. 5 * 6 * KVM/MIPS: Support for hardware virtualization extensions 7 * 8 * Copyright (C) 2012 MIPS Technologies, Inc. All rights reserved. 9 * Authors: Yann Le Du <ledu@kymasys.com> 10 */ 11 12 #include <linux/errno.h> 13 #include <linux/err.h> 14 #include <linux/module.h> 15 #include <linux/preempt.h> 16 #include <linux/vmalloc.h> 17 #include <asm/cacheflush.h> 18 #include <asm/cacheops.h> 19 #include <asm/cmpxchg.h> 20 #include <asm/fpu.h> 21 #include <asm/hazards.h> 22 #include <asm/inst.h> 23 #include <asm/mmu_context.h> 24 #include <asm/r4kcache.h> 25 #include <asm/time.h> 26 #include <asm/tlb.h> 27 #include <asm/tlbex.h> 28 29 #include <linux/kvm_host.h> 30 31 #include "interrupt.h" 32 #include "loongson_regs.h" 33 34 #include "trace.h" 35 36 /* Pointers to last VCPU loaded on each physical CPU */ 37 static struct kvm_vcpu *last_vcpu[NR_CPUS]; 38 /* Pointers to last VCPU executed on each physical CPU */ 39 static struct kvm_vcpu *last_exec_vcpu[NR_CPUS]; 40 41 /* 42 * Number of guest VTLB entries to use, so we can catch inconsistency between 43 * CPUs. 44 */ 45 static unsigned int kvm_vz_guest_vtlb_size; 46 47 static inline long kvm_vz_read_gc0_ebase(void) 48 { 49 if (sizeof(long) == 8 && cpu_has_ebase_wg) 50 return read_gc0_ebase_64(); 51 else 52 return read_gc0_ebase(); 53 } 54 55 static inline void kvm_vz_write_gc0_ebase(long v) 56 { 57 /* 58 * First write with WG=1 to write upper bits, then write again in case 59 * WG should be left at 0. 60 * write_gc0_ebase_64() is no longer UNDEFINED since R6. 61 */ 62 if (sizeof(long) == 8 && 63 (cpu_has_mips64r6 || cpu_has_ebase_wg)) { 64 write_gc0_ebase_64(v | MIPS_EBASE_WG); 65 write_gc0_ebase_64(v); 66 } else { 67 write_gc0_ebase(v | MIPS_EBASE_WG); 68 write_gc0_ebase(v); 69 } 70 } 71 72 /* 73 * These Config bits may be writable by the guest: 74 * Config: [K23, KU] (!TLB), K0 75 * Config1: (none) 76 * Config2: [TU, SU] (impl) 77 * Config3: ISAOnExc 78 * Config4: FTLBPageSize 79 * Config5: K, CV, MSAEn, UFE, FRE, SBRI, UFR 80 */ 81 82 static inline unsigned int kvm_vz_config_guest_wrmask(struct kvm_vcpu *vcpu) 83 { 84 return CONF_CM_CMASK; 85 } 86 87 static inline unsigned int kvm_vz_config1_guest_wrmask(struct kvm_vcpu *vcpu) 88 { 89 return 0; 90 } 91 92 static inline unsigned int kvm_vz_config2_guest_wrmask(struct kvm_vcpu *vcpu) 93 { 94 return 0; 95 } 96 97 static inline unsigned int kvm_vz_config3_guest_wrmask(struct kvm_vcpu *vcpu) 98 { 99 return MIPS_CONF3_ISA_OE; 100 } 101 102 static inline unsigned int kvm_vz_config4_guest_wrmask(struct kvm_vcpu *vcpu) 103 { 104 /* no need to be exact */ 105 return MIPS_CONF4_VFTLBPAGESIZE; 106 } 107 108 static inline unsigned int kvm_vz_config5_guest_wrmask(struct kvm_vcpu *vcpu) 109 { 110 unsigned int mask = MIPS_CONF5_K | MIPS_CONF5_CV | MIPS_CONF5_SBRI; 111 112 /* Permit MSAEn changes if MSA supported and enabled */ 113 if (kvm_mips_guest_has_msa(&vcpu->arch)) 114 mask |= MIPS_CONF5_MSAEN; 115 116 /* 117 * Permit guest FPU mode changes if FPU is enabled and the relevant 118 * feature exists according to FIR register. 119 */ 120 if (kvm_mips_guest_has_fpu(&vcpu->arch)) { 121 if (cpu_has_ufr) 122 mask |= MIPS_CONF5_UFR; 123 if (cpu_has_fre) 124 mask |= MIPS_CONF5_FRE | MIPS_CONF5_UFE; 125 } 126 127 return mask; 128 } 129 130 static inline unsigned int kvm_vz_config6_guest_wrmask(struct kvm_vcpu *vcpu) 131 { 132 return LOONGSON_CONF6_INTIMER | LOONGSON_CONF6_EXTIMER; 133 } 134 135 /* 136 * VZ optionally allows these additional Config bits to be written by root: 137 * Config: M, [MT] 138 * Config1: M, [MMUSize-1, C2, MD, PC, WR, CA], FP 139 * Config2: M 140 * Config3: M, MSAP, [BPG], ULRI, [DSP2P, DSPP], CTXTC, [ITL, LPA, VEIC, 141 * VInt, SP, CDMM, MT, SM, TL] 142 * Config4: M, [VTLBSizeExt, MMUSizeExt] 143 * Config5: MRP 144 */ 145 146 static inline unsigned int kvm_vz_config_user_wrmask(struct kvm_vcpu *vcpu) 147 { 148 return kvm_vz_config_guest_wrmask(vcpu) | MIPS_CONF_M; 149 } 150 151 static inline unsigned int kvm_vz_config1_user_wrmask(struct kvm_vcpu *vcpu) 152 { 153 unsigned int mask = kvm_vz_config1_guest_wrmask(vcpu) | MIPS_CONF_M; 154 155 /* Permit FPU to be present if FPU is supported */ 156 if (kvm_mips_guest_can_have_fpu(&vcpu->arch)) 157 mask |= MIPS_CONF1_FP; 158 159 return mask; 160 } 161 162 static inline unsigned int kvm_vz_config2_user_wrmask(struct kvm_vcpu *vcpu) 163 { 164 return kvm_vz_config2_guest_wrmask(vcpu) | MIPS_CONF_M; 165 } 166 167 static inline unsigned int kvm_vz_config3_user_wrmask(struct kvm_vcpu *vcpu) 168 { 169 unsigned int mask = kvm_vz_config3_guest_wrmask(vcpu) | MIPS_CONF_M | 170 MIPS_CONF3_ULRI | MIPS_CONF3_CTXTC; 171 172 /* Permit MSA to be present if MSA is supported */ 173 if (kvm_mips_guest_can_have_msa(&vcpu->arch)) 174 mask |= MIPS_CONF3_MSA; 175 176 return mask; 177 } 178 179 static inline unsigned int kvm_vz_config4_user_wrmask(struct kvm_vcpu *vcpu) 180 { 181 return kvm_vz_config4_guest_wrmask(vcpu) | MIPS_CONF_M; 182 } 183 184 static inline unsigned int kvm_vz_config5_user_wrmask(struct kvm_vcpu *vcpu) 185 { 186 return kvm_vz_config5_guest_wrmask(vcpu) | MIPS_CONF5_MRP; 187 } 188 189 static inline unsigned int kvm_vz_config6_user_wrmask(struct kvm_vcpu *vcpu) 190 { 191 return kvm_vz_config6_guest_wrmask(vcpu) | 192 LOONGSON_CONF6_SFBEN | LOONGSON_CONF6_FTLBDIS; 193 } 194 195 static gpa_t kvm_vz_gva_to_gpa_cb(gva_t gva) 196 { 197 /* VZ guest has already converted gva to gpa */ 198 return gva; 199 } 200 201 static void kvm_vz_queue_irq(struct kvm_vcpu *vcpu, unsigned int priority) 202 { 203 set_bit(priority, &vcpu->arch.pending_exceptions); 204 clear_bit(priority, &vcpu->arch.pending_exceptions_clr); 205 } 206 207 static void kvm_vz_dequeue_irq(struct kvm_vcpu *vcpu, unsigned int priority) 208 { 209 clear_bit(priority, &vcpu->arch.pending_exceptions); 210 set_bit(priority, &vcpu->arch.pending_exceptions_clr); 211 } 212 213 static void kvm_vz_queue_timer_int_cb(struct kvm_vcpu *vcpu) 214 { 215 /* 216 * timer expiry is asynchronous to vcpu execution therefore defer guest 217 * cp0 accesses 218 */ 219 kvm_vz_queue_irq(vcpu, MIPS_EXC_INT_TIMER); 220 } 221 222 static void kvm_vz_dequeue_timer_int_cb(struct kvm_vcpu *vcpu) 223 { 224 /* 225 * timer expiry is asynchronous to vcpu execution therefore defer guest 226 * cp0 accesses 227 */ 228 kvm_vz_dequeue_irq(vcpu, MIPS_EXC_INT_TIMER); 229 } 230 231 static void kvm_vz_queue_io_int_cb(struct kvm_vcpu *vcpu, 232 struct kvm_mips_interrupt *irq) 233 { 234 int intr = (int)irq->irq; 235 236 /* 237 * interrupts are asynchronous to vcpu execution therefore defer guest 238 * cp0 accesses 239 */ 240 kvm_vz_queue_irq(vcpu, kvm_irq_to_priority(intr)); 241 } 242 243 static void kvm_vz_dequeue_io_int_cb(struct kvm_vcpu *vcpu, 244 struct kvm_mips_interrupt *irq) 245 { 246 int intr = (int)irq->irq; 247 248 /* 249 * interrupts are asynchronous to vcpu execution therefore defer guest 250 * cp0 accesses 251 */ 252 kvm_vz_dequeue_irq(vcpu, kvm_irq_to_priority(-intr)); 253 } 254 255 static int kvm_vz_irq_deliver_cb(struct kvm_vcpu *vcpu, unsigned int priority, 256 u32 cause) 257 { 258 u32 irq = (priority < MIPS_EXC_MAX) ? 259 kvm_priority_to_irq[priority] : 0; 260 261 switch (priority) { 262 case MIPS_EXC_INT_TIMER: 263 set_gc0_cause(C_TI); 264 break; 265 266 case MIPS_EXC_INT_IO_1: 267 case MIPS_EXC_INT_IO_2: 268 case MIPS_EXC_INT_IPI_1: 269 case MIPS_EXC_INT_IPI_2: 270 if (cpu_has_guestctl2) 271 set_c0_guestctl2(irq); 272 else 273 set_gc0_cause(irq); 274 break; 275 276 default: 277 break; 278 } 279 280 clear_bit(priority, &vcpu->arch.pending_exceptions); 281 return 1; 282 } 283 284 static int kvm_vz_irq_clear_cb(struct kvm_vcpu *vcpu, unsigned int priority, 285 u32 cause) 286 { 287 u32 irq = (priority < MIPS_EXC_MAX) ? 288 kvm_priority_to_irq[priority] : 0; 289 290 switch (priority) { 291 case MIPS_EXC_INT_TIMER: 292 /* 293 * Call to kvm_write_c0_guest_compare() clears Cause.TI in 294 * kvm_mips_emulate_CP0(). Explicitly clear irq associated with 295 * Cause.IP[IPTI] if GuestCtl2 virtual interrupt register not 296 * supported or if not using GuestCtl2 Hardware Clear. 297 */ 298 if (cpu_has_guestctl2) { 299 if (!(read_c0_guestctl2() & (irq << 14))) 300 clear_c0_guestctl2(irq); 301 } else { 302 clear_gc0_cause(irq); 303 } 304 break; 305 306 case MIPS_EXC_INT_IO_1: 307 case MIPS_EXC_INT_IO_2: 308 case MIPS_EXC_INT_IPI_1: 309 case MIPS_EXC_INT_IPI_2: 310 /* Clear GuestCtl2.VIP irq if not using Hardware Clear */ 311 if (cpu_has_guestctl2) { 312 if (!(read_c0_guestctl2() & (irq << 14))) 313 clear_c0_guestctl2(irq); 314 } else { 315 clear_gc0_cause(irq); 316 } 317 break; 318 319 default: 320 break; 321 } 322 323 clear_bit(priority, &vcpu->arch.pending_exceptions_clr); 324 return 1; 325 } 326 327 /* 328 * VZ guest timer handling. 329 */ 330 331 /** 332 * kvm_vz_should_use_htimer() - Find whether to use the VZ hard guest timer. 333 * @vcpu: Virtual CPU. 334 * 335 * Returns: true if the VZ GTOffset & real guest CP0_Count should be used 336 * instead of software emulation of guest timer. 337 * false otherwise. 338 */ 339 static bool kvm_vz_should_use_htimer(struct kvm_vcpu *vcpu) 340 { 341 if (kvm_mips_count_disabled(vcpu)) 342 return false; 343 344 /* Chosen frequency must match real frequency */ 345 if (mips_hpt_frequency != vcpu->arch.count_hz) 346 return false; 347 348 /* We don't support a CP0_GTOffset with fewer bits than CP0_Count */ 349 if (current_cpu_data.gtoffset_mask != 0xffffffff) 350 return false; 351 352 return true; 353 } 354 355 /** 356 * _kvm_vz_restore_stimer() - Restore soft timer state. 357 * @vcpu: Virtual CPU. 358 * @compare: CP0_Compare register value, restored by caller. 359 * @cause: CP0_Cause register to restore. 360 * 361 * Restore VZ state relating to the soft timer. The hard timer can be enabled 362 * later. 363 */ 364 static void _kvm_vz_restore_stimer(struct kvm_vcpu *vcpu, u32 compare, 365 u32 cause) 366 { 367 /* 368 * Avoid spurious counter interrupts by setting Guest CP0_Count to just 369 * after Guest CP0_Compare. 370 */ 371 write_c0_gtoffset(compare - read_c0_count()); 372 373 back_to_back_c0_hazard(); 374 write_gc0_cause(cause); 375 } 376 377 /** 378 * _kvm_vz_restore_htimer() - Restore hard timer state. 379 * @vcpu: Virtual CPU. 380 * @compare: CP0_Compare register value, restored by caller. 381 * @cause: CP0_Cause register to restore. 382 * 383 * Restore hard timer Guest.Count & Guest.Cause taking care to preserve the 384 * value of Guest.CP0_Cause.TI while restoring Guest.CP0_Cause. 385 */ 386 static void _kvm_vz_restore_htimer(struct kvm_vcpu *vcpu, 387 u32 compare, u32 cause) 388 { 389 u32 start_count, after_count; 390 ktime_t freeze_time; 391 unsigned long flags; 392 393 /* 394 * Freeze the soft-timer and sync the guest CP0_Count with it. We do 395 * this with interrupts disabled to avoid latency. 396 */ 397 local_irq_save(flags); 398 freeze_time = kvm_mips_freeze_hrtimer(vcpu, &start_count); 399 write_c0_gtoffset(start_count - read_c0_count()); 400 local_irq_restore(flags); 401 402 /* restore guest CP0_Cause, as TI may already be set */ 403 back_to_back_c0_hazard(); 404 write_gc0_cause(cause); 405 406 /* 407 * The above sequence isn't atomic and would result in lost timer 408 * interrupts if we're not careful. Detect if a timer interrupt is due 409 * and assert it. 410 */ 411 back_to_back_c0_hazard(); 412 after_count = read_gc0_count(); 413 if (after_count - start_count > compare - start_count - 1) 414 kvm_vz_queue_irq(vcpu, MIPS_EXC_INT_TIMER); 415 } 416 417 /** 418 * kvm_vz_restore_timer() - Restore timer state. 419 * @vcpu: Virtual CPU. 420 * 421 * Restore soft timer state from saved context. 422 */ 423 static void kvm_vz_restore_timer(struct kvm_vcpu *vcpu) 424 { 425 struct mips_coproc *cop0 = vcpu->arch.cop0; 426 u32 cause, compare; 427 428 compare = kvm_read_sw_gc0_compare(cop0); 429 cause = kvm_read_sw_gc0_cause(cop0); 430 431 write_gc0_compare(compare); 432 _kvm_vz_restore_stimer(vcpu, compare, cause); 433 } 434 435 /** 436 * kvm_vz_acquire_htimer() - Switch to hard timer state. 437 * @vcpu: Virtual CPU. 438 * 439 * Restore hard timer state on top of existing soft timer state if possible. 440 * 441 * Since hard timer won't remain active over preemption, preemption should be 442 * disabled by the caller. 443 */ 444 void kvm_vz_acquire_htimer(struct kvm_vcpu *vcpu) 445 { 446 u32 gctl0; 447 448 gctl0 = read_c0_guestctl0(); 449 if (!(gctl0 & MIPS_GCTL0_GT) && kvm_vz_should_use_htimer(vcpu)) { 450 /* enable guest access to hard timer */ 451 write_c0_guestctl0(gctl0 | MIPS_GCTL0_GT); 452 453 _kvm_vz_restore_htimer(vcpu, read_gc0_compare(), 454 read_gc0_cause()); 455 } 456 } 457 458 /** 459 * _kvm_vz_save_htimer() - Switch to software emulation of guest timer. 460 * @vcpu: Virtual CPU. 461 * @compare: Pointer to write compare value to. 462 * @cause: Pointer to write cause value to. 463 * 464 * Save VZ guest timer state and switch to software emulation of guest CP0 465 * timer. The hard timer must already be in use, so preemption should be 466 * disabled. 467 */ 468 static void _kvm_vz_save_htimer(struct kvm_vcpu *vcpu, 469 u32 *out_compare, u32 *out_cause) 470 { 471 u32 cause, compare, before_count, end_count; 472 ktime_t before_time; 473 474 compare = read_gc0_compare(); 475 *out_compare = compare; 476 477 before_time = ktime_get(); 478 479 /* 480 * Record the CP0_Count *prior* to saving CP0_Cause, so we have a time 481 * at which no pending timer interrupt is missing. 482 */ 483 before_count = read_gc0_count(); 484 back_to_back_c0_hazard(); 485 cause = read_gc0_cause(); 486 *out_cause = cause; 487 488 /* 489 * Record a final CP0_Count which we will transfer to the soft-timer. 490 * This is recorded *after* saving CP0_Cause, so we don't get any timer 491 * interrupts from just after the final CP0_Count point. 492 */ 493 back_to_back_c0_hazard(); 494 end_count = read_gc0_count(); 495 496 /* 497 * The above sequence isn't atomic, so we could miss a timer interrupt 498 * between reading CP0_Cause and end_count. Detect and record any timer 499 * interrupt due between before_count and end_count. 500 */ 501 if (end_count - before_count > compare - before_count - 1) 502 kvm_vz_queue_irq(vcpu, MIPS_EXC_INT_TIMER); 503 504 /* 505 * Restore soft-timer, ignoring a small amount of negative drift due to 506 * delay between freeze_hrtimer and setting CP0_GTOffset. 507 */ 508 kvm_mips_restore_hrtimer(vcpu, before_time, end_count, -0x10000); 509 } 510 511 /** 512 * kvm_vz_save_timer() - Save guest timer state. 513 * @vcpu: Virtual CPU. 514 * 515 * Save VZ guest timer state and switch to soft guest timer if hard timer was in 516 * use. 517 */ 518 static void kvm_vz_save_timer(struct kvm_vcpu *vcpu) 519 { 520 struct mips_coproc *cop0 = vcpu->arch.cop0; 521 u32 gctl0, compare, cause; 522 523 gctl0 = read_c0_guestctl0(); 524 if (gctl0 & MIPS_GCTL0_GT) { 525 /* disable guest use of hard timer */ 526 write_c0_guestctl0(gctl0 & ~MIPS_GCTL0_GT); 527 528 /* save hard timer state */ 529 _kvm_vz_save_htimer(vcpu, &compare, &cause); 530 } else { 531 compare = read_gc0_compare(); 532 cause = read_gc0_cause(); 533 } 534 535 /* save timer-related state to VCPU context */ 536 kvm_write_sw_gc0_cause(cop0, cause); 537 kvm_write_sw_gc0_compare(cop0, compare); 538 } 539 540 /** 541 * kvm_vz_lose_htimer() - Ensure hard guest timer is not in use. 542 * @vcpu: Virtual CPU. 543 * 544 * Transfers the state of the hard guest timer to the soft guest timer, leaving 545 * guest state intact so it can continue to be used with the soft timer. 546 */ 547 void kvm_vz_lose_htimer(struct kvm_vcpu *vcpu) 548 { 549 u32 gctl0, compare, cause; 550 551 preempt_disable(); 552 gctl0 = read_c0_guestctl0(); 553 if (gctl0 & MIPS_GCTL0_GT) { 554 /* disable guest use of timer */ 555 write_c0_guestctl0(gctl0 & ~MIPS_GCTL0_GT); 556 557 /* switch to soft timer */ 558 _kvm_vz_save_htimer(vcpu, &compare, &cause); 559 560 /* leave soft timer in usable state */ 561 _kvm_vz_restore_stimer(vcpu, compare, cause); 562 } 563 preempt_enable(); 564 } 565 566 /** 567 * is_eva_access() - Find whether an instruction is an EVA memory accessor. 568 * @inst: 32-bit instruction encoding. 569 * 570 * Finds whether @inst encodes an EVA memory access instruction, which would 571 * indicate that emulation of it should access the user mode address space 572 * instead of the kernel mode address space. This matters for MUSUK segments 573 * which are TLB mapped for user mode but unmapped for kernel mode. 574 * 575 * Returns: Whether @inst encodes an EVA accessor instruction. 576 */ 577 static bool is_eva_access(union mips_instruction inst) 578 { 579 if (inst.spec3_format.opcode != spec3_op) 580 return false; 581 582 switch (inst.spec3_format.func) { 583 case lwle_op: 584 case lwre_op: 585 case cachee_op: 586 case sbe_op: 587 case she_op: 588 case sce_op: 589 case swe_op: 590 case swle_op: 591 case swre_op: 592 case prefe_op: 593 case lbue_op: 594 case lhue_op: 595 case lbe_op: 596 case lhe_op: 597 case lle_op: 598 case lwe_op: 599 return true; 600 default: 601 return false; 602 } 603 } 604 605 /** 606 * is_eva_am_mapped() - Find whether an access mode is mapped. 607 * @vcpu: KVM VCPU state. 608 * @am: 3-bit encoded access mode. 609 * @eu: Segment becomes unmapped and uncached when Status.ERL=1. 610 * 611 * Decode @am to find whether it encodes a mapped segment for the current VCPU 612 * state. Where necessary @eu and the actual instruction causing the fault are 613 * taken into account to make the decision. 614 * 615 * Returns: Whether the VCPU faulted on a TLB mapped address. 616 */ 617 static bool is_eva_am_mapped(struct kvm_vcpu *vcpu, unsigned int am, bool eu) 618 { 619 u32 am_lookup; 620 int err; 621 622 /* 623 * Interpret access control mode. We assume address errors will already 624 * have been caught by the guest, leaving us with: 625 * AM UM SM KM 31..24 23..16 626 * UK 0 000 Unm 0 0 627 * MK 1 001 TLB 1 628 * MSK 2 010 TLB TLB 1 629 * MUSK 3 011 TLB TLB TLB 1 630 * MUSUK 4 100 TLB TLB Unm 0 1 631 * USK 5 101 Unm Unm 0 0 632 * - 6 110 0 0 633 * UUSK 7 111 Unm Unm Unm 0 0 634 * 635 * We shift a magic value by AM across the sign bit to find if always 636 * TLB mapped, and if not shift by 8 again to find if it depends on KM. 637 */ 638 am_lookup = 0x70080000 << am; 639 if ((s32)am_lookup < 0) { 640 /* 641 * MK, MSK, MUSK 642 * Always TLB mapped, unless SegCtl.EU && ERL 643 */ 644 if (!eu || !(read_gc0_status() & ST0_ERL)) 645 return true; 646 } else { 647 am_lookup <<= 8; 648 if ((s32)am_lookup < 0) { 649 union mips_instruction inst; 650 unsigned int status; 651 u32 *opc; 652 653 /* 654 * MUSUK 655 * TLB mapped if not in kernel mode 656 */ 657 status = read_gc0_status(); 658 if (!(status & (ST0_EXL | ST0_ERL)) && 659 (status & ST0_KSU)) 660 return true; 661 /* 662 * EVA access instructions in kernel 663 * mode access user address space. 664 */ 665 opc = (u32 *)vcpu->arch.pc; 666 if (vcpu->arch.host_cp0_cause & CAUSEF_BD) 667 opc += 1; 668 err = kvm_get_badinstr(opc, vcpu, &inst.word); 669 if (!err && is_eva_access(inst)) 670 return true; 671 } 672 } 673 674 return false; 675 } 676 677 /** 678 * kvm_vz_gva_to_gpa() - Convert valid GVA to GPA. 679 * @vcpu: KVM VCPU state. 680 * @gva: Guest virtual address to convert. 681 * @gpa: Output guest physical address. 682 * 683 * Convert a guest virtual address (GVA) which is valid according to the guest 684 * context, to a guest physical address (GPA). 685 * 686 * Returns: 0 on success. 687 * -errno on failure. 688 */ 689 static int kvm_vz_gva_to_gpa(struct kvm_vcpu *vcpu, unsigned long gva, 690 unsigned long *gpa) 691 { 692 u32 gva32 = gva; 693 unsigned long segctl; 694 695 if ((long)gva == (s32)gva32) { 696 /* Handle canonical 32-bit virtual address */ 697 if (cpu_guest_has_segments) { 698 unsigned long mask, pa; 699 700 switch (gva32 >> 29) { 701 case 0: 702 case 1: /* CFG5 (1GB) */ 703 segctl = read_gc0_segctl2() >> 16; 704 mask = (unsigned long)0xfc0000000ull; 705 break; 706 case 2: 707 case 3: /* CFG4 (1GB) */ 708 segctl = read_gc0_segctl2(); 709 mask = (unsigned long)0xfc0000000ull; 710 break; 711 case 4: /* CFG3 (512MB) */ 712 segctl = read_gc0_segctl1() >> 16; 713 mask = (unsigned long)0xfe0000000ull; 714 break; 715 case 5: /* CFG2 (512MB) */ 716 segctl = read_gc0_segctl1(); 717 mask = (unsigned long)0xfe0000000ull; 718 break; 719 case 6: /* CFG1 (512MB) */ 720 segctl = read_gc0_segctl0() >> 16; 721 mask = (unsigned long)0xfe0000000ull; 722 break; 723 case 7: /* CFG0 (512MB) */ 724 segctl = read_gc0_segctl0(); 725 mask = (unsigned long)0xfe0000000ull; 726 break; 727 default: 728 /* 729 * GCC 4.9 isn't smart enough to figure out that 730 * segctl and mask are always initialised. 731 */ 732 unreachable(); 733 } 734 735 if (is_eva_am_mapped(vcpu, (segctl >> 4) & 0x7, 736 segctl & 0x0008)) 737 goto tlb_mapped; 738 739 /* Unmapped, find guest physical address */ 740 pa = (segctl << 20) & mask; 741 pa |= gva32 & ~mask; 742 *gpa = pa; 743 return 0; 744 } else if ((s32)gva32 < (s32)0xc0000000) { 745 /* legacy unmapped KSeg0 or KSeg1 */ 746 *gpa = gva32 & 0x1fffffff; 747 return 0; 748 } 749 #ifdef CONFIG_64BIT 750 } else if ((gva & 0xc000000000000000) == 0x8000000000000000) { 751 /* XKPHYS */ 752 if (cpu_guest_has_segments) { 753 /* 754 * Each of the 8 regions can be overridden by SegCtl2.XR 755 * to use SegCtl1.XAM. 756 */ 757 segctl = read_gc0_segctl2(); 758 if (segctl & (1ull << (56 + ((gva >> 59) & 0x7)))) { 759 segctl = read_gc0_segctl1(); 760 if (is_eva_am_mapped(vcpu, (segctl >> 59) & 0x7, 761 0)) 762 goto tlb_mapped; 763 } 764 765 } 766 /* 767 * Traditionally fully unmapped. 768 * Bits 61:59 specify the CCA, which we can just mask off here. 769 * Bits 58:PABITS should be zero, but we shouldn't have got here 770 * if it wasn't. 771 */ 772 *gpa = gva & 0x07ffffffffffffff; 773 return 0; 774 #endif 775 } 776 777 tlb_mapped: 778 return kvm_vz_guest_tlb_lookup(vcpu, gva, gpa); 779 } 780 781 /** 782 * kvm_vz_badvaddr_to_gpa() - Convert GVA BadVAddr from root exception to GPA. 783 * @vcpu: KVM VCPU state. 784 * @badvaddr: Root BadVAddr. 785 * @gpa: Output guest physical address. 786 * 787 * VZ implementations are permitted to report guest virtual addresses (GVA) in 788 * BadVAddr on a root exception during guest execution, instead of the more 789 * convenient guest physical addresses (GPA). When we get a GVA, this function 790 * converts it to a GPA, taking into account guest segmentation and guest TLB 791 * state. 792 * 793 * Returns: 0 on success. 794 * -errno on failure. 795 */ 796 static int kvm_vz_badvaddr_to_gpa(struct kvm_vcpu *vcpu, unsigned long badvaddr, 797 unsigned long *gpa) 798 { 799 unsigned int gexccode = (vcpu->arch.host_cp0_guestctl0 & 800 MIPS_GCTL0_GEXC) >> MIPS_GCTL0_GEXC_SHIFT; 801 802 /* If BadVAddr is GPA, then all is well in the world */ 803 if (likely(gexccode == MIPS_GCTL0_GEXC_GPA)) { 804 *gpa = badvaddr; 805 return 0; 806 } 807 808 /* Otherwise we'd expect it to be GVA ... */ 809 if (WARN(gexccode != MIPS_GCTL0_GEXC_GVA, 810 "Unexpected gexccode %#x\n", gexccode)) 811 return -EINVAL; 812 813 /* ... and we need to perform the GVA->GPA translation in software */ 814 return kvm_vz_gva_to_gpa(vcpu, badvaddr, gpa); 815 } 816 817 static int kvm_trap_vz_no_handler(struct kvm_vcpu *vcpu) 818 { 819 u32 *opc = (u32 *) vcpu->arch.pc; 820 u32 cause = vcpu->arch.host_cp0_cause; 821 u32 exccode = (cause & CAUSEF_EXCCODE) >> CAUSEB_EXCCODE; 822 unsigned long badvaddr = vcpu->arch.host_cp0_badvaddr; 823 u32 inst = 0; 824 825 /* 826 * Fetch the instruction. 827 */ 828 if (cause & CAUSEF_BD) 829 opc += 1; 830 kvm_get_badinstr(opc, vcpu, &inst); 831 832 kvm_err("Exception Code: %d not handled @ PC: %p, inst: 0x%08x BadVaddr: %#lx Status: %#x\n", 833 exccode, opc, inst, badvaddr, 834 read_gc0_status()); 835 kvm_arch_vcpu_dump_regs(vcpu); 836 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 837 return RESUME_HOST; 838 } 839 840 static unsigned long mips_process_maar(unsigned int op, unsigned long val) 841 { 842 /* Mask off unused bits */ 843 unsigned long mask = 0xfffff000 | MIPS_MAAR_S | MIPS_MAAR_VL; 844 845 if (read_gc0_pagegrain() & PG_ELPA) 846 mask |= 0x00ffffff00000000ull; 847 if (cpu_guest_has_mvh) 848 mask |= MIPS_MAAR_VH; 849 850 /* Set or clear VH */ 851 if (op == mtc_op) { 852 /* clear VH */ 853 val &= ~MIPS_MAAR_VH; 854 } else if (op == dmtc_op) { 855 /* set VH to match VL */ 856 val &= ~MIPS_MAAR_VH; 857 if (val & MIPS_MAAR_VL) 858 val |= MIPS_MAAR_VH; 859 } 860 861 return val & mask; 862 } 863 864 static void kvm_write_maari(struct kvm_vcpu *vcpu, unsigned long val) 865 { 866 struct mips_coproc *cop0 = vcpu->arch.cop0; 867 868 val &= MIPS_MAARI_INDEX; 869 if (val == MIPS_MAARI_INDEX) 870 kvm_write_sw_gc0_maari(cop0, ARRAY_SIZE(vcpu->arch.maar) - 1); 871 else if (val < ARRAY_SIZE(vcpu->arch.maar)) 872 kvm_write_sw_gc0_maari(cop0, val); 873 } 874 875 static enum emulation_result kvm_vz_gpsi_cop0(union mips_instruction inst, 876 u32 *opc, u32 cause, 877 struct kvm_vcpu *vcpu) 878 { 879 struct mips_coproc *cop0 = vcpu->arch.cop0; 880 enum emulation_result er = EMULATE_DONE; 881 u32 rt, rd, sel; 882 unsigned long curr_pc; 883 unsigned long val; 884 885 /* 886 * Update PC and hold onto current PC in case there is 887 * an error and we want to rollback the PC 888 */ 889 curr_pc = vcpu->arch.pc; 890 er = update_pc(vcpu, cause); 891 if (er == EMULATE_FAIL) 892 return er; 893 894 if (inst.co_format.co) { 895 switch (inst.co_format.func) { 896 case wait_op: 897 er = kvm_mips_emul_wait(vcpu); 898 break; 899 default: 900 er = EMULATE_FAIL; 901 } 902 } else { 903 rt = inst.c0r_format.rt; 904 rd = inst.c0r_format.rd; 905 sel = inst.c0r_format.sel; 906 907 switch (inst.c0r_format.rs) { 908 case dmfc_op: 909 case mfc_op: 910 #ifdef CONFIG_KVM_MIPS_DEBUG_COP0_COUNTERS 911 cop0->stat[rd][sel]++; 912 #endif 913 if (rd == MIPS_CP0_COUNT && 914 sel == 0) { /* Count */ 915 val = kvm_mips_read_count(vcpu); 916 } else if (rd == MIPS_CP0_COMPARE && 917 sel == 0) { /* Compare */ 918 val = read_gc0_compare(); 919 } else if (rd == MIPS_CP0_LLADDR && 920 sel == 0) { /* LLAddr */ 921 if (cpu_guest_has_rw_llb) 922 val = read_gc0_lladdr() & 923 MIPS_LLADDR_LLB; 924 else 925 val = 0; 926 } else if (rd == MIPS_CP0_LLADDR && 927 sel == 1 && /* MAAR */ 928 cpu_guest_has_maar && 929 !cpu_guest_has_dyn_maar) { 930 /* MAARI must be in range */ 931 BUG_ON(kvm_read_sw_gc0_maari(cop0) >= 932 ARRAY_SIZE(vcpu->arch.maar)); 933 val = vcpu->arch.maar[ 934 kvm_read_sw_gc0_maari(cop0)]; 935 } else if ((rd == MIPS_CP0_PRID && 936 (sel == 0 || /* PRid */ 937 sel == 2 || /* CDMMBase */ 938 sel == 3)) || /* CMGCRBase */ 939 (rd == MIPS_CP0_STATUS && 940 (sel == 2 || /* SRSCtl */ 941 sel == 3)) || /* SRSMap */ 942 (rd == MIPS_CP0_CONFIG && 943 (sel == 6 || /* Config6 */ 944 sel == 7)) || /* Config7 */ 945 (rd == MIPS_CP0_LLADDR && 946 (sel == 2) && /* MAARI */ 947 cpu_guest_has_maar && 948 !cpu_guest_has_dyn_maar) || 949 (rd == MIPS_CP0_ERRCTL && 950 (sel == 0))) { /* ErrCtl */ 951 val = cop0->reg[rd][sel]; 952 #ifdef CONFIG_CPU_LOONGSON64 953 } else if (rd == MIPS_CP0_DIAG && 954 (sel == 0)) { /* Diag */ 955 val = cop0->reg[rd][sel]; 956 #endif 957 } else { 958 val = 0; 959 er = EMULATE_FAIL; 960 } 961 962 if (er != EMULATE_FAIL) { 963 /* Sign extend */ 964 if (inst.c0r_format.rs == mfc_op) 965 val = (int)val; 966 vcpu->arch.gprs[rt] = val; 967 } 968 969 trace_kvm_hwr(vcpu, (inst.c0r_format.rs == mfc_op) ? 970 KVM_TRACE_MFC0 : KVM_TRACE_DMFC0, 971 KVM_TRACE_COP0(rd, sel), val); 972 break; 973 974 case dmtc_op: 975 case mtc_op: 976 #ifdef CONFIG_KVM_MIPS_DEBUG_COP0_COUNTERS 977 cop0->stat[rd][sel]++; 978 #endif 979 val = vcpu->arch.gprs[rt]; 980 trace_kvm_hwr(vcpu, (inst.c0r_format.rs == mtc_op) ? 981 KVM_TRACE_MTC0 : KVM_TRACE_DMTC0, 982 KVM_TRACE_COP0(rd, sel), val); 983 984 if (rd == MIPS_CP0_COUNT && 985 sel == 0) { /* Count */ 986 kvm_vz_lose_htimer(vcpu); 987 kvm_mips_write_count(vcpu, vcpu->arch.gprs[rt]); 988 } else if (rd == MIPS_CP0_COMPARE && 989 sel == 0) { /* Compare */ 990 kvm_mips_write_compare(vcpu, 991 vcpu->arch.gprs[rt], 992 true); 993 } else if (rd == MIPS_CP0_LLADDR && 994 sel == 0) { /* LLAddr */ 995 /* 996 * P5600 generates GPSI on guest MTC0 LLAddr. 997 * Only allow the guest to clear LLB. 998 */ 999 if (cpu_guest_has_rw_llb && 1000 !(val & MIPS_LLADDR_LLB)) 1001 write_gc0_lladdr(0); 1002 } else if (rd == MIPS_CP0_LLADDR && 1003 sel == 1 && /* MAAR */ 1004 cpu_guest_has_maar && 1005 !cpu_guest_has_dyn_maar) { 1006 val = mips_process_maar(inst.c0r_format.rs, 1007 val); 1008 1009 /* MAARI must be in range */ 1010 BUG_ON(kvm_read_sw_gc0_maari(cop0) >= 1011 ARRAY_SIZE(vcpu->arch.maar)); 1012 vcpu->arch.maar[kvm_read_sw_gc0_maari(cop0)] = 1013 val; 1014 } else if (rd == MIPS_CP0_LLADDR && 1015 (sel == 2) && /* MAARI */ 1016 cpu_guest_has_maar && 1017 !cpu_guest_has_dyn_maar) { 1018 kvm_write_maari(vcpu, val); 1019 } else if (rd == MIPS_CP0_CONFIG && 1020 (sel == 6)) { 1021 cop0->reg[rd][sel] = (int)val; 1022 } else if (rd == MIPS_CP0_ERRCTL && 1023 (sel == 0)) { /* ErrCtl */ 1024 /* ignore the written value */ 1025 #ifdef CONFIG_CPU_LOONGSON64 1026 } else if (rd == MIPS_CP0_DIAG && 1027 (sel == 0)) { /* Diag */ 1028 unsigned long flags; 1029 1030 local_irq_save(flags); 1031 if (val & LOONGSON_DIAG_BTB) { 1032 /* Flush BTB */ 1033 set_c0_diag(LOONGSON_DIAG_BTB); 1034 } 1035 if (val & LOONGSON_DIAG_ITLB) { 1036 /* Flush ITLB */ 1037 set_c0_diag(LOONGSON_DIAG_ITLB); 1038 } 1039 if (val & LOONGSON_DIAG_DTLB) { 1040 /* Flush DTLB */ 1041 set_c0_diag(LOONGSON_DIAG_DTLB); 1042 } 1043 if (val & LOONGSON_DIAG_VTLB) { 1044 /* Flush VTLB */ 1045 kvm_loongson_clear_guest_vtlb(); 1046 } 1047 if (val & LOONGSON_DIAG_FTLB) { 1048 /* Flush FTLB */ 1049 kvm_loongson_clear_guest_ftlb(); 1050 } 1051 local_irq_restore(flags); 1052 #endif 1053 } else { 1054 er = EMULATE_FAIL; 1055 } 1056 break; 1057 1058 default: 1059 er = EMULATE_FAIL; 1060 break; 1061 } 1062 } 1063 /* Rollback PC only if emulation was unsuccessful */ 1064 if (er == EMULATE_FAIL) { 1065 kvm_err("[%#lx]%s: unsupported cop0 instruction 0x%08x\n", 1066 curr_pc, __func__, inst.word); 1067 1068 vcpu->arch.pc = curr_pc; 1069 } 1070 1071 return er; 1072 } 1073 1074 static enum emulation_result kvm_vz_gpsi_cache(union mips_instruction inst, 1075 u32 *opc, u32 cause, 1076 struct kvm_vcpu *vcpu) 1077 { 1078 enum emulation_result er = EMULATE_DONE; 1079 u32 cache, op_inst, op, base; 1080 s16 offset; 1081 struct kvm_vcpu_arch *arch = &vcpu->arch; 1082 unsigned long va, curr_pc; 1083 1084 /* 1085 * Update PC and hold onto current PC in case there is 1086 * an error and we want to rollback the PC 1087 */ 1088 curr_pc = vcpu->arch.pc; 1089 er = update_pc(vcpu, cause); 1090 if (er == EMULATE_FAIL) 1091 return er; 1092 1093 base = inst.i_format.rs; 1094 op_inst = inst.i_format.rt; 1095 if (cpu_has_mips_r6) 1096 offset = inst.spec3_format.simmediate; 1097 else 1098 offset = inst.i_format.simmediate; 1099 cache = op_inst & CacheOp_Cache; 1100 op = op_inst & CacheOp_Op; 1101 1102 va = arch->gprs[base] + offset; 1103 1104 kvm_debug("CACHE (cache: %#x, op: %#x, base[%d]: %#lx, offset: %#x\n", 1105 cache, op, base, arch->gprs[base], offset); 1106 1107 /* Secondary or tirtiary cache ops ignored */ 1108 if (cache != Cache_I && cache != Cache_D) 1109 return EMULATE_DONE; 1110 1111 switch (op_inst) { 1112 case Index_Invalidate_I: 1113 flush_icache_line_indexed(va); 1114 return EMULATE_DONE; 1115 case Index_Writeback_Inv_D: 1116 flush_dcache_line_indexed(va); 1117 return EMULATE_DONE; 1118 case Hit_Invalidate_I: 1119 case Hit_Invalidate_D: 1120 case Hit_Writeback_Inv_D: 1121 if (boot_cpu_type() == CPU_CAVIUM_OCTEON3) { 1122 /* We can just flush entire icache */ 1123 local_flush_icache_range(0, 0); 1124 return EMULATE_DONE; 1125 } 1126 1127 /* So far, other platforms support guest hit cache ops */ 1128 break; 1129 default: 1130 break; 1131 } 1132 1133 kvm_err("@ %#lx/%#lx CACHE (cache: %#x, op: %#x, base[%d]: %#lx, offset: %#x\n", 1134 curr_pc, vcpu->arch.gprs[31], cache, op, base, arch->gprs[base], 1135 offset); 1136 /* Rollback PC */ 1137 vcpu->arch.pc = curr_pc; 1138 1139 return EMULATE_FAIL; 1140 } 1141 1142 #ifdef CONFIG_CPU_LOONGSON64 1143 static enum emulation_result kvm_vz_gpsi_lwc2(union mips_instruction inst, 1144 u32 *opc, u32 cause, 1145 struct kvm_run *run, 1146 struct kvm_vcpu *vcpu) 1147 { 1148 unsigned int rs, rd; 1149 unsigned int hostcfg; 1150 unsigned long curr_pc; 1151 enum emulation_result er = EMULATE_DONE; 1152 1153 /* 1154 * Update PC and hold onto current PC in case there is 1155 * an error and we want to rollback the PC 1156 */ 1157 curr_pc = vcpu->arch.pc; 1158 er = update_pc(vcpu, cause); 1159 if (er == EMULATE_FAIL) 1160 return er; 1161 1162 rs = inst.loongson3_lscsr_format.rs; 1163 rd = inst.loongson3_lscsr_format.rd; 1164 switch (inst.loongson3_lscsr_format.fr) { 1165 case 0x8: /* Read CPUCFG */ 1166 ++vcpu->stat.vz_cpucfg_exits; 1167 hostcfg = read_cpucfg(vcpu->arch.gprs[rs]); 1168 1169 switch (vcpu->arch.gprs[rs]) { 1170 case LOONGSON_CFG0: 1171 vcpu->arch.gprs[rd] = 0x14c000; 1172 break; 1173 case LOONGSON_CFG1: 1174 hostcfg &= (LOONGSON_CFG1_FP | LOONGSON_CFG1_MMI | 1175 LOONGSON_CFG1_MSA1 | LOONGSON_CFG1_MSA2 | 1176 LOONGSON_CFG1_SFBP); 1177 vcpu->arch.gprs[rd] = hostcfg; 1178 break; 1179 case LOONGSON_CFG2: 1180 hostcfg &= (LOONGSON_CFG2_LEXT1 | LOONGSON_CFG2_LEXT2 | 1181 LOONGSON_CFG2_LEXT3 | LOONGSON_CFG2_LSPW); 1182 vcpu->arch.gprs[rd] = hostcfg; 1183 break; 1184 case LOONGSON_CFG3: 1185 vcpu->arch.gprs[rd] = hostcfg; 1186 break; 1187 default: 1188 /* Don't export any other advanced features to guest */ 1189 vcpu->arch.gprs[rd] = 0; 1190 break; 1191 } 1192 break; 1193 1194 default: 1195 kvm_err("lwc2 emulate not impl %d rs %lx @%lx\n", 1196 inst.loongson3_lscsr_format.fr, vcpu->arch.gprs[rs], curr_pc); 1197 er = EMULATE_FAIL; 1198 break; 1199 } 1200 1201 /* Rollback PC only if emulation was unsuccessful */ 1202 if (er == EMULATE_FAIL) { 1203 kvm_err("[%#lx]%s: unsupported lwc2 instruction 0x%08x 0x%08x\n", 1204 curr_pc, __func__, inst.word, inst.loongson3_lscsr_format.fr); 1205 1206 vcpu->arch.pc = curr_pc; 1207 } 1208 1209 return er; 1210 } 1211 #endif 1212 1213 static enum emulation_result kvm_trap_vz_handle_gpsi(u32 cause, u32 *opc, 1214 struct kvm_vcpu *vcpu) 1215 { 1216 enum emulation_result er = EMULATE_DONE; 1217 struct kvm_vcpu_arch *arch = &vcpu->arch; 1218 union mips_instruction inst; 1219 int rd, rt, sel; 1220 int err; 1221 1222 /* 1223 * Fetch the instruction. 1224 */ 1225 if (cause & CAUSEF_BD) 1226 opc += 1; 1227 err = kvm_get_badinstr(opc, vcpu, &inst.word); 1228 if (err) 1229 return EMULATE_FAIL; 1230 1231 switch (inst.r_format.opcode) { 1232 case cop0_op: 1233 er = kvm_vz_gpsi_cop0(inst, opc, cause, vcpu); 1234 break; 1235 #ifndef CONFIG_CPU_MIPSR6 1236 case cache_op: 1237 trace_kvm_exit(vcpu, KVM_TRACE_EXIT_CACHE); 1238 er = kvm_vz_gpsi_cache(inst, opc, cause, vcpu); 1239 break; 1240 #endif 1241 #ifdef CONFIG_CPU_LOONGSON64 1242 case lwc2_op: 1243 er = kvm_vz_gpsi_lwc2(inst, opc, cause, run, vcpu); 1244 break; 1245 #endif 1246 case spec3_op: 1247 switch (inst.spec3_format.func) { 1248 #ifdef CONFIG_CPU_MIPSR6 1249 case cache6_op: 1250 trace_kvm_exit(vcpu, KVM_TRACE_EXIT_CACHE); 1251 er = kvm_vz_gpsi_cache(inst, opc, cause, vcpu); 1252 break; 1253 #endif 1254 case rdhwr_op: 1255 if (inst.r_format.rs || (inst.r_format.re >> 3)) 1256 goto unknown; 1257 1258 rd = inst.r_format.rd; 1259 rt = inst.r_format.rt; 1260 sel = inst.r_format.re & 0x7; 1261 1262 switch (rd) { 1263 case MIPS_HWR_CC: /* Read count register */ 1264 arch->gprs[rt] = 1265 (long)(int)kvm_mips_read_count(vcpu); 1266 break; 1267 default: 1268 trace_kvm_hwr(vcpu, KVM_TRACE_RDHWR, 1269 KVM_TRACE_HWR(rd, sel), 0); 1270 goto unknown; 1271 } 1272 1273 trace_kvm_hwr(vcpu, KVM_TRACE_RDHWR, 1274 KVM_TRACE_HWR(rd, sel), arch->gprs[rt]); 1275 1276 er = update_pc(vcpu, cause); 1277 break; 1278 default: 1279 goto unknown; 1280 } 1281 break; 1282 unknown: 1283 1284 default: 1285 kvm_err("GPSI exception not supported (%p/%#x)\n", 1286 opc, inst.word); 1287 kvm_arch_vcpu_dump_regs(vcpu); 1288 er = EMULATE_FAIL; 1289 break; 1290 } 1291 1292 return er; 1293 } 1294 1295 static enum emulation_result kvm_trap_vz_handle_gsfc(u32 cause, u32 *opc, 1296 struct kvm_vcpu *vcpu) 1297 { 1298 enum emulation_result er = EMULATE_DONE; 1299 struct kvm_vcpu_arch *arch = &vcpu->arch; 1300 union mips_instruction inst; 1301 int err; 1302 1303 /* 1304 * Fetch the instruction. 1305 */ 1306 if (cause & CAUSEF_BD) 1307 opc += 1; 1308 err = kvm_get_badinstr(opc, vcpu, &inst.word); 1309 if (err) 1310 return EMULATE_FAIL; 1311 1312 /* complete MTC0 on behalf of guest and advance EPC */ 1313 if (inst.c0r_format.opcode == cop0_op && 1314 inst.c0r_format.rs == mtc_op && 1315 inst.c0r_format.z == 0) { 1316 int rt = inst.c0r_format.rt; 1317 int rd = inst.c0r_format.rd; 1318 int sel = inst.c0r_format.sel; 1319 unsigned int val = arch->gprs[rt]; 1320 unsigned int old_val, change; 1321 1322 trace_kvm_hwr(vcpu, KVM_TRACE_MTC0, KVM_TRACE_COP0(rd, sel), 1323 val); 1324 1325 if ((rd == MIPS_CP0_STATUS) && (sel == 0)) { 1326 /* FR bit should read as zero if no FPU */ 1327 if (!kvm_mips_guest_has_fpu(&vcpu->arch)) 1328 val &= ~(ST0_CU1 | ST0_FR); 1329 1330 /* 1331 * Also don't allow FR to be set if host doesn't support 1332 * it. 1333 */ 1334 if (!(boot_cpu_data.fpu_id & MIPS_FPIR_F64)) 1335 val &= ~ST0_FR; 1336 1337 old_val = read_gc0_status(); 1338 change = val ^ old_val; 1339 1340 if (change & ST0_FR) { 1341 /* 1342 * FPU and Vector register state is made 1343 * UNPREDICTABLE by a change of FR, so don't 1344 * even bother saving it. 1345 */ 1346 kvm_drop_fpu(vcpu); 1347 } 1348 1349 /* 1350 * If MSA state is already live, it is undefined how it 1351 * interacts with FR=0 FPU state, and we don't want to 1352 * hit reserved instruction exceptions trying to save 1353 * the MSA state later when CU=1 && FR=1, so play it 1354 * safe and save it first. 1355 */ 1356 if (change & ST0_CU1 && !(val & ST0_FR) && 1357 vcpu->arch.aux_inuse & KVM_MIPS_AUX_MSA) 1358 kvm_lose_fpu(vcpu); 1359 1360 write_gc0_status(val); 1361 } else if ((rd == MIPS_CP0_CAUSE) && (sel == 0)) { 1362 u32 old_cause = read_gc0_cause(); 1363 u32 change = old_cause ^ val; 1364 1365 /* DC bit enabling/disabling timer? */ 1366 if (change & CAUSEF_DC) { 1367 if (val & CAUSEF_DC) { 1368 kvm_vz_lose_htimer(vcpu); 1369 kvm_mips_count_disable_cause(vcpu); 1370 } else { 1371 kvm_mips_count_enable_cause(vcpu); 1372 } 1373 } 1374 1375 /* Only certain bits are RW to the guest */ 1376 change &= (CAUSEF_DC | CAUSEF_IV | CAUSEF_WP | 1377 CAUSEF_IP0 | CAUSEF_IP1); 1378 1379 /* WP can only be cleared */ 1380 change &= ~CAUSEF_WP | old_cause; 1381 1382 write_gc0_cause(old_cause ^ change); 1383 } else if ((rd == MIPS_CP0_STATUS) && (sel == 1)) { /* IntCtl */ 1384 write_gc0_intctl(val); 1385 } else if ((rd == MIPS_CP0_CONFIG) && (sel == 5)) { 1386 old_val = read_gc0_config5(); 1387 change = val ^ old_val; 1388 /* Handle changes in FPU/MSA modes */ 1389 preempt_disable(); 1390 1391 /* 1392 * Propagate FRE changes immediately if the FPU 1393 * context is already loaded. 1394 */ 1395 if (change & MIPS_CONF5_FRE && 1396 vcpu->arch.aux_inuse & KVM_MIPS_AUX_FPU) 1397 change_c0_config5(MIPS_CONF5_FRE, val); 1398 1399 preempt_enable(); 1400 1401 val = old_val ^ 1402 (change & kvm_vz_config5_guest_wrmask(vcpu)); 1403 write_gc0_config5(val); 1404 } else { 1405 kvm_err("Handle GSFC, unsupported field change @ %p: %#x\n", 1406 opc, inst.word); 1407 er = EMULATE_FAIL; 1408 } 1409 1410 if (er != EMULATE_FAIL) 1411 er = update_pc(vcpu, cause); 1412 } else { 1413 kvm_err("Handle GSFC, unrecognized instruction @ %p: %#x\n", 1414 opc, inst.word); 1415 er = EMULATE_FAIL; 1416 } 1417 1418 return er; 1419 } 1420 1421 static enum emulation_result kvm_trap_vz_handle_ghfc(u32 cause, u32 *opc, 1422 struct kvm_vcpu *vcpu) 1423 { 1424 /* 1425 * Presumably this is due to MC (guest mode change), so lets trace some 1426 * relevant info. 1427 */ 1428 trace_kvm_guest_mode_change(vcpu); 1429 1430 return EMULATE_DONE; 1431 } 1432 1433 static enum emulation_result kvm_trap_vz_handle_hc(u32 cause, u32 *opc, 1434 struct kvm_vcpu *vcpu) 1435 { 1436 enum emulation_result er; 1437 union mips_instruction inst; 1438 unsigned long curr_pc; 1439 int err; 1440 1441 if (cause & CAUSEF_BD) 1442 opc += 1; 1443 err = kvm_get_badinstr(opc, vcpu, &inst.word); 1444 if (err) 1445 return EMULATE_FAIL; 1446 1447 /* 1448 * Update PC and hold onto current PC in case there is 1449 * an error and we want to rollback the PC 1450 */ 1451 curr_pc = vcpu->arch.pc; 1452 er = update_pc(vcpu, cause); 1453 if (er == EMULATE_FAIL) 1454 return er; 1455 1456 er = kvm_mips_emul_hypcall(vcpu, inst); 1457 if (er == EMULATE_FAIL) 1458 vcpu->arch.pc = curr_pc; 1459 1460 return er; 1461 } 1462 1463 static enum emulation_result kvm_trap_vz_no_handler_guest_exit(u32 gexccode, 1464 u32 cause, 1465 u32 *opc, 1466 struct kvm_vcpu *vcpu) 1467 { 1468 u32 inst; 1469 1470 /* 1471 * Fetch the instruction. 1472 */ 1473 if (cause & CAUSEF_BD) 1474 opc += 1; 1475 kvm_get_badinstr(opc, vcpu, &inst); 1476 1477 kvm_err("Guest Exception Code: %d not yet handled @ PC: %p, inst: 0x%08x Status: %#x\n", 1478 gexccode, opc, inst, read_gc0_status()); 1479 1480 return EMULATE_FAIL; 1481 } 1482 1483 static int kvm_trap_vz_handle_guest_exit(struct kvm_vcpu *vcpu) 1484 { 1485 u32 *opc = (u32 *) vcpu->arch.pc; 1486 u32 cause = vcpu->arch.host_cp0_cause; 1487 enum emulation_result er = EMULATE_DONE; 1488 u32 gexccode = (vcpu->arch.host_cp0_guestctl0 & 1489 MIPS_GCTL0_GEXC) >> MIPS_GCTL0_GEXC_SHIFT; 1490 int ret = RESUME_GUEST; 1491 1492 trace_kvm_exit(vcpu, KVM_TRACE_EXIT_GEXCCODE_BASE + gexccode); 1493 switch (gexccode) { 1494 case MIPS_GCTL0_GEXC_GPSI: 1495 ++vcpu->stat.vz_gpsi_exits; 1496 er = kvm_trap_vz_handle_gpsi(cause, opc, vcpu); 1497 break; 1498 case MIPS_GCTL0_GEXC_GSFC: 1499 ++vcpu->stat.vz_gsfc_exits; 1500 er = kvm_trap_vz_handle_gsfc(cause, opc, vcpu); 1501 break; 1502 case MIPS_GCTL0_GEXC_HC: 1503 ++vcpu->stat.vz_hc_exits; 1504 er = kvm_trap_vz_handle_hc(cause, opc, vcpu); 1505 break; 1506 case MIPS_GCTL0_GEXC_GRR: 1507 ++vcpu->stat.vz_grr_exits; 1508 er = kvm_trap_vz_no_handler_guest_exit(gexccode, cause, opc, 1509 vcpu); 1510 break; 1511 case MIPS_GCTL0_GEXC_GVA: 1512 ++vcpu->stat.vz_gva_exits; 1513 er = kvm_trap_vz_no_handler_guest_exit(gexccode, cause, opc, 1514 vcpu); 1515 break; 1516 case MIPS_GCTL0_GEXC_GHFC: 1517 ++vcpu->stat.vz_ghfc_exits; 1518 er = kvm_trap_vz_handle_ghfc(cause, opc, vcpu); 1519 break; 1520 case MIPS_GCTL0_GEXC_GPA: 1521 ++vcpu->stat.vz_gpa_exits; 1522 er = kvm_trap_vz_no_handler_guest_exit(gexccode, cause, opc, 1523 vcpu); 1524 break; 1525 default: 1526 ++vcpu->stat.vz_resvd_exits; 1527 er = kvm_trap_vz_no_handler_guest_exit(gexccode, cause, opc, 1528 vcpu); 1529 break; 1530 1531 } 1532 1533 if (er == EMULATE_DONE) { 1534 ret = RESUME_GUEST; 1535 } else if (er == EMULATE_HYPERCALL) { 1536 ret = kvm_mips_handle_hypcall(vcpu); 1537 } else { 1538 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1539 ret = RESUME_HOST; 1540 } 1541 return ret; 1542 } 1543 1544 /** 1545 * kvm_trap_vz_handle_cop_unusuable() - Guest used unusable coprocessor. 1546 * @vcpu: Virtual CPU context. 1547 * 1548 * Handle when the guest attempts to use a coprocessor which hasn't been allowed 1549 * by the root context. 1550 */ 1551 static int kvm_trap_vz_handle_cop_unusable(struct kvm_vcpu *vcpu) 1552 { 1553 u32 cause = vcpu->arch.host_cp0_cause; 1554 enum emulation_result er = EMULATE_FAIL; 1555 int ret = RESUME_GUEST; 1556 1557 if (((cause & CAUSEF_CE) >> CAUSEB_CE) == 1) { 1558 /* 1559 * If guest FPU not present, the FPU operation should have been 1560 * treated as a reserved instruction! 1561 * If FPU already in use, we shouldn't get this at all. 1562 */ 1563 if (WARN_ON(!kvm_mips_guest_has_fpu(&vcpu->arch) || 1564 vcpu->arch.aux_inuse & KVM_MIPS_AUX_FPU)) { 1565 preempt_enable(); 1566 return EMULATE_FAIL; 1567 } 1568 1569 kvm_own_fpu(vcpu); 1570 er = EMULATE_DONE; 1571 } 1572 /* other coprocessors not handled */ 1573 1574 switch (er) { 1575 case EMULATE_DONE: 1576 ret = RESUME_GUEST; 1577 break; 1578 1579 case EMULATE_FAIL: 1580 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1581 ret = RESUME_HOST; 1582 break; 1583 1584 default: 1585 BUG(); 1586 } 1587 return ret; 1588 } 1589 1590 /** 1591 * kvm_trap_vz_handle_msa_disabled() - Guest used MSA while disabled in root. 1592 * @vcpu: Virtual CPU context. 1593 * 1594 * Handle when the guest attempts to use MSA when it is disabled in the root 1595 * context. 1596 */ 1597 static int kvm_trap_vz_handle_msa_disabled(struct kvm_vcpu *vcpu) 1598 { 1599 /* 1600 * If MSA not present or not exposed to guest or FR=0, the MSA operation 1601 * should have been treated as a reserved instruction! 1602 * Same if CU1=1, FR=0. 1603 * If MSA already in use, we shouldn't get this at all. 1604 */ 1605 if (!kvm_mips_guest_has_msa(&vcpu->arch) || 1606 (read_gc0_status() & (ST0_CU1 | ST0_FR)) == ST0_CU1 || 1607 !(read_gc0_config5() & MIPS_CONF5_MSAEN) || 1608 vcpu->arch.aux_inuse & KVM_MIPS_AUX_MSA) { 1609 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1610 return RESUME_HOST; 1611 } 1612 1613 kvm_own_msa(vcpu); 1614 1615 return RESUME_GUEST; 1616 } 1617 1618 static int kvm_trap_vz_handle_tlb_ld_miss(struct kvm_vcpu *vcpu) 1619 { 1620 struct kvm_run *run = vcpu->run; 1621 u32 *opc = (u32 *) vcpu->arch.pc; 1622 u32 cause = vcpu->arch.host_cp0_cause; 1623 ulong badvaddr = vcpu->arch.host_cp0_badvaddr; 1624 union mips_instruction inst; 1625 enum emulation_result er = EMULATE_DONE; 1626 int err, ret = RESUME_GUEST; 1627 1628 if (kvm_mips_handle_vz_root_tlb_fault(badvaddr, vcpu, false)) { 1629 /* A code fetch fault doesn't count as an MMIO */ 1630 if (kvm_is_ifetch_fault(&vcpu->arch)) { 1631 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1632 return RESUME_HOST; 1633 } 1634 1635 /* Fetch the instruction */ 1636 if (cause & CAUSEF_BD) 1637 opc += 1; 1638 err = kvm_get_badinstr(opc, vcpu, &inst.word); 1639 if (err) { 1640 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1641 return RESUME_HOST; 1642 } 1643 1644 /* Treat as MMIO */ 1645 er = kvm_mips_emulate_load(inst, cause, vcpu); 1646 if (er == EMULATE_FAIL) { 1647 kvm_err("Guest Emulate Load from MMIO space failed: PC: %p, BadVaddr: %#lx\n", 1648 opc, badvaddr); 1649 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1650 } 1651 } 1652 1653 if (er == EMULATE_DONE) { 1654 ret = RESUME_GUEST; 1655 } else if (er == EMULATE_DO_MMIO) { 1656 run->exit_reason = KVM_EXIT_MMIO; 1657 ret = RESUME_HOST; 1658 } else { 1659 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1660 ret = RESUME_HOST; 1661 } 1662 return ret; 1663 } 1664 1665 static int kvm_trap_vz_handle_tlb_st_miss(struct kvm_vcpu *vcpu) 1666 { 1667 struct kvm_run *run = vcpu->run; 1668 u32 *opc = (u32 *) vcpu->arch.pc; 1669 u32 cause = vcpu->arch.host_cp0_cause; 1670 ulong badvaddr = vcpu->arch.host_cp0_badvaddr; 1671 union mips_instruction inst; 1672 enum emulation_result er = EMULATE_DONE; 1673 int err; 1674 int ret = RESUME_GUEST; 1675 1676 /* Just try the access again if we couldn't do the translation */ 1677 if (kvm_vz_badvaddr_to_gpa(vcpu, badvaddr, &badvaddr)) 1678 return RESUME_GUEST; 1679 vcpu->arch.host_cp0_badvaddr = badvaddr; 1680 1681 if (kvm_mips_handle_vz_root_tlb_fault(badvaddr, vcpu, true)) { 1682 /* Fetch the instruction */ 1683 if (cause & CAUSEF_BD) 1684 opc += 1; 1685 err = kvm_get_badinstr(opc, vcpu, &inst.word); 1686 if (err) { 1687 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1688 return RESUME_HOST; 1689 } 1690 1691 /* Treat as MMIO */ 1692 er = kvm_mips_emulate_store(inst, cause, vcpu); 1693 if (er == EMULATE_FAIL) { 1694 kvm_err("Guest Emulate Store to MMIO space failed: PC: %p, BadVaddr: %#lx\n", 1695 opc, badvaddr); 1696 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1697 } 1698 } 1699 1700 if (er == EMULATE_DONE) { 1701 ret = RESUME_GUEST; 1702 } else if (er == EMULATE_DO_MMIO) { 1703 run->exit_reason = KVM_EXIT_MMIO; 1704 ret = RESUME_HOST; 1705 } else { 1706 run->exit_reason = KVM_EXIT_INTERNAL_ERROR; 1707 ret = RESUME_HOST; 1708 } 1709 return ret; 1710 } 1711 1712 static u64 kvm_vz_get_one_regs[] = { 1713 KVM_REG_MIPS_CP0_INDEX, 1714 KVM_REG_MIPS_CP0_ENTRYLO0, 1715 KVM_REG_MIPS_CP0_ENTRYLO1, 1716 KVM_REG_MIPS_CP0_CONTEXT, 1717 KVM_REG_MIPS_CP0_PAGEMASK, 1718 KVM_REG_MIPS_CP0_PAGEGRAIN, 1719 KVM_REG_MIPS_CP0_WIRED, 1720 KVM_REG_MIPS_CP0_HWRENA, 1721 KVM_REG_MIPS_CP0_BADVADDR, 1722 KVM_REG_MIPS_CP0_COUNT, 1723 KVM_REG_MIPS_CP0_ENTRYHI, 1724 KVM_REG_MIPS_CP0_COMPARE, 1725 KVM_REG_MIPS_CP0_STATUS, 1726 KVM_REG_MIPS_CP0_INTCTL, 1727 KVM_REG_MIPS_CP0_CAUSE, 1728 KVM_REG_MIPS_CP0_EPC, 1729 KVM_REG_MIPS_CP0_PRID, 1730 KVM_REG_MIPS_CP0_EBASE, 1731 KVM_REG_MIPS_CP0_CONFIG, 1732 KVM_REG_MIPS_CP0_CONFIG1, 1733 KVM_REG_MIPS_CP0_CONFIG2, 1734 KVM_REG_MIPS_CP0_CONFIG3, 1735 KVM_REG_MIPS_CP0_CONFIG4, 1736 KVM_REG_MIPS_CP0_CONFIG5, 1737 KVM_REG_MIPS_CP0_CONFIG6, 1738 #ifdef CONFIG_64BIT 1739 KVM_REG_MIPS_CP0_XCONTEXT, 1740 #endif 1741 KVM_REG_MIPS_CP0_ERROREPC, 1742 1743 KVM_REG_MIPS_COUNT_CTL, 1744 KVM_REG_MIPS_COUNT_RESUME, 1745 KVM_REG_MIPS_COUNT_HZ, 1746 }; 1747 1748 static u64 kvm_vz_get_one_regs_contextconfig[] = { 1749 KVM_REG_MIPS_CP0_CONTEXTCONFIG, 1750 #ifdef CONFIG_64BIT 1751 KVM_REG_MIPS_CP0_XCONTEXTCONFIG, 1752 #endif 1753 }; 1754 1755 static u64 kvm_vz_get_one_regs_segments[] = { 1756 KVM_REG_MIPS_CP0_SEGCTL0, 1757 KVM_REG_MIPS_CP0_SEGCTL1, 1758 KVM_REG_MIPS_CP0_SEGCTL2, 1759 }; 1760 1761 static u64 kvm_vz_get_one_regs_htw[] = { 1762 KVM_REG_MIPS_CP0_PWBASE, 1763 KVM_REG_MIPS_CP0_PWFIELD, 1764 KVM_REG_MIPS_CP0_PWSIZE, 1765 KVM_REG_MIPS_CP0_PWCTL, 1766 }; 1767 1768 static u64 kvm_vz_get_one_regs_kscratch[] = { 1769 KVM_REG_MIPS_CP0_KSCRATCH1, 1770 KVM_REG_MIPS_CP0_KSCRATCH2, 1771 KVM_REG_MIPS_CP0_KSCRATCH3, 1772 KVM_REG_MIPS_CP0_KSCRATCH4, 1773 KVM_REG_MIPS_CP0_KSCRATCH5, 1774 KVM_REG_MIPS_CP0_KSCRATCH6, 1775 }; 1776 1777 static unsigned long kvm_vz_num_regs(struct kvm_vcpu *vcpu) 1778 { 1779 unsigned long ret; 1780 1781 ret = ARRAY_SIZE(kvm_vz_get_one_regs); 1782 if (cpu_guest_has_userlocal) 1783 ++ret; 1784 if (cpu_guest_has_badinstr) 1785 ++ret; 1786 if (cpu_guest_has_badinstrp) 1787 ++ret; 1788 if (cpu_guest_has_contextconfig) 1789 ret += ARRAY_SIZE(kvm_vz_get_one_regs_contextconfig); 1790 if (cpu_guest_has_segments) 1791 ret += ARRAY_SIZE(kvm_vz_get_one_regs_segments); 1792 if (cpu_guest_has_htw || cpu_guest_has_ldpte) 1793 ret += ARRAY_SIZE(kvm_vz_get_one_regs_htw); 1794 if (cpu_guest_has_maar && !cpu_guest_has_dyn_maar) 1795 ret += 1 + ARRAY_SIZE(vcpu->arch.maar); 1796 ret += __arch_hweight8(cpu_data[0].guest.kscratch_mask); 1797 1798 return ret; 1799 } 1800 1801 static int kvm_vz_copy_reg_indices(struct kvm_vcpu *vcpu, u64 __user *indices) 1802 { 1803 u64 index; 1804 unsigned int i; 1805 1806 if (copy_to_user(indices, kvm_vz_get_one_regs, 1807 sizeof(kvm_vz_get_one_regs))) 1808 return -EFAULT; 1809 indices += ARRAY_SIZE(kvm_vz_get_one_regs); 1810 1811 if (cpu_guest_has_userlocal) { 1812 index = KVM_REG_MIPS_CP0_USERLOCAL; 1813 if (copy_to_user(indices, &index, sizeof(index))) 1814 return -EFAULT; 1815 ++indices; 1816 } 1817 if (cpu_guest_has_badinstr) { 1818 index = KVM_REG_MIPS_CP0_BADINSTR; 1819 if (copy_to_user(indices, &index, sizeof(index))) 1820 return -EFAULT; 1821 ++indices; 1822 } 1823 if (cpu_guest_has_badinstrp) { 1824 index = KVM_REG_MIPS_CP0_BADINSTRP; 1825 if (copy_to_user(indices, &index, sizeof(index))) 1826 return -EFAULT; 1827 ++indices; 1828 } 1829 if (cpu_guest_has_contextconfig) { 1830 if (copy_to_user(indices, kvm_vz_get_one_regs_contextconfig, 1831 sizeof(kvm_vz_get_one_regs_contextconfig))) 1832 return -EFAULT; 1833 indices += ARRAY_SIZE(kvm_vz_get_one_regs_contextconfig); 1834 } 1835 if (cpu_guest_has_segments) { 1836 if (copy_to_user(indices, kvm_vz_get_one_regs_segments, 1837 sizeof(kvm_vz_get_one_regs_segments))) 1838 return -EFAULT; 1839 indices += ARRAY_SIZE(kvm_vz_get_one_regs_segments); 1840 } 1841 if (cpu_guest_has_htw || cpu_guest_has_ldpte) { 1842 if (copy_to_user(indices, kvm_vz_get_one_regs_htw, 1843 sizeof(kvm_vz_get_one_regs_htw))) 1844 return -EFAULT; 1845 indices += ARRAY_SIZE(kvm_vz_get_one_regs_htw); 1846 } 1847 if (cpu_guest_has_maar && !cpu_guest_has_dyn_maar) { 1848 for (i = 0; i < ARRAY_SIZE(vcpu->arch.maar); ++i) { 1849 index = KVM_REG_MIPS_CP0_MAAR(i); 1850 if (copy_to_user(indices, &index, sizeof(index))) 1851 return -EFAULT; 1852 ++indices; 1853 } 1854 1855 index = KVM_REG_MIPS_CP0_MAARI; 1856 if (copy_to_user(indices, &index, sizeof(index))) 1857 return -EFAULT; 1858 ++indices; 1859 } 1860 for (i = 0; i < 6; ++i) { 1861 if (!cpu_guest_has_kscr(i + 2)) 1862 continue; 1863 1864 if (copy_to_user(indices, &kvm_vz_get_one_regs_kscratch[i], 1865 sizeof(kvm_vz_get_one_regs_kscratch[i]))) 1866 return -EFAULT; 1867 ++indices; 1868 } 1869 1870 return 0; 1871 } 1872 1873 static inline s64 entrylo_kvm_to_user(unsigned long v) 1874 { 1875 s64 mask, ret = v; 1876 1877 if (BITS_PER_LONG == 32) { 1878 /* 1879 * KVM API exposes 64-bit version of the register, so move the 1880 * RI/XI bits up into place. 1881 */ 1882 mask = MIPS_ENTRYLO_RI | MIPS_ENTRYLO_XI; 1883 ret &= ~mask; 1884 ret |= ((s64)v & mask) << 32; 1885 } 1886 return ret; 1887 } 1888 1889 static inline unsigned long entrylo_user_to_kvm(s64 v) 1890 { 1891 unsigned long mask, ret = v; 1892 1893 if (BITS_PER_LONG == 32) { 1894 /* 1895 * KVM API exposes 64-bit versiono of the register, so move the 1896 * RI/XI bits down into place. 1897 */ 1898 mask = MIPS_ENTRYLO_RI | MIPS_ENTRYLO_XI; 1899 ret &= ~mask; 1900 ret |= (v >> 32) & mask; 1901 } 1902 return ret; 1903 } 1904 1905 static int kvm_vz_get_one_reg(struct kvm_vcpu *vcpu, 1906 const struct kvm_one_reg *reg, 1907 s64 *v) 1908 { 1909 struct mips_coproc *cop0 = vcpu->arch.cop0; 1910 unsigned int idx; 1911 1912 switch (reg->id) { 1913 case KVM_REG_MIPS_CP0_INDEX: 1914 *v = (long)read_gc0_index(); 1915 break; 1916 case KVM_REG_MIPS_CP0_ENTRYLO0: 1917 *v = entrylo_kvm_to_user(read_gc0_entrylo0()); 1918 break; 1919 case KVM_REG_MIPS_CP0_ENTRYLO1: 1920 *v = entrylo_kvm_to_user(read_gc0_entrylo1()); 1921 break; 1922 case KVM_REG_MIPS_CP0_CONTEXT: 1923 *v = (long)read_gc0_context(); 1924 break; 1925 case KVM_REG_MIPS_CP0_CONTEXTCONFIG: 1926 if (!cpu_guest_has_contextconfig) 1927 return -EINVAL; 1928 *v = read_gc0_contextconfig(); 1929 break; 1930 case KVM_REG_MIPS_CP0_USERLOCAL: 1931 if (!cpu_guest_has_userlocal) 1932 return -EINVAL; 1933 *v = read_gc0_userlocal(); 1934 break; 1935 #ifdef CONFIG_64BIT 1936 case KVM_REG_MIPS_CP0_XCONTEXTCONFIG: 1937 if (!cpu_guest_has_contextconfig) 1938 return -EINVAL; 1939 *v = read_gc0_xcontextconfig(); 1940 break; 1941 #endif 1942 case KVM_REG_MIPS_CP0_PAGEMASK: 1943 *v = (long)read_gc0_pagemask(); 1944 break; 1945 case KVM_REG_MIPS_CP0_PAGEGRAIN: 1946 *v = (long)read_gc0_pagegrain(); 1947 break; 1948 case KVM_REG_MIPS_CP0_SEGCTL0: 1949 if (!cpu_guest_has_segments) 1950 return -EINVAL; 1951 *v = read_gc0_segctl0(); 1952 break; 1953 case KVM_REG_MIPS_CP0_SEGCTL1: 1954 if (!cpu_guest_has_segments) 1955 return -EINVAL; 1956 *v = read_gc0_segctl1(); 1957 break; 1958 case KVM_REG_MIPS_CP0_SEGCTL2: 1959 if (!cpu_guest_has_segments) 1960 return -EINVAL; 1961 *v = read_gc0_segctl2(); 1962 break; 1963 case KVM_REG_MIPS_CP0_PWBASE: 1964 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 1965 return -EINVAL; 1966 *v = read_gc0_pwbase(); 1967 break; 1968 case KVM_REG_MIPS_CP0_PWFIELD: 1969 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 1970 return -EINVAL; 1971 *v = read_gc0_pwfield(); 1972 break; 1973 case KVM_REG_MIPS_CP0_PWSIZE: 1974 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 1975 return -EINVAL; 1976 *v = read_gc0_pwsize(); 1977 break; 1978 case KVM_REG_MIPS_CP0_WIRED: 1979 *v = (long)read_gc0_wired(); 1980 break; 1981 case KVM_REG_MIPS_CP0_PWCTL: 1982 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 1983 return -EINVAL; 1984 *v = read_gc0_pwctl(); 1985 break; 1986 case KVM_REG_MIPS_CP0_HWRENA: 1987 *v = (long)read_gc0_hwrena(); 1988 break; 1989 case KVM_REG_MIPS_CP0_BADVADDR: 1990 *v = (long)read_gc0_badvaddr(); 1991 break; 1992 case KVM_REG_MIPS_CP0_BADINSTR: 1993 if (!cpu_guest_has_badinstr) 1994 return -EINVAL; 1995 *v = read_gc0_badinstr(); 1996 break; 1997 case KVM_REG_MIPS_CP0_BADINSTRP: 1998 if (!cpu_guest_has_badinstrp) 1999 return -EINVAL; 2000 *v = read_gc0_badinstrp(); 2001 break; 2002 case KVM_REG_MIPS_CP0_COUNT: 2003 *v = kvm_mips_read_count(vcpu); 2004 break; 2005 case KVM_REG_MIPS_CP0_ENTRYHI: 2006 *v = (long)read_gc0_entryhi(); 2007 break; 2008 case KVM_REG_MIPS_CP0_COMPARE: 2009 *v = (long)read_gc0_compare(); 2010 break; 2011 case KVM_REG_MIPS_CP0_STATUS: 2012 *v = (long)read_gc0_status(); 2013 break; 2014 case KVM_REG_MIPS_CP0_INTCTL: 2015 *v = read_gc0_intctl(); 2016 break; 2017 case KVM_REG_MIPS_CP0_CAUSE: 2018 *v = (long)read_gc0_cause(); 2019 break; 2020 case KVM_REG_MIPS_CP0_EPC: 2021 *v = (long)read_gc0_epc(); 2022 break; 2023 case KVM_REG_MIPS_CP0_PRID: 2024 switch (boot_cpu_type()) { 2025 case CPU_CAVIUM_OCTEON3: 2026 /* Octeon III has a read-only guest.PRid */ 2027 *v = read_gc0_prid(); 2028 break; 2029 default: 2030 *v = (long)kvm_read_c0_guest_prid(cop0); 2031 break; 2032 } 2033 break; 2034 case KVM_REG_MIPS_CP0_EBASE: 2035 *v = kvm_vz_read_gc0_ebase(); 2036 break; 2037 case KVM_REG_MIPS_CP0_CONFIG: 2038 *v = read_gc0_config(); 2039 break; 2040 case KVM_REG_MIPS_CP0_CONFIG1: 2041 if (!cpu_guest_has_conf1) 2042 return -EINVAL; 2043 *v = read_gc0_config1(); 2044 break; 2045 case KVM_REG_MIPS_CP0_CONFIG2: 2046 if (!cpu_guest_has_conf2) 2047 return -EINVAL; 2048 *v = read_gc0_config2(); 2049 break; 2050 case KVM_REG_MIPS_CP0_CONFIG3: 2051 if (!cpu_guest_has_conf3) 2052 return -EINVAL; 2053 *v = read_gc0_config3(); 2054 break; 2055 case KVM_REG_MIPS_CP0_CONFIG4: 2056 if (!cpu_guest_has_conf4) 2057 return -EINVAL; 2058 *v = read_gc0_config4(); 2059 break; 2060 case KVM_REG_MIPS_CP0_CONFIG5: 2061 if (!cpu_guest_has_conf5) 2062 return -EINVAL; 2063 *v = read_gc0_config5(); 2064 break; 2065 case KVM_REG_MIPS_CP0_CONFIG6: 2066 *v = kvm_read_sw_gc0_config6(cop0); 2067 break; 2068 case KVM_REG_MIPS_CP0_MAAR(0) ... KVM_REG_MIPS_CP0_MAAR(0x3f): 2069 if (!cpu_guest_has_maar || cpu_guest_has_dyn_maar) 2070 return -EINVAL; 2071 idx = reg->id - KVM_REG_MIPS_CP0_MAAR(0); 2072 if (idx >= ARRAY_SIZE(vcpu->arch.maar)) 2073 return -EINVAL; 2074 *v = vcpu->arch.maar[idx]; 2075 break; 2076 case KVM_REG_MIPS_CP0_MAARI: 2077 if (!cpu_guest_has_maar || cpu_guest_has_dyn_maar) 2078 return -EINVAL; 2079 *v = kvm_read_sw_gc0_maari(vcpu->arch.cop0); 2080 break; 2081 #ifdef CONFIG_64BIT 2082 case KVM_REG_MIPS_CP0_XCONTEXT: 2083 *v = read_gc0_xcontext(); 2084 break; 2085 #endif 2086 case KVM_REG_MIPS_CP0_ERROREPC: 2087 *v = (long)read_gc0_errorepc(); 2088 break; 2089 case KVM_REG_MIPS_CP0_KSCRATCH1 ... KVM_REG_MIPS_CP0_KSCRATCH6: 2090 idx = reg->id - KVM_REG_MIPS_CP0_KSCRATCH1 + 2; 2091 if (!cpu_guest_has_kscr(idx)) 2092 return -EINVAL; 2093 switch (idx) { 2094 case 2: 2095 *v = (long)read_gc0_kscratch1(); 2096 break; 2097 case 3: 2098 *v = (long)read_gc0_kscratch2(); 2099 break; 2100 case 4: 2101 *v = (long)read_gc0_kscratch3(); 2102 break; 2103 case 5: 2104 *v = (long)read_gc0_kscratch4(); 2105 break; 2106 case 6: 2107 *v = (long)read_gc0_kscratch5(); 2108 break; 2109 case 7: 2110 *v = (long)read_gc0_kscratch6(); 2111 break; 2112 } 2113 break; 2114 case KVM_REG_MIPS_COUNT_CTL: 2115 *v = vcpu->arch.count_ctl; 2116 break; 2117 case KVM_REG_MIPS_COUNT_RESUME: 2118 *v = ktime_to_ns(vcpu->arch.count_resume); 2119 break; 2120 case KVM_REG_MIPS_COUNT_HZ: 2121 *v = vcpu->arch.count_hz; 2122 break; 2123 default: 2124 return -EINVAL; 2125 } 2126 return 0; 2127 } 2128 2129 static int kvm_vz_set_one_reg(struct kvm_vcpu *vcpu, 2130 const struct kvm_one_reg *reg, 2131 s64 v) 2132 { 2133 struct mips_coproc *cop0 = vcpu->arch.cop0; 2134 unsigned int idx; 2135 int ret = 0; 2136 unsigned int cur, change; 2137 2138 switch (reg->id) { 2139 case KVM_REG_MIPS_CP0_INDEX: 2140 write_gc0_index(v); 2141 break; 2142 case KVM_REG_MIPS_CP0_ENTRYLO0: 2143 write_gc0_entrylo0(entrylo_user_to_kvm(v)); 2144 break; 2145 case KVM_REG_MIPS_CP0_ENTRYLO1: 2146 write_gc0_entrylo1(entrylo_user_to_kvm(v)); 2147 break; 2148 case KVM_REG_MIPS_CP0_CONTEXT: 2149 write_gc0_context(v); 2150 break; 2151 case KVM_REG_MIPS_CP0_CONTEXTCONFIG: 2152 if (!cpu_guest_has_contextconfig) 2153 return -EINVAL; 2154 write_gc0_contextconfig(v); 2155 break; 2156 case KVM_REG_MIPS_CP0_USERLOCAL: 2157 if (!cpu_guest_has_userlocal) 2158 return -EINVAL; 2159 write_gc0_userlocal(v); 2160 break; 2161 #ifdef CONFIG_64BIT 2162 case KVM_REG_MIPS_CP0_XCONTEXTCONFIG: 2163 if (!cpu_guest_has_contextconfig) 2164 return -EINVAL; 2165 write_gc0_xcontextconfig(v); 2166 break; 2167 #endif 2168 case KVM_REG_MIPS_CP0_PAGEMASK: 2169 write_gc0_pagemask(v); 2170 break; 2171 case KVM_REG_MIPS_CP0_PAGEGRAIN: 2172 write_gc0_pagegrain(v); 2173 break; 2174 case KVM_REG_MIPS_CP0_SEGCTL0: 2175 if (!cpu_guest_has_segments) 2176 return -EINVAL; 2177 write_gc0_segctl0(v); 2178 break; 2179 case KVM_REG_MIPS_CP0_SEGCTL1: 2180 if (!cpu_guest_has_segments) 2181 return -EINVAL; 2182 write_gc0_segctl1(v); 2183 break; 2184 case KVM_REG_MIPS_CP0_SEGCTL2: 2185 if (!cpu_guest_has_segments) 2186 return -EINVAL; 2187 write_gc0_segctl2(v); 2188 break; 2189 case KVM_REG_MIPS_CP0_PWBASE: 2190 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 2191 return -EINVAL; 2192 write_gc0_pwbase(v); 2193 break; 2194 case KVM_REG_MIPS_CP0_PWFIELD: 2195 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 2196 return -EINVAL; 2197 write_gc0_pwfield(v); 2198 break; 2199 case KVM_REG_MIPS_CP0_PWSIZE: 2200 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 2201 return -EINVAL; 2202 write_gc0_pwsize(v); 2203 break; 2204 case KVM_REG_MIPS_CP0_WIRED: 2205 change_gc0_wired(MIPSR6_WIRED_WIRED, v); 2206 break; 2207 case KVM_REG_MIPS_CP0_PWCTL: 2208 if (!cpu_guest_has_htw && !cpu_guest_has_ldpte) 2209 return -EINVAL; 2210 write_gc0_pwctl(v); 2211 break; 2212 case KVM_REG_MIPS_CP0_HWRENA: 2213 write_gc0_hwrena(v); 2214 break; 2215 case KVM_REG_MIPS_CP0_BADVADDR: 2216 write_gc0_badvaddr(v); 2217 break; 2218 case KVM_REG_MIPS_CP0_BADINSTR: 2219 if (!cpu_guest_has_badinstr) 2220 return -EINVAL; 2221 write_gc0_badinstr(v); 2222 break; 2223 case KVM_REG_MIPS_CP0_BADINSTRP: 2224 if (!cpu_guest_has_badinstrp) 2225 return -EINVAL; 2226 write_gc0_badinstrp(v); 2227 break; 2228 case KVM_REG_MIPS_CP0_COUNT: 2229 kvm_mips_write_count(vcpu, v); 2230 break; 2231 case KVM_REG_MIPS_CP0_ENTRYHI: 2232 write_gc0_entryhi(v); 2233 break; 2234 case KVM_REG_MIPS_CP0_COMPARE: 2235 kvm_mips_write_compare(vcpu, v, false); 2236 break; 2237 case KVM_REG_MIPS_CP0_STATUS: 2238 write_gc0_status(v); 2239 break; 2240 case KVM_REG_MIPS_CP0_INTCTL: 2241 write_gc0_intctl(v); 2242 break; 2243 case KVM_REG_MIPS_CP0_CAUSE: 2244 /* 2245 * If the timer is stopped or started (DC bit) it must look 2246 * atomic with changes to the timer interrupt pending bit (TI). 2247 * A timer interrupt should not happen in between. 2248 */ 2249 if ((read_gc0_cause() ^ v) & CAUSEF_DC) { 2250 if (v & CAUSEF_DC) { 2251 /* disable timer first */ 2252 kvm_mips_count_disable_cause(vcpu); 2253 change_gc0_cause((u32)~CAUSEF_DC, v); 2254 } else { 2255 /* enable timer last */ 2256 change_gc0_cause((u32)~CAUSEF_DC, v); 2257 kvm_mips_count_enable_cause(vcpu); 2258 } 2259 } else { 2260 write_gc0_cause(v); 2261 } 2262 break; 2263 case KVM_REG_MIPS_CP0_EPC: 2264 write_gc0_epc(v); 2265 break; 2266 case KVM_REG_MIPS_CP0_PRID: 2267 switch (boot_cpu_type()) { 2268 case CPU_CAVIUM_OCTEON3: 2269 /* Octeon III has a guest.PRid, but its read-only */ 2270 break; 2271 default: 2272 kvm_write_c0_guest_prid(cop0, v); 2273 break; 2274 } 2275 break; 2276 case KVM_REG_MIPS_CP0_EBASE: 2277 kvm_vz_write_gc0_ebase(v); 2278 break; 2279 case KVM_REG_MIPS_CP0_CONFIG: 2280 cur = read_gc0_config(); 2281 change = (cur ^ v) & kvm_vz_config_user_wrmask(vcpu); 2282 if (change) { 2283 v = cur ^ change; 2284 write_gc0_config(v); 2285 } 2286 break; 2287 case KVM_REG_MIPS_CP0_CONFIG1: 2288 if (!cpu_guest_has_conf1) 2289 break; 2290 cur = read_gc0_config1(); 2291 change = (cur ^ v) & kvm_vz_config1_user_wrmask(vcpu); 2292 if (change) { 2293 v = cur ^ change; 2294 write_gc0_config1(v); 2295 } 2296 break; 2297 case KVM_REG_MIPS_CP0_CONFIG2: 2298 if (!cpu_guest_has_conf2) 2299 break; 2300 cur = read_gc0_config2(); 2301 change = (cur ^ v) & kvm_vz_config2_user_wrmask(vcpu); 2302 if (change) { 2303 v = cur ^ change; 2304 write_gc0_config2(v); 2305 } 2306 break; 2307 case KVM_REG_MIPS_CP0_CONFIG3: 2308 if (!cpu_guest_has_conf3) 2309 break; 2310 cur = read_gc0_config3(); 2311 change = (cur ^ v) & kvm_vz_config3_user_wrmask(vcpu); 2312 if (change) { 2313 v = cur ^ change; 2314 write_gc0_config3(v); 2315 } 2316 break; 2317 case KVM_REG_MIPS_CP0_CONFIG4: 2318 if (!cpu_guest_has_conf4) 2319 break; 2320 cur = read_gc0_config4(); 2321 change = (cur ^ v) & kvm_vz_config4_user_wrmask(vcpu); 2322 if (change) { 2323 v = cur ^ change; 2324 write_gc0_config4(v); 2325 } 2326 break; 2327 case KVM_REG_MIPS_CP0_CONFIG5: 2328 if (!cpu_guest_has_conf5) 2329 break; 2330 cur = read_gc0_config5(); 2331 change = (cur ^ v) & kvm_vz_config5_user_wrmask(vcpu); 2332 if (change) { 2333 v = cur ^ change; 2334 write_gc0_config5(v); 2335 } 2336 break; 2337 case KVM_REG_MIPS_CP0_CONFIG6: 2338 cur = kvm_read_sw_gc0_config6(cop0); 2339 change = (cur ^ v) & kvm_vz_config6_user_wrmask(vcpu); 2340 if (change) { 2341 v = cur ^ change; 2342 kvm_write_sw_gc0_config6(cop0, (int)v); 2343 } 2344 break; 2345 case KVM_REG_MIPS_CP0_MAAR(0) ... KVM_REG_MIPS_CP0_MAAR(0x3f): 2346 if (!cpu_guest_has_maar || cpu_guest_has_dyn_maar) 2347 return -EINVAL; 2348 idx = reg->id - KVM_REG_MIPS_CP0_MAAR(0); 2349 if (idx >= ARRAY_SIZE(vcpu->arch.maar)) 2350 return -EINVAL; 2351 vcpu->arch.maar[idx] = mips_process_maar(dmtc_op, v); 2352 break; 2353 case KVM_REG_MIPS_CP0_MAARI: 2354 if (!cpu_guest_has_maar || cpu_guest_has_dyn_maar) 2355 return -EINVAL; 2356 kvm_write_maari(vcpu, v); 2357 break; 2358 #ifdef CONFIG_64BIT 2359 case KVM_REG_MIPS_CP0_XCONTEXT: 2360 write_gc0_xcontext(v); 2361 break; 2362 #endif 2363 case KVM_REG_MIPS_CP0_ERROREPC: 2364 write_gc0_errorepc(v); 2365 break; 2366 case KVM_REG_MIPS_CP0_KSCRATCH1 ... KVM_REG_MIPS_CP0_KSCRATCH6: 2367 idx = reg->id - KVM_REG_MIPS_CP0_KSCRATCH1 + 2; 2368 if (!cpu_guest_has_kscr(idx)) 2369 return -EINVAL; 2370 switch (idx) { 2371 case 2: 2372 write_gc0_kscratch1(v); 2373 break; 2374 case 3: 2375 write_gc0_kscratch2(v); 2376 break; 2377 case 4: 2378 write_gc0_kscratch3(v); 2379 break; 2380 case 5: 2381 write_gc0_kscratch4(v); 2382 break; 2383 case 6: 2384 write_gc0_kscratch5(v); 2385 break; 2386 case 7: 2387 write_gc0_kscratch6(v); 2388 break; 2389 } 2390 break; 2391 case KVM_REG_MIPS_COUNT_CTL: 2392 ret = kvm_mips_set_count_ctl(vcpu, v); 2393 break; 2394 case KVM_REG_MIPS_COUNT_RESUME: 2395 ret = kvm_mips_set_count_resume(vcpu, v); 2396 break; 2397 case KVM_REG_MIPS_COUNT_HZ: 2398 ret = kvm_mips_set_count_hz(vcpu, v); 2399 break; 2400 default: 2401 return -EINVAL; 2402 } 2403 return ret; 2404 } 2405 2406 #define guestid_cache(cpu) (cpu_data[cpu].guestid_cache) 2407 static void kvm_vz_get_new_guestid(unsigned long cpu, struct kvm_vcpu *vcpu) 2408 { 2409 unsigned long guestid = guestid_cache(cpu); 2410 2411 if (!(++guestid & GUESTID_MASK)) { 2412 if (cpu_has_vtag_icache) 2413 flush_icache_all(); 2414 2415 if (!guestid) /* fix version if needed */ 2416 guestid = GUESTID_FIRST_VERSION; 2417 2418 ++guestid; /* guestid 0 reserved for root */ 2419 2420 /* start new guestid cycle */ 2421 kvm_vz_local_flush_roottlb_all_guests(); 2422 kvm_vz_local_flush_guesttlb_all(); 2423 } 2424 2425 guestid_cache(cpu) = guestid; 2426 } 2427 2428 /* Returns 1 if the guest TLB may be clobbered */ 2429 static int kvm_vz_check_requests(struct kvm_vcpu *vcpu, int cpu) 2430 { 2431 int ret = 0; 2432 int i; 2433 2434 if (!kvm_request_pending(vcpu)) 2435 return 0; 2436 2437 if (kvm_check_request(KVM_REQ_TLB_FLUSH, vcpu)) { 2438 if (cpu_has_guestid) { 2439 /* Drop all GuestIDs for this VCPU */ 2440 for_each_possible_cpu(i) 2441 vcpu->arch.vzguestid[i] = 0; 2442 /* This will clobber guest TLB contents too */ 2443 ret = 1; 2444 } 2445 /* 2446 * For Root ASID Dealias (RAD) we don't do anything here, but we 2447 * still need the request to ensure we recheck asid_flush_mask. 2448 * We can still return 0 as only the root TLB will be affected 2449 * by a root ASID flush. 2450 */ 2451 } 2452 2453 return ret; 2454 } 2455 2456 static void kvm_vz_vcpu_save_wired(struct kvm_vcpu *vcpu) 2457 { 2458 unsigned int wired = read_gc0_wired(); 2459 struct kvm_mips_tlb *tlbs; 2460 int i; 2461 2462 /* Expand the wired TLB array if necessary */ 2463 wired &= MIPSR6_WIRED_WIRED; 2464 if (wired > vcpu->arch.wired_tlb_limit) { 2465 tlbs = krealloc(vcpu->arch.wired_tlb, wired * 2466 sizeof(*vcpu->arch.wired_tlb), GFP_ATOMIC); 2467 if (WARN_ON(!tlbs)) { 2468 /* Save whatever we can */ 2469 wired = vcpu->arch.wired_tlb_limit; 2470 } else { 2471 vcpu->arch.wired_tlb = tlbs; 2472 vcpu->arch.wired_tlb_limit = wired; 2473 } 2474 } 2475 2476 if (wired) 2477 /* Save wired entries from the guest TLB */ 2478 kvm_vz_save_guesttlb(vcpu->arch.wired_tlb, 0, wired); 2479 /* Invalidate any dropped entries since last time */ 2480 for (i = wired; i < vcpu->arch.wired_tlb_used; ++i) { 2481 vcpu->arch.wired_tlb[i].tlb_hi = UNIQUE_GUEST_ENTRYHI(i); 2482 vcpu->arch.wired_tlb[i].tlb_lo[0] = 0; 2483 vcpu->arch.wired_tlb[i].tlb_lo[1] = 0; 2484 vcpu->arch.wired_tlb[i].tlb_mask = 0; 2485 } 2486 vcpu->arch.wired_tlb_used = wired; 2487 } 2488 2489 static void kvm_vz_vcpu_load_wired(struct kvm_vcpu *vcpu) 2490 { 2491 /* Load wired entries into the guest TLB */ 2492 if (vcpu->arch.wired_tlb) 2493 kvm_vz_load_guesttlb(vcpu->arch.wired_tlb, 0, 2494 vcpu->arch.wired_tlb_used); 2495 } 2496 2497 static void kvm_vz_vcpu_load_tlb(struct kvm_vcpu *vcpu, int cpu) 2498 { 2499 struct kvm *kvm = vcpu->kvm; 2500 struct mm_struct *gpa_mm = &kvm->arch.gpa_mm; 2501 bool migrated; 2502 2503 /* 2504 * Are we entering guest context on a different CPU to last time? 2505 * If so, the VCPU's guest TLB state on this CPU may be stale. 2506 */ 2507 migrated = (vcpu->arch.last_exec_cpu != cpu); 2508 vcpu->arch.last_exec_cpu = cpu; 2509 2510 /* 2511 * A vcpu's GuestID is set in GuestCtl1.ID when the vcpu is loaded and 2512 * remains set until another vcpu is loaded in. As a rule GuestRID 2513 * remains zeroed when in root context unless the kernel is busy 2514 * manipulating guest tlb entries. 2515 */ 2516 if (cpu_has_guestid) { 2517 /* 2518 * Check if our GuestID is of an older version and thus invalid. 2519 * 2520 * We also discard the stored GuestID if we've executed on 2521 * another CPU, as the guest mappings may have changed without 2522 * hypervisor knowledge. 2523 */ 2524 if (migrated || 2525 (vcpu->arch.vzguestid[cpu] ^ guestid_cache(cpu)) & 2526 GUESTID_VERSION_MASK) { 2527 kvm_vz_get_new_guestid(cpu, vcpu); 2528 vcpu->arch.vzguestid[cpu] = guestid_cache(cpu); 2529 trace_kvm_guestid_change(vcpu, 2530 vcpu->arch.vzguestid[cpu]); 2531 } 2532 2533 /* Restore GuestID */ 2534 change_c0_guestctl1(GUESTID_MASK, vcpu->arch.vzguestid[cpu]); 2535 } else { 2536 /* 2537 * The Guest TLB only stores a single guest's TLB state, so 2538 * flush it if another VCPU has executed on this CPU. 2539 * 2540 * We also flush if we've executed on another CPU, as the guest 2541 * mappings may have changed without hypervisor knowledge. 2542 */ 2543 if (migrated || last_exec_vcpu[cpu] != vcpu) 2544 kvm_vz_local_flush_guesttlb_all(); 2545 last_exec_vcpu[cpu] = vcpu; 2546 2547 /* 2548 * Root ASID dealiases guest GPA mappings in the root TLB. 2549 * Allocate new root ASID if needed. 2550 */ 2551 if (cpumask_test_and_clear_cpu(cpu, &kvm->arch.asid_flush_mask)) 2552 get_new_mmu_context(gpa_mm); 2553 else 2554 check_mmu_context(gpa_mm); 2555 } 2556 } 2557 2558 static int kvm_vz_vcpu_load(struct kvm_vcpu *vcpu, int cpu) 2559 { 2560 struct mips_coproc *cop0 = vcpu->arch.cop0; 2561 bool migrated, all; 2562 2563 /* 2564 * Have we migrated to a different CPU? 2565 * If so, any old guest TLB state may be stale. 2566 */ 2567 migrated = (vcpu->arch.last_sched_cpu != cpu); 2568 2569 /* 2570 * Was this the last VCPU to run on this CPU? 2571 * If not, any old guest state from this VCPU will have been clobbered. 2572 */ 2573 all = migrated || (last_vcpu[cpu] != vcpu); 2574 last_vcpu[cpu] = vcpu; 2575 2576 /* 2577 * Restore CP0_Wired unconditionally as we clear it after use, and 2578 * restore wired guest TLB entries (while in guest context). 2579 */ 2580 kvm_restore_gc0_wired(cop0); 2581 if (current->flags & PF_VCPU) { 2582 tlbw_use_hazard(); 2583 kvm_vz_vcpu_load_tlb(vcpu, cpu); 2584 kvm_vz_vcpu_load_wired(vcpu); 2585 } 2586 2587 /* 2588 * Restore timer state regardless, as e.g. Cause.TI can change over time 2589 * if left unmaintained. 2590 */ 2591 kvm_vz_restore_timer(vcpu); 2592 2593 /* Set MC bit if we want to trace guest mode changes */ 2594 if (kvm_trace_guest_mode_change) 2595 set_c0_guestctl0(MIPS_GCTL0_MC); 2596 else 2597 clear_c0_guestctl0(MIPS_GCTL0_MC); 2598 2599 /* Don't bother restoring registers multiple times unless necessary */ 2600 if (!all) 2601 return 0; 2602 2603 /* 2604 * Restore config registers first, as some implementations restrict 2605 * writes to other registers when the corresponding feature bits aren't 2606 * set. For example Status.CU1 cannot be set unless Config1.FP is set. 2607 */ 2608 kvm_restore_gc0_config(cop0); 2609 if (cpu_guest_has_conf1) 2610 kvm_restore_gc0_config1(cop0); 2611 if (cpu_guest_has_conf2) 2612 kvm_restore_gc0_config2(cop0); 2613 if (cpu_guest_has_conf3) 2614 kvm_restore_gc0_config3(cop0); 2615 if (cpu_guest_has_conf4) 2616 kvm_restore_gc0_config4(cop0); 2617 if (cpu_guest_has_conf5) 2618 kvm_restore_gc0_config5(cop0); 2619 if (cpu_guest_has_conf6) 2620 kvm_restore_gc0_config6(cop0); 2621 if (cpu_guest_has_conf7) 2622 kvm_restore_gc0_config7(cop0); 2623 2624 kvm_restore_gc0_index(cop0); 2625 kvm_restore_gc0_entrylo0(cop0); 2626 kvm_restore_gc0_entrylo1(cop0); 2627 kvm_restore_gc0_context(cop0); 2628 if (cpu_guest_has_contextconfig) 2629 kvm_restore_gc0_contextconfig(cop0); 2630 #ifdef CONFIG_64BIT 2631 kvm_restore_gc0_xcontext(cop0); 2632 if (cpu_guest_has_contextconfig) 2633 kvm_restore_gc0_xcontextconfig(cop0); 2634 #endif 2635 kvm_restore_gc0_pagemask(cop0); 2636 kvm_restore_gc0_pagegrain(cop0); 2637 kvm_restore_gc0_hwrena(cop0); 2638 kvm_restore_gc0_badvaddr(cop0); 2639 kvm_restore_gc0_entryhi(cop0); 2640 kvm_restore_gc0_status(cop0); 2641 kvm_restore_gc0_intctl(cop0); 2642 kvm_restore_gc0_epc(cop0); 2643 kvm_vz_write_gc0_ebase(kvm_read_sw_gc0_ebase(cop0)); 2644 if (cpu_guest_has_userlocal) 2645 kvm_restore_gc0_userlocal(cop0); 2646 2647 kvm_restore_gc0_errorepc(cop0); 2648 2649 /* restore KScratch registers if enabled in guest */ 2650 if (cpu_guest_has_conf4) { 2651 if (cpu_guest_has_kscr(2)) 2652 kvm_restore_gc0_kscratch1(cop0); 2653 if (cpu_guest_has_kscr(3)) 2654 kvm_restore_gc0_kscratch2(cop0); 2655 if (cpu_guest_has_kscr(4)) 2656 kvm_restore_gc0_kscratch3(cop0); 2657 if (cpu_guest_has_kscr(5)) 2658 kvm_restore_gc0_kscratch4(cop0); 2659 if (cpu_guest_has_kscr(6)) 2660 kvm_restore_gc0_kscratch5(cop0); 2661 if (cpu_guest_has_kscr(7)) 2662 kvm_restore_gc0_kscratch6(cop0); 2663 } 2664 2665 if (cpu_guest_has_badinstr) 2666 kvm_restore_gc0_badinstr(cop0); 2667 if (cpu_guest_has_badinstrp) 2668 kvm_restore_gc0_badinstrp(cop0); 2669 2670 if (cpu_guest_has_segments) { 2671 kvm_restore_gc0_segctl0(cop0); 2672 kvm_restore_gc0_segctl1(cop0); 2673 kvm_restore_gc0_segctl2(cop0); 2674 } 2675 2676 /* restore HTW registers */ 2677 if (cpu_guest_has_htw || cpu_guest_has_ldpte) { 2678 kvm_restore_gc0_pwbase(cop0); 2679 kvm_restore_gc0_pwfield(cop0); 2680 kvm_restore_gc0_pwsize(cop0); 2681 kvm_restore_gc0_pwctl(cop0); 2682 } 2683 2684 /* restore Root.GuestCtl2 from unused Guest guestctl2 register */ 2685 if (cpu_has_guestctl2) 2686 write_c0_guestctl2( 2687 cop0->reg[MIPS_CP0_GUESTCTL2][MIPS_CP0_GUESTCTL2_SEL]); 2688 2689 /* 2690 * We should clear linked load bit to break interrupted atomics. This 2691 * prevents a SC on the next VCPU from succeeding by matching a LL on 2692 * the previous VCPU. 2693 */ 2694 if (vcpu->kvm->created_vcpus > 1) 2695 write_gc0_lladdr(0); 2696 2697 return 0; 2698 } 2699 2700 static int kvm_vz_vcpu_put(struct kvm_vcpu *vcpu, int cpu) 2701 { 2702 struct mips_coproc *cop0 = vcpu->arch.cop0; 2703 2704 if (current->flags & PF_VCPU) 2705 kvm_vz_vcpu_save_wired(vcpu); 2706 2707 kvm_lose_fpu(vcpu); 2708 2709 kvm_save_gc0_index(cop0); 2710 kvm_save_gc0_entrylo0(cop0); 2711 kvm_save_gc0_entrylo1(cop0); 2712 kvm_save_gc0_context(cop0); 2713 if (cpu_guest_has_contextconfig) 2714 kvm_save_gc0_contextconfig(cop0); 2715 #ifdef CONFIG_64BIT 2716 kvm_save_gc0_xcontext(cop0); 2717 if (cpu_guest_has_contextconfig) 2718 kvm_save_gc0_xcontextconfig(cop0); 2719 #endif 2720 kvm_save_gc0_pagemask(cop0); 2721 kvm_save_gc0_pagegrain(cop0); 2722 kvm_save_gc0_wired(cop0); 2723 /* allow wired TLB entries to be overwritten */ 2724 clear_gc0_wired(MIPSR6_WIRED_WIRED); 2725 kvm_save_gc0_hwrena(cop0); 2726 kvm_save_gc0_badvaddr(cop0); 2727 kvm_save_gc0_entryhi(cop0); 2728 kvm_save_gc0_status(cop0); 2729 kvm_save_gc0_intctl(cop0); 2730 kvm_save_gc0_epc(cop0); 2731 kvm_write_sw_gc0_ebase(cop0, kvm_vz_read_gc0_ebase()); 2732 if (cpu_guest_has_userlocal) 2733 kvm_save_gc0_userlocal(cop0); 2734 2735 /* only save implemented config registers */ 2736 kvm_save_gc0_config(cop0); 2737 if (cpu_guest_has_conf1) 2738 kvm_save_gc0_config1(cop0); 2739 if (cpu_guest_has_conf2) 2740 kvm_save_gc0_config2(cop0); 2741 if (cpu_guest_has_conf3) 2742 kvm_save_gc0_config3(cop0); 2743 if (cpu_guest_has_conf4) 2744 kvm_save_gc0_config4(cop0); 2745 if (cpu_guest_has_conf5) 2746 kvm_save_gc0_config5(cop0); 2747 if (cpu_guest_has_conf6) 2748 kvm_save_gc0_config6(cop0); 2749 if (cpu_guest_has_conf7) 2750 kvm_save_gc0_config7(cop0); 2751 2752 kvm_save_gc0_errorepc(cop0); 2753 2754 /* save KScratch registers if enabled in guest */ 2755 if (cpu_guest_has_conf4) { 2756 if (cpu_guest_has_kscr(2)) 2757 kvm_save_gc0_kscratch1(cop0); 2758 if (cpu_guest_has_kscr(3)) 2759 kvm_save_gc0_kscratch2(cop0); 2760 if (cpu_guest_has_kscr(4)) 2761 kvm_save_gc0_kscratch3(cop0); 2762 if (cpu_guest_has_kscr(5)) 2763 kvm_save_gc0_kscratch4(cop0); 2764 if (cpu_guest_has_kscr(6)) 2765 kvm_save_gc0_kscratch5(cop0); 2766 if (cpu_guest_has_kscr(7)) 2767 kvm_save_gc0_kscratch6(cop0); 2768 } 2769 2770 if (cpu_guest_has_badinstr) 2771 kvm_save_gc0_badinstr(cop0); 2772 if (cpu_guest_has_badinstrp) 2773 kvm_save_gc0_badinstrp(cop0); 2774 2775 if (cpu_guest_has_segments) { 2776 kvm_save_gc0_segctl0(cop0); 2777 kvm_save_gc0_segctl1(cop0); 2778 kvm_save_gc0_segctl2(cop0); 2779 } 2780 2781 /* save HTW registers if enabled in guest */ 2782 if (cpu_guest_has_ldpte || (cpu_guest_has_htw && 2783 kvm_read_sw_gc0_config3(cop0) & MIPS_CONF3_PW)) { 2784 kvm_save_gc0_pwbase(cop0); 2785 kvm_save_gc0_pwfield(cop0); 2786 kvm_save_gc0_pwsize(cop0); 2787 kvm_save_gc0_pwctl(cop0); 2788 } 2789 2790 kvm_vz_save_timer(vcpu); 2791 2792 /* save Root.GuestCtl2 in unused Guest guestctl2 register */ 2793 if (cpu_has_guestctl2) 2794 cop0->reg[MIPS_CP0_GUESTCTL2][MIPS_CP0_GUESTCTL2_SEL] = 2795 read_c0_guestctl2(); 2796 2797 return 0; 2798 } 2799 2800 /** 2801 * kvm_vz_resize_guest_vtlb() - Attempt to resize guest VTLB. 2802 * @size: Number of guest VTLB entries (0 < @size <= root VTLB entries). 2803 * 2804 * Attempt to resize the guest VTLB by writing guest Config registers. This is 2805 * necessary for cores with a shared root/guest TLB to avoid overlap with wired 2806 * entries in the root VTLB. 2807 * 2808 * Returns: The resulting guest VTLB size. 2809 */ 2810 static unsigned int kvm_vz_resize_guest_vtlb(unsigned int size) 2811 { 2812 unsigned int config4 = 0, ret = 0, limit; 2813 2814 /* Write MMUSize - 1 into guest Config registers */ 2815 if (cpu_guest_has_conf1) 2816 change_gc0_config1(MIPS_CONF1_TLBS, 2817 (size - 1) << MIPS_CONF1_TLBS_SHIFT); 2818 if (cpu_guest_has_conf4) { 2819 config4 = read_gc0_config4(); 2820 if (cpu_has_mips_r6 || (config4 & MIPS_CONF4_MMUEXTDEF) == 2821 MIPS_CONF4_MMUEXTDEF_VTLBSIZEEXT) { 2822 config4 &= ~MIPS_CONF4_VTLBSIZEEXT; 2823 config4 |= ((size - 1) >> MIPS_CONF1_TLBS_SIZE) << 2824 MIPS_CONF4_VTLBSIZEEXT_SHIFT; 2825 } else if ((config4 & MIPS_CONF4_MMUEXTDEF) == 2826 MIPS_CONF4_MMUEXTDEF_MMUSIZEEXT) { 2827 config4 &= ~MIPS_CONF4_MMUSIZEEXT; 2828 config4 |= ((size - 1) >> MIPS_CONF1_TLBS_SIZE) << 2829 MIPS_CONF4_MMUSIZEEXT_SHIFT; 2830 } 2831 write_gc0_config4(config4); 2832 } 2833 2834 /* 2835 * Set Guest.Wired.Limit = 0 (no limit up to Guest.MMUSize-1), unless it 2836 * would exceed Root.Wired.Limit (clearing Guest.Wired.Wired so write 2837 * not dropped) 2838 */ 2839 if (cpu_has_mips_r6) { 2840 limit = (read_c0_wired() & MIPSR6_WIRED_LIMIT) >> 2841 MIPSR6_WIRED_LIMIT_SHIFT; 2842 if (size - 1 <= limit) 2843 limit = 0; 2844 write_gc0_wired(limit << MIPSR6_WIRED_LIMIT_SHIFT); 2845 } 2846 2847 /* Read back MMUSize - 1 */ 2848 back_to_back_c0_hazard(); 2849 if (cpu_guest_has_conf1) 2850 ret = (read_gc0_config1() & MIPS_CONF1_TLBS) >> 2851 MIPS_CONF1_TLBS_SHIFT; 2852 if (config4) { 2853 if (cpu_has_mips_r6 || (config4 & MIPS_CONF4_MMUEXTDEF) == 2854 MIPS_CONF4_MMUEXTDEF_VTLBSIZEEXT) 2855 ret |= ((config4 & MIPS_CONF4_VTLBSIZEEXT) >> 2856 MIPS_CONF4_VTLBSIZEEXT_SHIFT) << 2857 MIPS_CONF1_TLBS_SIZE; 2858 else if ((config4 & MIPS_CONF4_MMUEXTDEF) == 2859 MIPS_CONF4_MMUEXTDEF_MMUSIZEEXT) 2860 ret |= ((config4 & MIPS_CONF4_MMUSIZEEXT) >> 2861 MIPS_CONF4_MMUSIZEEXT_SHIFT) << 2862 MIPS_CONF1_TLBS_SIZE; 2863 } 2864 return ret + 1; 2865 } 2866 2867 static int kvm_vz_hardware_enable(void) 2868 { 2869 unsigned int mmu_size, guest_mmu_size, ftlb_size; 2870 u64 guest_cvmctl, cvmvmconfig; 2871 2872 switch (current_cpu_type()) { 2873 case CPU_CAVIUM_OCTEON3: 2874 /* Set up guest timer/perfcount IRQ lines */ 2875 guest_cvmctl = read_gc0_cvmctl(); 2876 guest_cvmctl &= ~CVMCTL_IPTI; 2877 guest_cvmctl |= 7ull << CVMCTL_IPTI_SHIFT; 2878 guest_cvmctl &= ~CVMCTL_IPPCI; 2879 guest_cvmctl |= 6ull << CVMCTL_IPPCI_SHIFT; 2880 write_gc0_cvmctl(guest_cvmctl); 2881 2882 cvmvmconfig = read_c0_cvmvmconfig(); 2883 /* No I/O hole translation. */ 2884 cvmvmconfig |= CVMVMCONF_DGHT; 2885 /* Halve the root MMU size */ 2886 mmu_size = ((cvmvmconfig & CVMVMCONF_MMUSIZEM1) 2887 >> CVMVMCONF_MMUSIZEM1_S) + 1; 2888 guest_mmu_size = mmu_size / 2; 2889 mmu_size -= guest_mmu_size; 2890 cvmvmconfig &= ~CVMVMCONF_RMMUSIZEM1; 2891 cvmvmconfig |= mmu_size - 1; 2892 write_c0_cvmvmconfig(cvmvmconfig); 2893 2894 /* Update our records */ 2895 current_cpu_data.tlbsize = mmu_size; 2896 current_cpu_data.tlbsizevtlb = mmu_size; 2897 current_cpu_data.guest.tlbsize = guest_mmu_size; 2898 2899 /* Flush moved entries in new (guest) context */ 2900 kvm_vz_local_flush_guesttlb_all(); 2901 break; 2902 default: 2903 /* 2904 * ImgTec cores tend to use a shared root/guest TLB. To avoid 2905 * overlap of root wired and guest entries, the guest TLB may 2906 * need resizing. 2907 */ 2908 mmu_size = current_cpu_data.tlbsizevtlb; 2909 ftlb_size = current_cpu_data.tlbsize - mmu_size; 2910 2911 /* Try switching to maximum guest VTLB size for flush */ 2912 guest_mmu_size = kvm_vz_resize_guest_vtlb(mmu_size); 2913 current_cpu_data.guest.tlbsize = guest_mmu_size + ftlb_size; 2914 kvm_vz_local_flush_guesttlb_all(); 2915 2916 /* 2917 * Reduce to make space for root wired entries and at least 2 2918 * root non-wired entries. This does assume that long-term wired 2919 * entries won't be added later. 2920 */ 2921 guest_mmu_size = mmu_size - num_wired_entries() - 2; 2922 guest_mmu_size = kvm_vz_resize_guest_vtlb(guest_mmu_size); 2923 current_cpu_data.guest.tlbsize = guest_mmu_size + ftlb_size; 2924 2925 /* 2926 * Write the VTLB size, but if another CPU has already written, 2927 * check it matches or we won't provide a consistent view to the 2928 * guest. If this ever happens it suggests an asymmetric number 2929 * of wired entries. 2930 */ 2931 if (cmpxchg(&kvm_vz_guest_vtlb_size, 0, guest_mmu_size) && 2932 WARN(guest_mmu_size != kvm_vz_guest_vtlb_size, 2933 "Available guest VTLB size mismatch")) 2934 return -EINVAL; 2935 break; 2936 } 2937 2938 /* 2939 * Enable virtualization features granting guest direct control of 2940 * certain features: 2941 * CP0=1: Guest coprocessor 0 context. 2942 * AT=Guest: Guest MMU. 2943 * CG=1: Hit (virtual address) CACHE operations (optional). 2944 * CF=1: Guest Config registers. 2945 * CGI=1: Indexed flush CACHE operations (optional). 2946 */ 2947 write_c0_guestctl0(MIPS_GCTL0_CP0 | 2948 (MIPS_GCTL0_AT_GUEST << MIPS_GCTL0_AT_SHIFT) | 2949 MIPS_GCTL0_CG | MIPS_GCTL0_CF); 2950 if (cpu_has_guestctl0ext) { 2951 if (current_cpu_type() != CPU_LOONGSON64) 2952 set_c0_guestctl0ext(MIPS_GCTL0EXT_CGI); 2953 else 2954 clear_c0_guestctl0ext(MIPS_GCTL0EXT_CGI); 2955 } 2956 2957 if (cpu_has_guestid) { 2958 write_c0_guestctl1(0); 2959 kvm_vz_local_flush_roottlb_all_guests(); 2960 2961 GUESTID_MASK = current_cpu_data.guestid_mask; 2962 GUESTID_FIRST_VERSION = GUESTID_MASK + 1; 2963 GUESTID_VERSION_MASK = ~GUESTID_MASK; 2964 2965 current_cpu_data.guestid_cache = GUESTID_FIRST_VERSION; 2966 } 2967 2968 /* clear any pending injected virtual guest interrupts */ 2969 if (cpu_has_guestctl2) 2970 clear_c0_guestctl2(0x3f << 10); 2971 2972 #ifdef CONFIG_CPU_LOONGSON64 2973 /* Control guest CCA attribute */ 2974 if (cpu_has_csr()) 2975 csr_writel(csr_readl(0xffffffec) | 0x1, 0xffffffec); 2976 #endif 2977 2978 return 0; 2979 } 2980 2981 static void kvm_vz_hardware_disable(void) 2982 { 2983 u64 cvmvmconfig; 2984 unsigned int mmu_size; 2985 2986 /* Flush any remaining guest TLB entries */ 2987 kvm_vz_local_flush_guesttlb_all(); 2988 2989 switch (current_cpu_type()) { 2990 case CPU_CAVIUM_OCTEON3: 2991 /* 2992 * Allocate whole TLB for root. Existing guest TLB entries will 2993 * change ownership to the root TLB. We should be safe though as 2994 * they've already been flushed above while in guest TLB. 2995 */ 2996 cvmvmconfig = read_c0_cvmvmconfig(); 2997 mmu_size = ((cvmvmconfig & CVMVMCONF_MMUSIZEM1) 2998 >> CVMVMCONF_MMUSIZEM1_S) + 1; 2999 cvmvmconfig &= ~CVMVMCONF_RMMUSIZEM1; 3000 cvmvmconfig |= mmu_size - 1; 3001 write_c0_cvmvmconfig(cvmvmconfig); 3002 3003 /* Update our records */ 3004 current_cpu_data.tlbsize = mmu_size; 3005 current_cpu_data.tlbsizevtlb = mmu_size; 3006 current_cpu_data.guest.tlbsize = 0; 3007 3008 /* Flush moved entries in new (root) context */ 3009 local_flush_tlb_all(); 3010 break; 3011 } 3012 3013 if (cpu_has_guestid) { 3014 write_c0_guestctl1(0); 3015 kvm_vz_local_flush_roottlb_all_guests(); 3016 } 3017 } 3018 3019 static int kvm_vz_check_extension(struct kvm *kvm, long ext) 3020 { 3021 int r; 3022 3023 switch (ext) { 3024 case KVM_CAP_MIPS_VZ: 3025 /* we wouldn't be here unless cpu_has_vz */ 3026 r = 1; 3027 break; 3028 #ifdef CONFIG_64BIT 3029 case KVM_CAP_MIPS_64BIT: 3030 /* We support 64-bit registers/operations and addresses */ 3031 r = 2; 3032 break; 3033 #endif 3034 case KVM_CAP_IOEVENTFD: 3035 r = 1; 3036 break; 3037 default: 3038 r = 0; 3039 break; 3040 } 3041 3042 return r; 3043 } 3044 3045 static int kvm_vz_vcpu_init(struct kvm_vcpu *vcpu) 3046 { 3047 int i; 3048 3049 for_each_possible_cpu(i) 3050 vcpu->arch.vzguestid[i] = 0; 3051 3052 return 0; 3053 } 3054 3055 static void kvm_vz_vcpu_uninit(struct kvm_vcpu *vcpu) 3056 { 3057 int cpu; 3058 3059 /* 3060 * If the VCPU is freed and reused as another VCPU, we don't want the 3061 * matching pointer wrongly hanging around in last_vcpu[] or 3062 * last_exec_vcpu[]. 3063 */ 3064 for_each_possible_cpu(cpu) { 3065 if (last_vcpu[cpu] == vcpu) 3066 last_vcpu[cpu] = NULL; 3067 if (last_exec_vcpu[cpu] == vcpu) 3068 last_exec_vcpu[cpu] = NULL; 3069 } 3070 } 3071 3072 static int kvm_vz_vcpu_setup(struct kvm_vcpu *vcpu) 3073 { 3074 struct mips_coproc *cop0 = vcpu->arch.cop0; 3075 unsigned long count_hz = 100*1000*1000; /* default to 100 MHz */ 3076 3077 /* 3078 * Start off the timer at the same frequency as the host timer, but the 3079 * soft timer doesn't handle frequencies greater than 1GHz yet. 3080 */ 3081 if (mips_hpt_frequency && mips_hpt_frequency <= NSEC_PER_SEC) 3082 count_hz = mips_hpt_frequency; 3083 kvm_mips_init_count(vcpu, count_hz); 3084 3085 /* 3086 * Initialize guest register state to valid architectural reset state. 3087 */ 3088 3089 /* PageGrain */ 3090 if (cpu_has_mips_r5 || cpu_has_mips_r6) 3091 kvm_write_sw_gc0_pagegrain(cop0, PG_RIE | PG_XIE | PG_IEC); 3092 /* Wired */ 3093 if (cpu_has_mips_r6) 3094 kvm_write_sw_gc0_wired(cop0, 3095 read_gc0_wired() & MIPSR6_WIRED_LIMIT); 3096 /* Status */ 3097 kvm_write_sw_gc0_status(cop0, ST0_BEV | ST0_ERL); 3098 if (cpu_has_mips_r5 || cpu_has_mips_r6) 3099 kvm_change_sw_gc0_status(cop0, ST0_FR, read_gc0_status()); 3100 /* IntCtl */ 3101 kvm_write_sw_gc0_intctl(cop0, read_gc0_intctl() & 3102 (INTCTLF_IPFDC | INTCTLF_IPPCI | INTCTLF_IPTI)); 3103 /* PRId */ 3104 kvm_write_sw_gc0_prid(cop0, boot_cpu_data.processor_id); 3105 /* EBase */ 3106 kvm_write_sw_gc0_ebase(cop0, (s32)0x80000000 | vcpu->vcpu_id); 3107 /* Config */ 3108 kvm_save_gc0_config(cop0); 3109 /* architecturally writable (e.g. from guest) */ 3110 kvm_change_sw_gc0_config(cop0, CONF_CM_CMASK, 3111 _page_cachable_default >> _CACHE_SHIFT); 3112 /* architecturally read only, but maybe writable from root */ 3113 kvm_change_sw_gc0_config(cop0, MIPS_CONF_MT, read_c0_config()); 3114 if (cpu_guest_has_conf1) { 3115 kvm_set_sw_gc0_config(cop0, MIPS_CONF_M); 3116 /* Config1 */ 3117 kvm_save_gc0_config1(cop0); 3118 /* architecturally read only, but maybe writable from root */ 3119 kvm_clear_sw_gc0_config1(cop0, MIPS_CONF1_C2 | 3120 MIPS_CONF1_MD | 3121 MIPS_CONF1_PC | 3122 MIPS_CONF1_WR | 3123 MIPS_CONF1_CA | 3124 MIPS_CONF1_FP); 3125 } 3126 if (cpu_guest_has_conf2) { 3127 kvm_set_sw_gc0_config1(cop0, MIPS_CONF_M); 3128 /* Config2 */ 3129 kvm_save_gc0_config2(cop0); 3130 } 3131 if (cpu_guest_has_conf3) { 3132 kvm_set_sw_gc0_config2(cop0, MIPS_CONF_M); 3133 /* Config3 */ 3134 kvm_save_gc0_config3(cop0); 3135 /* architecturally writable (e.g. from guest) */ 3136 kvm_clear_sw_gc0_config3(cop0, MIPS_CONF3_ISA_OE); 3137 /* architecturally read only, but maybe writable from root */ 3138 kvm_clear_sw_gc0_config3(cop0, MIPS_CONF3_MSA | 3139 MIPS_CONF3_BPG | 3140 MIPS_CONF3_ULRI | 3141 MIPS_CONF3_DSP | 3142 MIPS_CONF3_CTXTC | 3143 MIPS_CONF3_ITL | 3144 MIPS_CONF3_LPA | 3145 MIPS_CONF3_VEIC | 3146 MIPS_CONF3_VINT | 3147 MIPS_CONF3_SP | 3148 MIPS_CONF3_CDMM | 3149 MIPS_CONF3_MT | 3150 MIPS_CONF3_SM | 3151 MIPS_CONF3_TL); 3152 } 3153 if (cpu_guest_has_conf4) { 3154 kvm_set_sw_gc0_config3(cop0, MIPS_CONF_M); 3155 /* Config4 */ 3156 kvm_save_gc0_config4(cop0); 3157 } 3158 if (cpu_guest_has_conf5) { 3159 kvm_set_sw_gc0_config4(cop0, MIPS_CONF_M); 3160 /* Config5 */ 3161 kvm_save_gc0_config5(cop0); 3162 /* architecturally writable (e.g. from guest) */ 3163 kvm_clear_sw_gc0_config5(cop0, MIPS_CONF5_K | 3164 MIPS_CONF5_CV | 3165 MIPS_CONF5_MSAEN | 3166 MIPS_CONF5_UFE | 3167 MIPS_CONF5_FRE | 3168 MIPS_CONF5_SBRI | 3169 MIPS_CONF5_UFR); 3170 /* architecturally read only, but maybe writable from root */ 3171 kvm_clear_sw_gc0_config5(cop0, MIPS_CONF5_MRP); 3172 } 3173 3174 if (cpu_guest_has_contextconfig) { 3175 /* ContextConfig */ 3176 kvm_write_sw_gc0_contextconfig(cop0, 0x007ffff0); 3177 #ifdef CONFIG_64BIT 3178 /* XContextConfig */ 3179 /* bits SEGBITS-13+3:4 set */ 3180 kvm_write_sw_gc0_xcontextconfig(cop0, 3181 ((1ull << (cpu_vmbits - 13)) - 1) << 4); 3182 #endif 3183 } 3184 3185 /* Implementation dependent, use the legacy layout */ 3186 if (cpu_guest_has_segments) { 3187 /* SegCtl0, SegCtl1, SegCtl2 */ 3188 kvm_write_sw_gc0_segctl0(cop0, 0x00200010); 3189 kvm_write_sw_gc0_segctl1(cop0, 0x00000002 | 3190 (_page_cachable_default >> _CACHE_SHIFT) << 3191 (16 + MIPS_SEGCFG_C_SHIFT)); 3192 kvm_write_sw_gc0_segctl2(cop0, 0x00380438); 3193 } 3194 3195 /* reset HTW registers */ 3196 if (cpu_guest_has_htw && (cpu_has_mips_r5 || cpu_has_mips_r6)) { 3197 /* PWField */ 3198 kvm_write_sw_gc0_pwfield(cop0, 0x0c30c302); 3199 /* PWSize */ 3200 kvm_write_sw_gc0_pwsize(cop0, 1 << MIPS_PWSIZE_PTW_SHIFT); 3201 } 3202 3203 /* start with no pending virtual guest interrupts */ 3204 if (cpu_has_guestctl2) 3205 cop0->reg[MIPS_CP0_GUESTCTL2][MIPS_CP0_GUESTCTL2_SEL] = 0; 3206 3207 /* Put PC at reset vector */ 3208 vcpu->arch.pc = CKSEG1ADDR(0x1fc00000); 3209 3210 return 0; 3211 } 3212 3213 static void kvm_vz_flush_shadow_all(struct kvm *kvm) 3214 { 3215 if (cpu_has_guestid) { 3216 /* Flush GuestID for each VCPU individually */ 3217 kvm_flush_remote_tlbs(kvm); 3218 } else { 3219 /* 3220 * For each CPU there is a single GPA ASID used by all VCPUs in 3221 * the VM, so it doesn't make sense for the VCPUs to handle 3222 * invalidation of these ASIDs individually. 3223 * 3224 * Instead mark all CPUs as needing ASID invalidation in 3225 * asid_flush_mask, and just use kvm_flush_remote_tlbs(kvm) to 3226 * kick any running VCPUs so they check asid_flush_mask. 3227 */ 3228 cpumask_setall(&kvm->arch.asid_flush_mask); 3229 kvm_flush_remote_tlbs(kvm); 3230 } 3231 } 3232 3233 static void kvm_vz_flush_shadow_memslot(struct kvm *kvm, 3234 const struct kvm_memory_slot *slot) 3235 { 3236 kvm_vz_flush_shadow_all(kvm); 3237 } 3238 3239 static void kvm_vz_vcpu_reenter(struct kvm_vcpu *vcpu) 3240 { 3241 int cpu = smp_processor_id(); 3242 int preserve_guest_tlb; 3243 3244 preserve_guest_tlb = kvm_vz_check_requests(vcpu, cpu); 3245 3246 if (preserve_guest_tlb) 3247 kvm_vz_vcpu_save_wired(vcpu); 3248 3249 kvm_vz_vcpu_load_tlb(vcpu, cpu); 3250 3251 if (preserve_guest_tlb) 3252 kvm_vz_vcpu_load_wired(vcpu); 3253 } 3254 3255 static int kvm_vz_vcpu_run(struct kvm_vcpu *vcpu) 3256 { 3257 int cpu = smp_processor_id(); 3258 int r; 3259 3260 kvm_vz_acquire_htimer(vcpu); 3261 /* Check if we have any exceptions/interrupts pending */ 3262 kvm_mips_deliver_interrupts(vcpu, read_gc0_cause()); 3263 3264 kvm_vz_check_requests(vcpu, cpu); 3265 kvm_vz_vcpu_load_tlb(vcpu, cpu); 3266 kvm_vz_vcpu_load_wired(vcpu); 3267 3268 r = vcpu->arch.vcpu_run(vcpu->run, vcpu); 3269 3270 kvm_vz_vcpu_save_wired(vcpu); 3271 3272 return r; 3273 } 3274 3275 static struct kvm_mips_callbacks kvm_vz_callbacks = { 3276 .handle_cop_unusable = kvm_trap_vz_handle_cop_unusable, 3277 .handle_tlb_mod = kvm_trap_vz_handle_tlb_st_miss, 3278 .handle_tlb_ld_miss = kvm_trap_vz_handle_tlb_ld_miss, 3279 .handle_tlb_st_miss = kvm_trap_vz_handle_tlb_st_miss, 3280 .handle_addr_err_st = kvm_trap_vz_no_handler, 3281 .handle_addr_err_ld = kvm_trap_vz_no_handler, 3282 .handle_syscall = kvm_trap_vz_no_handler, 3283 .handle_res_inst = kvm_trap_vz_no_handler, 3284 .handle_break = kvm_trap_vz_no_handler, 3285 .handle_msa_disabled = kvm_trap_vz_handle_msa_disabled, 3286 .handle_guest_exit = kvm_trap_vz_handle_guest_exit, 3287 3288 .hardware_enable = kvm_vz_hardware_enable, 3289 .hardware_disable = kvm_vz_hardware_disable, 3290 .check_extension = kvm_vz_check_extension, 3291 .vcpu_init = kvm_vz_vcpu_init, 3292 .vcpu_uninit = kvm_vz_vcpu_uninit, 3293 .vcpu_setup = kvm_vz_vcpu_setup, 3294 .flush_shadow_all = kvm_vz_flush_shadow_all, 3295 .flush_shadow_memslot = kvm_vz_flush_shadow_memslot, 3296 .gva_to_gpa = kvm_vz_gva_to_gpa_cb, 3297 .queue_timer_int = kvm_vz_queue_timer_int_cb, 3298 .dequeue_timer_int = kvm_vz_dequeue_timer_int_cb, 3299 .queue_io_int = kvm_vz_queue_io_int_cb, 3300 .dequeue_io_int = kvm_vz_dequeue_io_int_cb, 3301 .irq_deliver = kvm_vz_irq_deliver_cb, 3302 .irq_clear = kvm_vz_irq_clear_cb, 3303 .num_regs = kvm_vz_num_regs, 3304 .copy_reg_indices = kvm_vz_copy_reg_indices, 3305 .get_one_reg = kvm_vz_get_one_reg, 3306 .set_one_reg = kvm_vz_set_one_reg, 3307 .vcpu_load = kvm_vz_vcpu_load, 3308 .vcpu_put = kvm_vz_vcpu_put, 3309 .vcpu_run = kvm_vz_vcpu_run, 3310 .vcpu_reenter = kvm_vz_vcpu_reenter, 3311 }; 3312 3313 int kvm_mips_emulation_init(struct kvm_mips_callbacks **install_callbacks) 3314 { 3315 if (!cpu_has_vz) 3316 return -ENODEV; 3317 3318 /* 3319 * VZ requires at least 2 KScratch registers, so it should have been 3320 * possible to allocate pgd_reg. 3321 */ 3322 if (WARN(pgd_reg == -1, 3323 "pgd_reg not allocated even though cpu_has_vz\n")) 3324 return -ENODEV; 3325 3326 pr_info("Starting KVM with MIPS VZ extensions\n"); 3327 3328 *install_callbacks = &kvm_vz_callbacks; 3329 return 0; 3330 } 3331