Lines Matching +full:pic +full:- +full:base +full:- +full:vec

1 // SPDX-License-Identifier: GPL-2.0-only
3 * Kernel-based Virtual Machine driver for Linux
16 * Ben-Ami Yassour <benami@il.ibm.com>
43 #include <linux/intel-iommu.h>
45 #include <linux/user-return-notifier.h>
59 #include <linux/entry-kvm.h>
88 ((struct kvm_vcpu *)(ctxt)->vcpu)
91 * - enable syscall by default because it's emulated by KVM
92 * - enable LME and LMA by default on 64 bit KVM
140 /* tsc tolerance in parts per million - default to 1/2 of the NTP threshold */
145 * lapic timer advance (tscdeadline mode only) in nanoseconds. '-1' enables
147 * advancement entirely. Any other value is used as-is and disables adaptive
150 static int __read_mostly lapic_timer_advance_ns = -1;
163 int __read_mostly pi_inject_timer = -1;
288 size - useroffset, NULL); in kvm_alloc_emulator_cache()
297 vcpu->arch.apf.gfns[i] = ~0; in kvm_async_pf_hash_reset()
313 if (msrs->registered) { in kvm_on_user_return()
314 msrs->registered = false; in kvm_on_user_return()
319 values = &msrs->values[slot]; in kvm_on_user_return()
320 if (values->host != values->curr) { in kvm_on_user_return()
321 wrmsrl(user_return_msrs_global.msrs[slot], values->host); in kvm_on_user_return()
322 values->curr = values->host; in kvm_on_user_return()
361 msrs->values[i].host = value; in kvm_user_return_msr_cpu_online()
362 msrs->values[i].curr = value; in kvm_user_return_msr_cpu_online()
372 value = (value & mask) | (msrs->values[slot].host & ~mask); in kvm_set_user_return_msr()
373 if (value == msrs->values[slot].curr) in kvm_set_user_return_msr()
379 msrs->values[slot].curr = value; in kvm_set_user_return_msr()
380 if (!msrs->registered) { in kvm_set_user_return_msr()
381 msrs->urn.on_user_return = kvm_on_user_return; in kvm_set_user_return_msr()
382 user_return_notifier_register(&msrs->urn); in kvm_set_user_return_msr()
383 msrs->registered = true; in kvm_set_user_return_msr()
394 if (msrs->registered) in drop_user_return_notifiers()
395 kvm_on_user_return(&msrs->urn); in drop_user_return_notifiers()
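
The matches above trace KVM's user-return MSR machinery: each slot keeps the value the host expects (host) next to the last value actually written (curr), a WRMSR is skipped when nothing changed, and a user-return notifier restores host values lazily on the next return to userspace. A minimal sketch of that shadow-value pattern, with illustrative names (shadow_msr, do_wrmsr) rather than the kernel's:

    struct shadow_msr {
            unsigned long long host;    /* value the host expects */
            unsigned long long curr;    /* last value actually written */
    };

    /* Write only when the target value differs from the cached one. */
    static void shadow_msr_set(struct shadow_msr *m, unsigned long long val,
                               void (*do_wrmsr)(unsigned long long))
    {
            if (val == m->curr)
                    return;                     /* skip the WRMSR */
            do_wrmsr(val);
            m->curr = val;
    }

    /* On return to userspace, undo any guest value still loaded. */
    static void shadow_msr_restore(struct shadow_msr *m,
                                   void (*do_wrmsr)(unsigned long long))
    {
            if (m->curr != m->host) {
                    do_wrmsr(m->host);
                    m->curr = m->host;
            }
    }

Deferring the restore to the notifier keeps WRMSRs off the vcpu_run hot path, which is what the registered flag and drop_user_return_notifiers() above coordinate.
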
400 return vcpu->arch.apic_base; in kvm_get_apic_base()
413 enum lapic_mode new_mode = kvm_apic_mode(msr_info->data); in kvm_set_apic_base()
417 if ((msr_info->data & reserved_bits) != 0 || new_mode == LAPIC_MODE_INVALID) in kvm_set_apic_base()
419 if (!msr_info->host_initiated) { in kvm_set_apic_base()
426 kvm_lapic_set_base(vcpu, msr_info->data); in kvm_set_apic_base()
427 kvm_recalculate_apic_map(vcpu->kvm); in kvm_set_apic_base()
476 * #DBs can be trap-like or fault-like, the caller must check other CPU in exception_type()
494 unsigned nr = vcpu->arch.exception.nr; in kvm_deliver_exception_payload()
495 bool has_payload = vcpu->arch.exception.has_payload; in kvm_deliver_exception_payload()
496 unsigned long payload = vcpu->arch.exception.payload; in kvm_deliver_exception_payload()
504 * "Certain debug exceptions may clear bit 0-3. The in kvm_deliver_exception_payload()
508 vcpu->arch.dr6 &= ~DR_TRAP_BITS; in kvm_deliver_exception_payload()
512 vcpu->arch.dr6 |= DR6_RTM; in kvm_deliver_exception_payload()
513 vcpu->arch.dr6 |= payload; in kvm_deliver_exception_payload()
522 vcpu->arch.dr6 ^= payload & DR6_RTM; in kvm_deliver_exception_payload()
530 vcpu->arch.dr6 &= ~BIT(12); in kvm_deliver_exception_payload()
533 vcpu->arch.cr2 = payload; in kvm_deliver_exception_payload()
537 vcpu->arch.exception.has_payload = false; in kvm_deliver_exception_payload()
538 vcpu->arch.exception.payload = 0; in kvm_deliver_exception_payload()
551 if (!vcpu->arch.exception.pending && !vcpu->arch.exception.injected) { in kvm_multiple_exception()
555 * On vmentry, vcpu->arch.exception.pending is only in kvm_multiple_exception()
562 WARN_ON_ONCE(vcpu->arch.exception.pending); in kvm_multiple_exception()
563 vcpu->arch.exception.injected = true; in kvm_multiple_exception()
573 vcpu->arch.exception.pending = true; in kvm_multiple_exception()
574 vcpu->arch.exception.injected = false; in kvm_multiple_exception()
576 vcpu->arch.exception.has_error_code = has_error; in kvm_multiple_exception()
577 vcpu->arch.exception.nr = nr; in kvm_multiple_exception()
578 vcpu->arch.exception.error_code = error_code; in kvm_multiple_exception()
579 vcpu->arch.exception.has_payload = has_payload; in kvm_multiple_exception()
580 vcpu->arch.exception.payload = payload; in kvm_multiple_exception()
587 prev_nr = vcpu->arch.exception.nr; in kvm_multiple_exception()
589 /* triple fault -> shutdown */ in kvm_multiple_exception()
598 * Generate double fault per SDM Table 5-5. Set in kvm_multiple_exception()
602 vcpu->arch.exception.pending = true; in kvm_multiple_exception()
603 vcpu->arch.exception.injected = false; in kvm_multiple_exception()
604 vcpu->arch.exception.has_error_code = true; in kvm_multiple_exception()
605 vcpu->arch.exception.nr = DF_VECTOR; in kvm_multiple_exception()
606 vcpu->arch.exception.error_code = 0; in kvm_multiple_exception()
607 vcpu->arch.exception.has_payload = false; in kvm_multiple_exception()
608 vcpu->arch.exception.payload = 0; in kvm_multiple_exception()
611 that instruction re-execution will regenerate lost in kvm_multiple_exception()
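
The kvm_multiple_exception() matches implement the SDM Table 5-5 escalation: a second contributory exception while one is pending becomes #DF with a zero error code (lines 602-608), and a fault during #DF delivery is a triple fault, hence the shutdown at line 589. A sketch of the classification, simplified to the three classes KVM distinguishes:

    /* Sketch: KVM's exception_class() treats #DE/#TS/#NP/#SS/#GP as
     * contributory and gives #PF its own class. */
    enum exc_class { EXC_BENIGN, EXC_CONTRIBUTORY, EXC_PAGE_FAULT };

    static int escalates_to_double_fault(enum exc_class prev,
                                         enum exc_class next)
    {
            return (prev == EXC_CONTRIBUTORY && next == EXC_CONTRIBUTORY) ||
                   (prev == EXC_PAGE_FAULT && next != EXC_BENIGN);
    }
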
655 ++vcpu->stat.pf_guest; in kvm_inject_page_fault()
656 vcpu->arch.exception.nested_apf = in kvm_inject_page_fault()
657 is_guest_mode(vcpu) && fault->async_page_fault; in kvm_inject_page_fault()
658 if (vcpu->arch.exception.nested_apf) { in kvm_inject_page_fault()
659 vcpu->arch.apf.nested_apf_token = fault->address; in kvm_inject_page_fault()
660 kvm_queue_exception_e(vcpu, PF_VECTOR, fault->error_code); in kvm_inject_page_fault()
662 kvm_queue_exception_e_p(vcpu, PF_VECTOR, fault->error_code, in kvm_inject_page_fault()
663 fault->address); in kvm_inject_page_fault()
672 WARN_ON_ONCE(fault->vector != PF_VECTOR); in kvm_inject_emulated_page_fault()
674 fault_mmu = fault->nested_page_fault ? vcpu->arch.mmu : in kvm_inject_emulated_page_fault()
675 vcpu->arch.walk_mmu; in kvm_inject_emulated_page_fault()
681 if ((fault->error_code & PFERR_PRESENT_MASK) && in kvm_inject_emulated_page_fault()
682 !(fault->error_code & PFERR_RSVD_MASK)) in kvm_inject_emulated_page_fault()
683 kvm_mmu_invalidate_gva(vcpu, fault_mmu, fault->address, in kvm_inject_emulated_page_fault()
684 fault_mmu->root_hpa); in kvm_inject_emulated_page_fault()
686 fault_mmu->inject_page_fault(vcpu, fault); in kvm_inject_emulated_page_fault()
687 return fault->nested_page_fault; in kvm_inject_emulated_page_fault()
693 atomic_inc(&vcpu->arch.nmi_queued); in kvm_inject_nmi()
747 real_gfn = mmu->translate_gpa(vcpu, ngpa, access, &exception); in kvm_read_guest_page_mmu()
749 return -EFAULT; in kvm_read_guest_page_mmu()
760 return kvm_read_guest_page_mmu(vcpu, vcpu->arch.walk_mmu, gfn, in kvm_read_nested_guest_page()
776 unsigned offset = ((cr3 & (PAGE_SIZE-1)) >> 5) << 2; in load_pdptrs()
779 u64 pdpte[ARRAY_SIZE(mmu->pdptrs)]; in load_pdptrs()
797 memcpy(mmu->pdptrs, pdpte, sizeof(mmu->pdptrs)); in load_pdptrs()
808 u64 pdpte[ARRAY_SIZE(vcpu->arch.walk_mmu->pdptrs)]; in pdptrs_changed()
820 offset = (kvm_read_cr3(vcpu) & 0xffffffe0ul) & (PAGE_SIZE - 1); in pdptrs_changed()
826 return memcmp(pdpte, vcpu->arch.walk_mmu->pdptrs, sizeof(pdpte)) != 0; in pdptrs_changed()
852 if ((vcpu->arch.efer & EFER_LME) && !is_paging(vcpu) && in kvm_set_cr0()
863 if (!(vcpu->arch.efer & EFER_LME) && (cr0 & X86_CR0_PG) && in kvm_set_cr0()
865 !load_pdptrs(vcpu, vcpu->arch.walk_mmu, kvm_read_cr3(vcpu))) in kvm_set_cr0()
882 kvm_arch_has_noncoherent_dma(vcpu->kvm) && in kvm_set_cr0()
883 !kvm_check_has_quirk(vcpu->kvm, KVM_X86_QUIRK_CD_NW_CLEARED)) in kvm_set_cr0()
884 kvm_zap_gfn_range(vcpu->kvm, 0, ~0ULL); in kvm_set_cr0()
900 if (vcpu->arch.xcr0 != host_xcr0) in kvm_load_guest_xsave_state()
901 xsetbv(XCR_XFEATURE_ENABLED_MASK, vcpu->arch.xcr0); in kvm_load_guest_xsave_state()
903 if (vcpu->arch.xsaves_enabled && in kvm_load_guest_xsave_state()
904 vcpu->arch.ia32_xss != host_xss) in kvm_load_guest_xsave_state()
905 wrmsrl(MSR_IA32_XSS, vcpu->arch.ia32_xss); in kvm_load_guest_xsave_state()
910 (vcpu->arch.xcr0 & XFEATURE_MASK_PKRU)) && in kvm_load_guest_xsave_state()
911 vcpu->arch.pkru != vcpu->arch.host_pkru) in kvm_load_guest_xsave_state()
912 __write_pkru(vcpu->arch.pkru); in kvm_load_guest_xsave_state()
920 (vcpu->arch.xcr0 & XFEATURE_MASK_PKRU))) { in kvm_load_host_xsave_state()
921 vcpu->arch.pkru = rdpkru(); in kvm_load_host_xsave_state()
922 if (vcpu->arch.pkru != vcpu->arch.host_pkru) in kvm_load_host_xsave_state()
923 __write_pkru(vcpu->arch.host_pkru); in kvm_load_host_xsave_state()
928 if (vcpu->arch.xcr0 != host_xcr0) in kvm_load_host_xsave_state()
931 if (vcpu->arch.xsaves_enabled && in kvm_load_host_xsave_state()
932 vcpu->arch.ia32_xss != host_xss) in kvm_load_host_xsave_state()
942 u64 old_xcr0 = vcpu->arch.xcr0; in __kvm_set_xcr()
958 valid_bits = vcpu->arch.guest_supported_xcr0 | XFEATURE_MASK_FP; in __kvm_set_xcr()
972 vcpu->arch.xcr0 = xcr0; in __kvm_set_xcr()
993 return -EINVAL; in kvm_valid_cr4()
995 if (cr4 & vcpu->arch.cr4_guest_rsvd_bits) in kvm_valid_cr4()
996 return -EINVAL; in kvm_valid_cr4()
999 return -EINVAL; in kvm_valid_cr4()
1022 && !load_pdptrs(vcpu, vcpu->arch.walk_mmu, in kvm_set_cr4()
1069 (cr3 & vcpu->arch.cr3_lm_rsvd_bits)) in kvm_set_cr3()
1072 !load_pdptrs(vcpu, vcpu->arch.walk_mmu, cr3)) in kvm_set_cr3()
1076 vcpu->arch.cr3 = cr3; in kvm_set_cr3()
1090 vcpu->arch.cr8 = cr8; in kvm_set_cr8()
1100 return vcpu->arch.cr8; in kvm_get_cr8()
1108 if (!(vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP)) { in kvm_update_dr0123()
1110 vcpu->arch.eff_db[i] = vcpu->arch.db[i]; in kvm_update_dr0123()
1111 vcpu->arch.switch_db_regs |= KVM_DEBUGREG_RELOAD; in kvm_update_dr0123()
1119 if (vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP) in kvm_update_dr7()
1120 dr7 = vcpu->arch.guest_debug_dr7; in kvm_update_dr7()
1122 dr7 = vcpu->arch.dr7; in kvm_update_dr7()
1124 vcpu->arch.switch_db_regs &= ~KVM_DEBUGREG_BP_ENABLED; in kvm_update_dr7()
1126 vcpu->arch.switch_db_regs |= KVM_DEBUGREG_BP_ENABLED; in kvm_update_dr7()
1141 size_t size = ARRAY_SIZE(vcpu->arch.db); in __kvm_set_dr()
1145 vcpu->arch.db[array_index_nospec(dr, size)] = val; in __kvm_set_dr()
1146 if (!(vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP)) in __kvm_set_dr()
1147 vcpu->arch.eff_db[dr] = val; in __kvm_set_dr()
1152 return -1; /* #GP */ in __kvm_set_dr()
1153 vcpu->arch.dr6 = (val & DR6_VOLATILE) | kvm_dr6_fixed(vcpu); in __kvm_set_dr()
1158 return -1; /* #GP */ in __kvm_set_dr()
1159 vcpu->arch.dr7 = (val & DR7_VOLATILE) | DR7_FIXED_1; in __kvm_set_dr()
1179 size_t size = ARRAY_SIZE(vcpu->arch.db); in kvm_get_dr()
1183 *val = vcpu->arch.db[array_index_nospec(dr, size)]; in kvm_get_dr()
1187 *val = vcpu->arch.dr6; in kvm_get_dr()
1191 *val = vcpu->arch.dr7; in kvm_get_dr()
1221 * kvm-specific. Those are put in emulated_msrs_all; filtering of emulated_msrs
1344 * List of msr numbers which are used to expose MSR-based features that
1379 * 10 - MISC_PACKAGE_CTRLS
1380 * 11 - ENERGY_FILTERING_CTL
1381 * 12 - DOITM
1382 * 18 - FB_CLEAR_CTRL
1383 * 21 - XAPIC_DISABLE_STATUS
1384 * 23 - OVERCLOCKING_STATUS
1460 switch (msr->index) { in kvm_get_msr_feature()
1462 msr->data = kvm_get_arch_capabilities(); in kvm_get_msr_feature()
1465 rdmsrl_safe(msr->index, &msr->data); in kvm_get_msr_feature()
1525 u64 old_efer = vcpu->arch.efer; in set_efer()
1526 u64 efer = msr_info->data; in set_efer()
1532 if (!msr_info->host_initiated) { in set_efer()
1537 (vcpu->arch.efer & EFER_LME) != (efer & EFER_LME)) in set_efer()
1542 efer |= vcpu->arch.efer & EFER_LMA; in set_efer()
1567 struct kvm *kvm = vcpu->kvm; in kvm_msr_allowed()
1576 idx = srcu_read_lock(&kvm->srcu); in kvm_msr_allowed()
1578 msr_filter = srcu_dereference(kvm->arch.msr_filter, &kvm->srcu); in kvm_msr_allowed()
1584 allowed = msr_filter->default_allow; in kvm_msr_allowed()
1585 ranges = msr_filter->ranges; in kvm_msr_allowed()
1587 for (i = 0; i < msr_filter->count; i++) { in kvm_msr_allowed()
1588 u32 start = ranges[i].base; in kvm_msr_allowed()
1594 allowed = !!test_bit(index - start, bitmap); in kvm_msr_allowed()
1598 /* Note, VM-Exits that go down the "slow" path are accounted below. */ in kvm_msr_allowed()
1599 ++vcpu->stat.exits; in kvm_msr_allowed()
1603 srcu_read_unlock(&kvm->srcu, idx); in kvm_msr_allowed()
1612 * Returns 0 on success, non-0 otherwise.
1636 * non-canonical address is written on Intel but not on in __kvm_set_msr()
1637 * AMD (which ignores the top 32-bits, because it does in __kvm_set_msr()
1638 * not implement 64-bit SYSENTER). in __kvm_set_msr()
1640 * 64-bit code should hence be able to write a non-canonical in __kvm_set_msr()
1642 * vmentry does not fail on Intel after writing a non-canonical in __kvm_set_msr()
1644 * invokes 64-bit SYSENTER. in __kvm_set_msr()
1671 * Returns 0 on success, non-0 otherwise.
1721 if (vcpu->run->msr.error) { in complete_emulated_msr()
1725 kvm_rax_write(vcpu, (u32)vcpu->run->msr.data); in complete_emulated_msr()
1726 kvm_rdx_write(vcpu, vcpu->run->msr.data >> 32); in complete_emulated_msr()
1762 if (!(vcpu->kvm->arch.user_space_msr_mask & msr_reason)) in kvm_msr_user_space()
1765 vcpu->run->exit_reason = exit_reason; in kvm_msr_user_space()
1766 vcpu->run->msr.error = 0; in kvm_msr_user_space()
1767 memset(vcpu->run->msr.pad, 0, sizeof(vcpu->run->msr.pad)); in kvm_msr_user_space()
1768 vcpu->run->msr.reason = msr_reason; in kvm_msr_user_space()
1769 vcpu->run->msr.index = index; in kvm_msr_user_space()
1770 vcpu->run->msr.data = data; in kvm_msr_user_space()
1771 vcpu->arch.complete_userspace_io = completion; in kvm_msr_user_space()
1811 kvm_rax_write(vcpu, data & -1u); in kvm_emulate_rdmsr()
1812 kvm_rdx_write(vcpu, (data >> 32) & -1u); in kvm_emulate_rdmsr()
1848 return vcpu->mode == EXITING_GUEST_MODE || kvm_request_pending(vcpu) || in kvm_vcpu_exit_request()
1855 * i.e. the sending of IPI, sending IPI early in the VM-Exit flow reduces
1862 if (!lapic_in_kernel(vcpu) || !apic_x2apic_mode(vcpu->arch.apic)) in handle_fastpath_set_x2apic_icr_irqoff()
1871 kvm_apic_send_ipi(vcpu->arch.apic, (u32)data, (u32)(data >> 32)); in handle_fastpath_set_x2apic_icr_irqoff()
1872 kvm_lapic_set_reg(vcpu->arch.apic, APIC_ICR2, (u32)(data >> 32)); in handle_fastpath_set_x2apic_icr_irqoff()
1873 kvm_lapic_set_reg(vcpu->arch.apic, APIC_ICR, (u32)data); in handle_fastpath_set_x2apic_icr_irqoff()
1962 write_seqcount_begin(&vdata->seq); in update_pvclock_gtod()
1965 vdata->clock.vclock_mode = tk->tkr_mono.clock->vdso_clock_mode; in update_pvclock_gtod()
1966 vdata->clock.cycle_last = tk->tkr_mono.cycle_last; in update_pvclock_gtod()
1967 vdata->clock.mask = tk->tkr_mono.mask; in update_pvclock_gtod()
1968 vdata->clock.mult = tk->tkr_mono.mult; in update_pvclock_gtod()
1969 vdata->clock.shift = tk->tkr_mono.shift; in update_pvclock_gtod()
1970 vdata->clock.base_cycles = tk->tkr_mono.xtime_nsec; in update_pvclock_gtod()
1971 vdata->clock.offset = tk->tkr_mono.base; in update_pvclock_gtod()
1973 vdata->raw_clock.vclock_mode = tk->tkr_raw.clock->vdso_clock_mode; in update_pvclock_gtod()
1974 vdata->raw_clock.cycle_last = tk->tkr_raw.cycle_last; in update_pvclock_gtod()
1975 vdata->raw_clock.mask = tk->tkr_raw.mask; in update_pvclock_gtod()
1976 vdata->raw_clock.mult = tk->tkr_raw.mult; in update_pvclock_gtod()
1977 vdata->raw_clock.shift = tk->tkr_raw.shift; in update_pvclock_gtod()
1978 vdata->raw_clock.base_cycles = tk->tkr_raw.xtime_nsec; in update_pvclock_gtod()
1979 vdata->raw_clock.offset = tk->tkr_raw.base; in update_pvclock_gtod()
1981 vdata->wall_time_sec = tk->xtime_sec; in update_pvclock_gtod()
1983 vdata->offs_boot = tk->offs_boot; in update_pvclock_gtod()
1985 write_seqcount_end(&vdata->seq); in update_pvclock_gtod()
2008 kvm->arch.wall_clock = wall_clock; in kvm_write_wall_clock()
2030 wall_nsec = ktime_get_real_ns() - get_kvmclock_ns(kvm); in kvm_write_wall_clock()
2045 struct kvm_arch *ka = &vcpu->kvm->arch; in kvm_write_system_time()
2047 if (vcpu->vcpu_id == 0 && !host_initiated) { in kvm_write_system_time()
2048 if (ka->boot_vcpu_runs_old_kvmclock != old_msr) in kvm_write_system_time()
2051 ka->boot_vcpu_runs_old_kvmclock = old_msr; in kvm_write_system_time()
2054 vcpu->arch.time = system_time; in kvm_write_system_time()
2058 vcpu->arch.pv_time_enabled = false; in kvm_write_system_time()
2062 if (!kvm_gfn_to_hva_cache_init(vcpu->kvm, in kvm_write_system_time()
2063 &vcpu->arch.pv_time, system_time & ~1ULL, in kvm_write_system_time()
2065 vcpu->arch.pv_time_enabled = true; in kvm_write_system_time()
2088 shift--; in kvm_get_time_scale()
2124 vcpu->arch.tsc_scaling_ratio = kvm_default_tsc_scaling_ratio; in set_tsc_khz()
2131 vcpu->arch.tsc_catchup = 1; in set_tsc_khz()
2132 vcpu->arch.tsc_always_catchup = 1; in set_tsc_khz()
2136 return -1; in set_tsc_khz()
2140 /* TSC scaling required - calculate ratio */ in set_tsc_khz()
2145 pr_warn_ratelimited("Invalid TSC scaling ratio - virtual-tsc-khz=%u\n", in set_tsc_khz()
2147 return -1; in set_tsc_khz()
2150 vcpu->arch.tsc_scaling_ratio = ratio; in set_tsc_khz()
2162 vcpu->arch.tsc_scaling_ratio = kvm_default_tsc_scaling_ratio; in kvm_set_tsc_khz()
2163 return -1; in kvm_set_tsc_khz()
2168 &vcpu->arch.virtual_tsc_shift, in kvm_set_tsc_khz()
2169 &vcpu->arch.virtual_tsc_mult); in kvm_set_tsc_khz()
2170 vcpu->arch.virtual_tsc_khz = user_tsc_khz; in kvm_set_tsc_khz()
2178 thresh_lo = adjust_tsc_khz(tsc_khz, -tsc_tolerance_ppm); in kvm_set_tsc_khz()
2189 u64 tsc = pvclock_scale_delta(kernel_ns-vcpu->arch.this_tsc_nsec, in compute_guest_tsc()
2190 vcpu->arch.virtual_tsc_mult, in compute_guest_tsc()
2191 vcpu->arch.virtual_tsc_shift); in compute_guest_tsc()
2192 tsc += vcpu->arch.this_tsc_write; in compute_guest_tsc()
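
compute_guest_tsc() above rebuilds the guest TSC from a sampled baseline (this_tsc_nsec/this_tsc_write) plus the elapsed nanoseconds scaled through virtual_tsc_mult/virtual_tsc_shift. The scaling follows pvclock semantics: pre-shift the delta into range, then multiply by a 32-bit binary fraction. A portable sketch (the kernel's pvclock_scale_delta() does the multiply with arch-specific 128-bit helpers):

    /* Sketch: value = (delta << shift) * mul_frac / 2^32, where
     * mul_frac is a 0.32 fixed-point multiplier computed by
     * kvm_get_time_scale() from the two frequencies. */
    static unsigned long long scale_delta(unsigned long long delta,
                                          unsigned int mul_frac, int shift)
    {
            if (shift < 0)
                    delta >>= -shift;
            else
                    delta <<= shift;
            return (unsigned long long)
                   (((unsigned __int128)delta * mul_frac) >> 32);
    }
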
2205 struct kvm_arch *ka = &vcpu->kvm->arch; in kvm_track_tsc_matching()
2208 vcpus_matched = (ka->nr_vcpus_matched_tsc + 1 == in kvm_track_tsc_matching()
2209 atomic_read(&vcpu->kvm->online_vcpus)); in kvm_track_tsc_matching()
2219 if (ka->use_master_clock || in kvm_track_tsc_matching()
2220 (gtod_is_based_on_tsc(gtod->clock.vclock_mode) && vcpus_matched)) in kvm_track_tsc_matching()
2223 trace_kvm_track_tsc(vcpu->vcpu_id, ka->nr_vcpus_matched_tsc, in kvm_track_tsc_matching()
2224 atomic_read(&vcpu->kvm->online_vcpus), in kvm_track_tsc_matching()
2225 ka->use_master_clock, gtod->clock.vclock_mode); in kvm_track_tsc_matching()
2232 * The most significant 64-N bits (mult) of ratio represent the
2235 * point number (mult + frac * 2^(-N)).
2247 u64 ratio = vcpu->arch.tsc_scaling_ratio; in kvm_scale_tsc()
2262 return target_tsc - tsc; in kvm_compute_tsc_offset()
2267 return vcpu->arch.l1_tsc_offset + kvm_scale_tsc(vcpu, host_tsc); in kvm_read_l1_tsc()
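
The comment at lines 2232-2235 defines hardware TSC scaling as an unsigned fixed-point ratio with N fractional bits: the top 64-N bits are the integral part, the low N bits the fraction. Applying it is a 64x64->128 multiply followed by a right shift of N, which kvm_scale_tsc() does via mul_u64_u64_shr(); a sketch with __int128 standing in for that helper (N = 48 matches VMX, SVM uses 32):

    #define TSC_RATIO_FRAC_BITS 48      /* assumed N, as on VMX */

    static unsigned long long scale_tsc(unsigned long long tsc,
                                        unsigned long long ratio)
    {
            return (unsigned long long)
                   (((unsigned __int128)tsc * ratio) >> TSC_RATIO_FRAC_BITS);
    }

A ratio of 1ULL << TSC_RATIO_FRAC_BITS is the identity, and kvm_compute_tsc_offset() above subtracts the scaled host TSC from the target value to obtain the guest's offset.
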
2273 vcpu->arch.l1_tsc_offset = offset; in kvm_vcpu_write_tsc_offset()
2274 vcpu->arch.tsc_offset = kvm_x86_ops.write_l1_tsc_offset(vcpu, offset); in kvm_vcpu_write_tsc_offset()
2281 * TSC is marked unstable when we're running on Hyper-V, in kvm_check_tsc_unstable()
2292 struct kvm *kvm = vcpu->kvm; in kvm_synchronize_tsc()
2299 raw_spin_lock_irqsave(&kvm->arch.tsc_write_lock, flags); in kvm_synchronize_tsc()
2302 elapsed = ns - kvm->arch.last_tsc_nsec; in kvm_synchronize_tsc()
2304 if (vcpu->arch.virtual_tsc_khz) { in kvm_synchronize_tsc()
2307 * detection of vcpu initialization -- need to sync in kvm_synchronize_tsc()
2313 u64 tsc_exp = kvm->arch.last_tsc_write + in kvm_synchronize_tsc()
2315 u64 tsc_hz = vcpu->arch.virtual_tsc_khz * 1000LL; in kvm_synchronize_tsc()
2333 vcpu->arch.virtual_tsc_khz == kvm->arch.last_tsc_khz) { in kvm_synchronize_tsc()
2335 offset = kvm->arch.cur_tsc_offset; in kvm_synchronize_tsc()
2342 already_matched = (vcpu->arch.this_tsc_generation == kvm->arch.cur_tsc_generation); in kvm_synchronize_tsc()
2351 * These values are tracked in kvm->arch.cur_xxx variables. in kvm_synchronize_tsc()
2353 kvm->arch.cur_tsc_generation++; in kvm_synchronize_tsc()
2354 kvm->arch.cur_tsc_nsec = ns; in kvm_synchronize_tsc()
2355 kvm->arch.cur_tsc_write = data; in kvm_synchronize_tsc()
2356 kvm->arch.cur_tsc_offset = offset; in kvm_synchronize_tsc()
2364 kvm->arch.last_tsc_nsec = ns; in kvm_synchronize_tsc()
2365 kvm->arch.last_tsc_write = data; in kvm_synchronize_tsc()
2366 kvm->arch.last_tsc_khz = vcpu->arch.virtual_tsc_khz; in kvm_synchronize_tsc()
2368 vcpu->arch.last_guest_tsc = data; in kvm_synchronize_tsc()
2371 vcpu->arch.this_tsc_generation = kvm->arch.cur_tsc_generation; in kvm_synchronize_tsc()
2372 vcpu->arch.this_tsc_nsec = kvm->arch.cur_tsc_nsec; in kvm_synchronize_tsc()
2373 vcpu->arch.this_tsc_write = kvm->arch.cur_tsc_write; in kvm_synchronize_tsc()
2376 raw_spin_unlock_irqrestore(&kvm->arch.tsc_write_lock, flags); in kvm_synchronize_tsc()
2378 spin_lock(&kvm->arch.pvclock_gtod_sync_lock); in kvm_synchronize_tsc()
2380 kvm->arch.nr_vcpus_matched_tsc = 0; in kvm_synchronize_tsc()
2382 kvm->arch.nr_vcpus_matched_tsc++; in kvm_synchronize_tsc()
2386 spin_unlock(&kvm->arch.pvclock_gtod_sync_lock); in kvm_synchronize_tsc()
2392 u64 tsc_offset = vcpu->arch.l1_tsc_offset; in adjust_tsc_offset_guest()
2398 if (vcpu->arch.tsc_scaling_ratio != kvm_default_tsc_scaling_ratio) in adjust_tsc_offset_host()
2432 switch (clock->vclock_mode) { in vgettsc()
2439 v = (tsc_pg_val - clock->cycle_last) & in vgettsc()
2440 clock->mask; in vgettsc()
2449 v = (*tsc_timestamp - clock->cycle_last) & in vgettsc()
2450 clock->mask; in vgettsc()
2459 return v * clock->mult; in vgettsc()
2470 seq = read_seqcount_begin(&gtod->seq); in do_monotonic_raw()
2471 ns = gtod->raw_clock.base_cycles; in do_monotonic_raw()
2472 ns += vgettsc(&gtod->raw_clock, tsc_timestamp, &mode); in do_monotonic_raw()
2473 ns >>= gtod->raw_clock.shift; in do_monotonic_raw()
2474 ns += ktime_to_ns(ktime_add(gtod->raw_clock.offset, gtod->offs_boot)); in do_monotonic_raw()
2475 } while (unlikely(read_seqcount_retry(&gtod->seq, seq))); in do_monotonic_raw()
2489 seq = read_seqcount_begin(&gtod->seq); in do_realtime()
2490 ts->tv_sec = gtod->wall_time_sec; in do_realtime()
2491 ns = gtod->clock.base_cycles; in do_realtime()
2492 ns += vgettsc(&gtod->clock, tsc_timestamp, &mode); in do_realtime()
2493 ns >>= gtod->clock.shift; in do_realtime()
2494 } while (unlikely(read_seqcount_retry(&gtod->seq, seq))); in do_realtime()
2496 ts->tv_sec += __iter_div_u64_rem(ns, NSEC_PER_SEC, &ns); in do_realtime()
2497 ts->tv_nsec = ns; in do_realtime()
2541 * 4. ret0 = timespec0 + (rdtsc - tsc0) |
2542 * 5. | ret1 = timespec1 + (rdtsc - tsc1)
2543 * | ret1 = timespec0 + N + (rdtsc - (tsc0 + M))
2547 * - ret0 < ret1
2548 * - timespec0 + (rdtsc - tsc0) < timespec0 + N + (rdtsc - (tsc0 + M))
2550 * - 0 < N - M => M < N
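
Lines 2541-2550 above are the monotonicity argument from the masterclock comment; the listing elides the algebra between the last two inequalities. Spelled out (timespec0 is common to both sides, and rdtsc denotes the same instantaneous read):

    ret0 < ret1
    timespec0 + (rdtsc - tsc0) < timespec0 + N + (rdtsc - (tsc0 + M))
    rdtsc - tsc0 < N + (rdtsc - tsc0) - M        (cancel timespec0)
    0 < N - M  =>  M < N                         (cancel rdtsc - tsc0)

That is, guest time only stays monotonic across vCPUs if the host clock advanced at least as much as the TSC suggests (M < N), which does not always hold; the masterclock therefore pins every vCPU to the single (master_kernel_ns, master_cycle_now) pair captured in pvclock_update_vm_gtod_copy() below.
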
2569 struct kvm_arch *ka = &kvm->arch; in pvclock_update_vm_gtod_copy()
2573 vcpus_matched = (ka->nr_vcpus_matched_tsc + 1 == in pvclock_update_vm_gtod_copy()
2574 atomic_read(&kvm->online_vcpus)); in pvclock_update_vm_gtod_copy()
2581 &ka->master_kernel_ns, in pvclock_update_vm_gtod_copy()
2582 &ka->master_cycle_now); in pvclock_update_vm_gtod_copy()
2584 ka->use_master_clock = host_tsc_clocksource && vcpus_matched in pvclock_update_vm_gtod_copy()
2585 && !ka->backwards_tsc_observed in pvclock_update_vm_gtod_copy()
2586 && !ka->boot_vcpu_runs_old_kvmclock; in pvclock_update_vm_gtod_copy()
2588 if (ka->use_master_clock) in pvclock_update_vm_gtod_copy()
2592 trace_kvm_update_master_clock(ka->use_master_clock, vclock_mode, in pvclock_update_vm_gtod_copy()
2607 struct kvm_arch *ka = &kvm->arch; in kvm_gen_update_masterclock()
2609 spin_lock(&ka->pvclock_gtod_sync_lock); in kvm_gen_update_masterclock()
2621 spin_unlock(&ka->pvclock_gtod_sync_lock); in kvm_gen_update_masterclock()
2627 struct kvm_arch *ka = &kvm->arch; in get_kvmclock_ns()
2631 spin_lock(&ka->pvclock_gtod_sync_lock); in get_kvmclock_ns()
2632 if (!ka->use_master_clock) { in get_kvmclock_ns()
2633 spin_unlock(&ka->pvclock_gtod_sync_lock); in get_kvmclock_ns()
2634 return get_kvmclock_base_ns() + ka->kvmclock_offset; in get_kvmclock_ns()
2637 hv_clock.tsc_timestamp = ka->master_cycle_now; in get_kvmclock_ns()
2638 hv_clock.system_time = ka->master_kernel_ns + ka->kvmclock_offset; in get_kvmclock_ns()
2639 spin_unlock(&ka->pvclock_gtod_sync_lock); in get_kvmclock_ns()
2650 ret = get_kvmclock_base_ns() + ka->kvmclock_offset; in get_kvmclock_ns()
2659 struct kvm_vcpu_arch *vcpu = &v->arch; in kvm_setup_pvclock_page()
2662 if (unlikely(kvm_read_guest_cached(v->kvm, &vcpu->pv_time, in kvm_setup_pvclock_page()
2677 * and third write. The vcpu->pv_time cache is still valid, because the in kvm_setup_pvclock_page()
2685 vcpu->hv_clock.version = guest_hv_clock.version + 1; in kvm_setup_pvclock_page()
2686 kvm_write_guest_cached(v->kvm, &vcpu->pv_time, in kvm_setup_pvclock_page()
2687 &vcpu->hv_clock, in kvm_setup_pvclock_page()
2688 sizeof(vcpu->hv_clock.version)); in kvm_setup_pvclock_page()
2693 vcpu->hv_clock.flags |= (guest_hv_clock.flags & PVCLOCK_GUEST_STOPPED); in kvm_setup_pvclock_page()
2695 if (vcpu->pvclock_set_guest_stopped_request) { in kvm_setup_pvclock_page()
2696 vcpu->hv_clock.flags |= PVCLOCK_GUEST_STOPPED; in kvm_setup_pvclock_page()
2697 vcpu->pvclock_set_guest_stopped_request = false; in kvm_setup_pvclock_page()
2700 trace_kvm_pvclock_update(v->vcpu_id, &vcpu->hv_clock); in kvm_setup_pvclock_page()
2702 kvm_write_guest_cached(v->kvm, &vcpu->pv_time, in kvm_setup_pvclock_page()
2703 &vcpu->hv_clock, in kvm_setup_pvclock_page()
2704 sizeof(vcpu->hv_clock)); in kvm_setup_pvclock_page()
2708 vcpu->hv_clock.version++; in kvm_setup_pvclock_page()
2709 kvm_write_guest_cached(v->kvm, &vcpu->pv_time, in kvm_setup_pvclock_page()
2710 &vcpu->hv_clock, in kvm_setup_pvclock_page()
2711 sizeof(vcpu->hv_clock.version)); in kvm_setup_pvclock_page()
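
kvm_setup_pvclock_page() above is the writer half of the pvclock version protocol: bump version to an odd value (line 2685), publish the clock payload, then bump back to even (line 2708), with write barriers between the steps on the unlisted lines. A sketch of the guest-side read loop this enables (names here are illustrative; the guest's real helpers are pvclock_read_begin()/pvclock_read_retry()):

    /* Sketch: an odd version means an update is in flight, and a
     * changed version means the copy raced with one. */
    static unsigned int pv_read_begin(const volatile unsigned int *version)
    {
            unsigned int v;

            do {
                    v = *version;
            } while (v & 1);                    /* odd: writer mid-update */
            __atomic_thread_fence(__ATOMIC_ACQUIRE);
            return v;
    }

    static int pv_read_retry(const volatile unsigned int *version,
                             unsigned int v)
    {
            __atomic_thread_fence(__ATOMIC_ACQUIRE);
            return *version != v;               /* changed: retry */
    }

A consistent snapshot is then two equal, even reads bracketing the copy: do { v = pv_read_begin(&ti->version); ...copy... } while (pv_read_retry(&ti->version, v)).
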
2717 struct kvm_vcpu_arch *vcpu = &v->arch; in kvm_guest_time_update()
2718 struct kvm_arch *ka = &v->kvm->arch; in kvm_guest_time_update()
2731 spin_lock(&ka->pvclock_gtod_sync_lock); in kvm_guest_time_update()
2732 use_master_clock = ka->use_master_clock; in kvm_guest_time_update()
2734 host_tsc = ka->master_cycle_now; in kvm_guest_time_update()
2735 kernel_ns = ka->master_kernel_ns; in kvm_guest_time_update()
2737 spin_unlock(&ka->pvclock_gtod_sync_lock); in kvm_guest_time_update()
2758 * 2) Broken TSC compensation resets the base at each VCPU in kvm_guest_time_update()
2764 if (vcpu->tsc_catchup) { in kvm_guest_time_update()
2767 adjust_tsc_offset_guest(v, tsc - tsc_timestamp); in kvm_guest_time_update()
2779 if (unlikely(vcpu->hw_tsc_khz != tgt_tsc_khz)) { in kvm_guest_time_update()
2781 &vcpu->hv_clock.tsc_shift, in kvm_guest_time_update()
2782 &vcpu->hv_clock.tsc_to_system_mul); in kvm_guest_time_update()
2783 vcpu->hw_tsc_khz = tgt_tsc_khz; in kvm_guest_time_update()
2786 vcpu->hv_clock.tsc_timestamp = tsc_timestamp; in kvm_guest_time_update()
2787 vcpu->hv_clock.system_time = kernel_ns + v->kvm->arch.kvmclock_offset; in kvm_guest_time_update()
2788 vcpu->last_guest_tsc = tsc_timestamp; in kvm_guest_time_update()
2795 vcpu->hv_clock.flags = pvclock_flags; in kvm_guest_time_update()
2797 if (vcpu->pv_time_enabled) in kvm_guest_time_update()
2799 if (v == kvm_get_vcpu(v->kvm, 0)) in kvm_guest_time_update()
2800 kvm_hv_setup_tsc_page(v->kvm, &vcpu->hv_clock); in kvm_guest_time_update()
2806 * vcpu->cpu migration, should not allow system_timestamp from
2812 * We need to rate-limit these requests though, as they can
2815 * by the delay we use to rate-limit the updates.
2837 struct kvm *kvm = v->kvm; in kvm_gen_kvmclock_update()
2840 schedule_delayed_work(&kvm->arch.kvmclock_update_work, in kvm_gen_kvmclock_update()
2856 schedule_delayed_work(&kvm->arch.kvmclock_update_work, 0); in kvmclock_sync_fn()
2857 schedule_delayed_work(&kvm->arch.kvmclock_sync_work, in kvmclock_sync_fn()
2868 return !!(vcpu->arch.msr_hwcr & BIT_ULL(18)); in can_set_mci_status()
2875 u64 mcg_cap = vcpu->arch.mcg_cap; in set_msr_mce()
2877 u32 msr = msr_info->index; in set_msr_mce()
2878 u64 data = msr_info->data; in set_msr_mce()
2882 vcpu->arch.mcg_status = data; in set_msr_mce()
2886 (data || !msr_info->host_initiated)) in set_msr_mce()
2890 vcpu->arch.mcg_ctl = data; in set_msr_mce()
2896 msr - MSR_IA32_MC0_CTL, in set_msr_mce()
2897 MSR_IA32_MCx_CTL(bank_num) - MSR_IA32_MC0_CTL); in set_msr_mce()
2905 * correctable, single-bit ECC data errors. in set_msr_mce()
2912 if (!msr_info->host_initiated && in set_msr_mce()
2918 vcpu->arch.mce_banks[offset] = data; in set_msr_mce()
2928 struct kvm *kvm = vcpu->kvm; in xen_hvm_config()
2930 u8 *blob_addr = lm ? (u8 *)(long)kvm->arch.xen_hvm_config.blob_addr_64 in xen_hvm_config()
2931 : (u8 *)(long)kvm->arch.xen_hvm_config.blob_addr_32; in xen_hvm_config()
2932 u8 blob_size = lm ? kvm->arch.xen_hvm_config.blob_size_64 in xen_hvm_config()
2933 : kvm->arch.xen_hvm_config.blob_size_32; in xen_hvm_config()
2956 return (vcpu->arch.apf.msr_en_val & mask) == mask; in kvm_pv_async_pf_enabled()
2978 vcpu->arch.apf.msr_en_val = data; in kvm_pv_enable_async_pf()
2986 if (kvm_gfn_to_hva_cache_init(vcpu->kvm, &vcpu->arch.apf.data, gpa, in kvm_pv_enable_async_pf()
2990 vcpu->arch.apf.send_user_only = !(data & KVM_ASYNC_PF_SEND_ALWAYS); in kvm_pv_enable_async_pf()
2991 vcpu->arch.apf.delivery_as_pf_vmexit = data & KVM_ASYNC_PF_DELIVERY_AS_PF_VMEXIT; in kvm_pv_enable_async_pf()
3000 /* Bits 8-63 are reserved */ in kvm_pv_enable_async_pf_int()
3007 vcpu->arch.apf.msr_int_val = data; in kvm_pv_enable_async_pf_int()
3009 vcpu->arch.apf.vec = data & KVM_ASYNC_PF_VEC_MASK; in kvm_pv_enable_async_pf_int()
3016 vcpu->arch.pv_time_enabled = false; in kvmclock_reset()
3017 vcpu->arch.time = 0; in kvmclock_reset()
3022 ++vcpu->stat.tlb_flush; in kvm_vcpu_flush_tlb_all()
3028 ++vcpu->stat.tlb_flush; in kvm_vcpu_flush_tlb_guest()
3034 struct gfn_to_hva_cache *ghc = &vcpu->arch.st.cache; in record_steal_time()
3037 gpa_t gpa = vcpu->arch.st.msr_val & KVM_STEAL_VALID_BITS; in record_steal_time()
3041 if (!(vcpu->arch.st.msr_val & KVM_MSR_ENABLED)) in record_steal_time()
3044 if (WARN_ON_ONCE(current->mm != vcpu->kvm->mm)) in record_steal_time()
3047 slots = kvm_memslots(vcpu->kvm); in record_steal_time()
3049 if (unlikely(slots->generation != ghc->generation || in record_steal_time()
3050 gpa != ghc->gpa || in record_steal_time()
3051 kvm_is_error_hva(ghc->hva) || !ghc->memslot)) { in record_steal_time()
3053 BUILD_BUG_ON((sizeof(*st) - 1) & KVM_STEAL_VALID_BITS); in record_steal_time()
3055 if (kvm_gfn_to_hva_cache_init(vcpu->kvm, ghc, gpa, sizeof(*st)) || in record_steal_time()
3056 kvm_is_error_hva(ghc->hva) || !ghc->memslot) in record_steal_time()
3060 st = (struct kvm_steal_time __user *)ghc->hva; in record_steal_time()
3067 int err = -EFAULT; in record_steal_time()
3078 "+m" (st->preempted)); in record_steal_time()
3084 vcpu->arch.st.preempted = 0; in record_steal_time()
3086 trace_kvm_pv_tlb_flush(vcpu->vcpu_id, in record_steal_time()
3097 unsafe_put_user(0, &st->preempted, out); in record_steal_time()
3098 vcpu->arch.st.preempted = 0; in record_steal_time()
3101 unsafe_get_user(version, &st->version, out); in record_steal_time()
3106 unsafe_put_user(version, &st->version, out); in record_steal_time()
3110 unsafe_get_user(steal, &st->steal, out); in record_steal_time()
3111 steal += current->sched_info.run_delay - in record_steal_time()
3112 vcpu->arch.st.last_steal; in record_steal_time()
3113 vcpu->arch.st.last_steal = current->sched_info.run_delay; in record_steal_time()
3114 unsafe_put_user(steal, &st->steal, out); in record_steal_time()
3117 unsafe_put_user(version, &st->version, out); in record_steal_time()
3122 mark_page_dirty_in_slot(ghc->memslot, gpa_to_gfn(ghc->gpa)); in record_steal_time()
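
record_steal_time() reuses the same odd/even version dance for the steal_time page (lines 3101-3117) and grows the guest-visible counter by however much the task's run_delay advanced since the last snapshot. The accounting step, isolated as a sketch:

    /* Sketch of the delta accounting above: run_delay is the
     * scheduler's cumulative runqueue-wait time for this task. */
    static unsigned long long
    accumulate_steal(unsigned long long run_delay,
                     unsigned long long *last_snapshot,  /* per-vCPU */
                     unsigned long long steal)           /* guest copy */
    {
            steal += run_delay - *last_snapshot;
            *last_snapshot = run_delay;
            return steal;
    }
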
3128 u32 msr = msr_info->index; in kvm_set_msr_common()
3129 u64 data = msr_info->data; in kvm_set_msr_common()
3143 if (msr_info->host_initiated) in kvm_set_msr_common()
3144 vcpu->arch.microcode_version = data; in kvm_set_msr_common()
3147 if (!msr_info->host_initiated) in kvm_set_msr_common()
3149 vcpu->arch.arch_capabilities = data; in kvm_set_msr_common()
3154 if (!msr_info->host_initiated) in kvm_set_msr_common()
3161 vcpu->arch.perf_capabilities = data; in kvm_set_msr_common()
3174 vcpu->arch.msr_hwcr = data; in kvm_set_msr_common()
3190 /* We support the non-activated case already */ in kvm_set_msr_common()
3193 /* Values other than LBR and BTF are vendor-specific, in kvm_set_msr_common()
3211 if (!msr_info->host_initiated) { in kvm_set_msr_common()
3212 s64 adj = data - vcpu->arch.ia32_tsc_adjust_msr; in kvm_set_msr_common()
3219 vcpu->arch.ia32_tsc_adjust_msr = data; in kvm_set_msr_common()
3223 if (!kvm_check_has_quirk(vcpu->kvm, KVM_X86_QUIRK_MISC_ENABLE_NO_MWAIT) && in kvm_set_msr_common()
3224 ((vcpu->arch.ia32_misc_enable_msr ^ data) & MSR_IA32_MISC_ENABLE_MWAIT)) { in kvm_set_msr_common()
3227 vcpu->arch.ia32_misc_enable_msr = data; in kvm_set_msr_common()
3230 vcpu->arch.ia32_misc_enable_msr = data; in kvm_set_msr_common()
3234 if (!msr_info->host_initiated) in kvm_set_msr_common()
3236 vcpu->arch.smbase = data; in kvm_set_msr_common()
3239 vcpu->arch.msr_ia32_power_ctl = data; in kvm_set_msr_common()
3242 if (msr_info->host_initiated) { in kvm_set_msr_common()
3245 u64 adj = kvm_compute_tsc_offset(vcpu, data) - vcpu->arch.l1_tsc_offset; in kvm_set_msr_common()
3247 vcpu->arch.ia32_tsc_adjust_msr += adj; in kvm_set_msr_common()
3251 if (!msr_info->host_initiated && in kvm_set_msr_common()
3261 vcpu->arch.ia32_xss = data; in kvm_set_msr_common()
3265 if (!msr_info->host_initiated) in kvm_set_msr_common()
3267 vcpu->arch.smi_count = data; in kvm_set_msr_common()
3273 kvm_write_wall_clock(vcpu->kvm, data); in kvm_set_msr_common()
3279 kvm_write_wall_clock(vcpu->kvm, data); in kvm_set_msr_common()
3285 kvm_write_system_time(vcpu, data, false, msr_info->host_initiated); in kvm_set_msr_common()
3291 kvm_write_system_time(vcpu, data, true, msr_info->host_initiated); in kvm_set_msr_common()
3311 vcpu->arch.apf.pageready_pending = false; in kvm_set_msr_common()
3325 vcpu->arch.st.msr_val = data; in kvm_set_msr_common()
3346 if (data & (-1ULL << 1)) in kvm_set_msr_common()
3349 vcpu->arch.msr_kvm_poll_control = data; in kvm_set_msr_common()
3354 case MSR_IA32_MC0_CTL ... MSR_IA32_MCx_CTL(KVM_MAX_MCE_BANKS) - 1: in kvm_set_msr_common()
3374 * all pre-dating SVM, but a recommended workaround from in kvm_set_msr_common()
3390 msr_info->host_initiated); in kvm_set_msr_common()
3392 /* Drop writes to this legacy MSR -- see rdmsr in kvm_set_msr_common()
3402 vcpu->arch.osvw.length = data; in kvm_set_msr_common()
3407 vcpu->arch.osvw.status = data; in kvm_set_msr_common()
3410 if (!msr_info->host_initiated || in kvm_set_msr_common()
3414 vcpu->arch.msr_platform_info = data; in kvm_set_msr_common()
3421 vcpu->arch.msr_misc_features_enables = data; in kvm_set_msr_common()
3424 if (msr && (msr == vcpu->kvm->arch.xen_hvm_config.msr)) in kvm_set_msr_common()
3437 u64 mcg_cap = vcpu->arch.mcg_cap; in get_msr_mce()
3446 data = vcpu->arch.mcg_cap; in get_msr_mce()
3451 data = vcpu->arch.mcg_ctl; in get_msr_mce()
3454 data = vcpu->arch.mcg_status; in get_msr_mce()
3460 msr - MSR_IA32_MC0_CTL, in get_msr_mce()
3461 MSR_IA32_MCx_CTL(bank_num) - MSR_IA32_MC0_CTL); in get_msr_mce()
3463 data = vcpu->arch.mce_banks[offset]; in get_msr_mce()
3474 switch (msr_info->index) { in kvm_get_msr_common()
3498 * so for existing CPU-specific MSRs. in kvm_get_msr_common()
3505 msr_info->data = 0; in kvm_get_msr_common()
3512 if (kvm_pmu_is_valid_msr(vcpu, msr_info->index)) in kvm_get_msr_common()
3514 msr_info->data = 0; in kvm_get_msr_common()
3517 msr_info->data = vcpu->arch.microcode_version; in kvm_get_msr_common()
3520 if (!msr_info->host_initiated && in kvm_get_msr_common()
3523 msr_info->data = vcpu->arch.arch_capabilities; in kvm_get_msr_common()
3526 if (!msr_info->host_initiated && in kvm_get_msr_common()
3529 msr_info->data = vcpu->arch.perf_capabilities; in kvm_get_msr_common()
3532 msr_info->data = vcpu->arch.msr_ia32_power_ctl; in kvm_get_msr_common()
3541 * return L1's TSC value to ensure backwards-compatible in kvm_get_msr_common()
3544 u64 tsc_offset = msr_info->host_initiated ? vcpu->arch.l1_tsc_offset : in kvm_get_msr_common()
3545 vcpu->arch.tsc_offset; in kvm_get_msr_common()
3547 msr_info->data = kvm_scale_tsc(vcpu, rdtsc()) + tsc_offset; in kvm_get_msr_common()
3552 return kvm_mtrr_get_msr(vcpu, msr_info->index, &msr_info->data); in kvm_get_msr_common()
3554 msr_info->data = 3; in kvm_get_msr_common()
3568 msr_info->data = 1 << 24; in kvm_get_msr_common()
3571 msr_info->data = kvm_get_apic_base(vcpu); in kvm_get_msr_common()
3574 return kvm_x2apic_msr_read(vcpu, msr_info->index, &msr_info->data); in kvm_get_msr_common()
3576 msr_info->data = kvm_get_lapic_tscdeadline_msr(vcpu); in kvm_get_msr_common()
3579 msr_info->data = (u64)vcpu->arch.ia32_tsc_adjust_msr; in kvm_get_msr_common()
3582 msr_info->data = vcpu->arch.ia32_misc_enable_msr; in kvm_get_msr_common()
3585 if (!msr_info->host_initiated) in kvm_get_msr_common()
3587 msr_info->data = vcpu->arch.smbase; in kvm_get_msr_common()
3590 msr_info->data = vcpu->arch.smi_count; in kvm_get_msr_common()
3594 msr_info->data = 1000ULL; in kvm_get_msr_common()
3596 msr_info->data |= (((uint64_t)4ULL) << 40); in kvm_get_msr_common()
3599 msr_info->data = vcpu->arch.efer; in kvm_get_msr_common()
3605 msr_info->data = vcpu->kvm->arch.wall_clock; in kvm_get_msr_common()
3611 msr_info->data = vcpu->kvm->arch.wall_clock; in kvm_get_msr_common()
3617 msr_info->data = vcpu->arch.time; in kvm_get_msr_common()
3623 msr_info->data = vcpu->arch.time; in kvm_get_msr_common()
3629 msr_info->data = vcpu->arch.apf.msr_en_val; in kvm_get_msr_common()
3635 msr_info->data = vcpu->arch.apf.msr_int_val; in kvm_get_msr_common()
3641 msr_info->data = 0; in kvm_get_msr_common()
3647 msr_info->data = vcpu->arch.st.msr_val; in kvm_get_msr_common()
3653 msr_info->data = vcpu->arch.pv_eoi.msr_val; in kvm_get_msr_common()
3659 msr_info->data = vcpu->arch.msr_kvm_poll_control; in kvm_get_msr_common()
3666 case MSR_IA32_MC0_CTL ... MSR_IA32_MCx_CTL(KVM_MAX_MCE_BANKS) - 1: in kvm_get_msr_common()
3667 return get_msr_mce(vcpu, msr_info->index, &msr_info->data, in kvm_get_msr_common()
3668 msr_info->host_initiated); in kvm_get_msr_common()
3670 if (!msr_info->host_initiated && in kvm_get_msr_common()
3673 msr_info->data = vcpu->arch.ia32_xss; in kvm_get_msr_common()
3677 * Provide expected ramp-up count for K7. All other in kvm_get_msr_common()
3685 msr_info->data = 0x20000000; in kvm_get_msr_common()
3697 msr_info->index, &msr_info->data, in kvm_get_msr_common()
3698 msr_info->host_initiated); in kvm_get_msr_common()
3710 msr_info->data = 0xbe702111; in kvm_get_msr_common()
3715 msr_info->data = vcpu->arch.osvw.length; in kvm_get_msr_common()
3720 msr_info->data = vcpu->arch.osvw.status; in kvm_get_msr_common()
3723 if (!msr_info->host_initiated && in kvm_get_msr_common()
3724 !vcpu->kvm->arch.guest_can_read_msr_platform_info) in kvm_get_msr_common()
3726 msr_info->data = vcpu->arch.msr_platform_info; in kvm_get_msr_common()
3729 msr_info->data = vcpu->arch.msr_misc_features_enables; in kvm_get_msr_common()
3732 msr_info->data = vcpu->arch.msr_hwcr; in kvm_get_msr_common()
3735 if (kvm_pmu_is_valid_msr(vcpu, msr_info->index)) in kvm_get_msr_common()
3755 for (i = 0; i < msrs->nmsrs; ++i) in __msr_io()
3777 r = -EFAULT; in msr_io()
3781 r = -E2BIG; in msr_io()
3786 entries = memdup_user(user_msrs->entries, size); in msr_io()
3796 r = -EFAULT; in msr_io()
3797 if (writeback && copy_to_user(user_msrs->entries, entries, size)) in msr_io()
3929 r = kvm_x86_ops.nested_ops->get_state ? in kvm_vm_ioctl_check_extension()
3930 kvm_x86_ops.nested_ops->get_state(NULL, NULL, 0) : 0; in kvm_vm_ioctl_check_extension()
3936 r = kvm_x86_ops.nested_ops->enable_evmcs != NULL; in kvm_vm_ioctl_check_extension()
3963 r = -EFAULT; in kvm_arch_dev_ioctl()
3970 r = -E2BIG; in kvm_arch_dev_ioctl()
3973 r = -EFAULT; in kvm_arch_dev_ioctl()
3974 if (copy_to_user(user_msr_list->indices, &msrs_to_save, in kvm_arch_dev_ioctl()
3977 if (copy_to_user(user_msr_list->indices + num_msrs_to_save, in kvm_arch_dev_ioctl()
3989 r = -EFAULT; in kvm_arch_dev_ioctl()
3993 r = kvm_dev_ioctl_get_cpuid(&cpuid, cpuid_arg->entries, in kvm_arch_dev_ioctl()
3998 r = -EFAULT; in kvm_arch_dev_ioctl()
4005 r = -EFAULT; in kvm_arch_dev_ioctl()
4016 r = -EFAULT; in kvm_arch_dev_ioctl()
4023 r = -E2BIG; in kvm_arch_dev_ioctl()
4026 r = -EFAULT; in kvm_arch_dev_ioctl()
4027 if (copy_to_user(user_msr_list->indices, &msr_based_features, in kvm_arch_dev_ioctl()
4037 r = -EINVAL; in kvm_arch_dev_ioctl()
4051 return kvm_arch_has_noncoherent_dma(vcpu->kvm); in need_emulate_wbinvd()
4059 cpumask_set_cpu(cpu, vcpu->arch.wbinvd_dirty_mask); in kvm_arch_vcpu_load()
4060 else if (vcpu->cpu != -1 && vcpu->cpu != cpu) in kvm_arch_vcpu_load()
4061 smp_call_function_single(vcpu->cpu, in kvm_arch_vcpu_load()
4068 vcpu->arch.host_pkru = read_pkru(); in kvm_arch_vcpu_load()
4071 if (unlikely(vcpu->arch.tsc_offset_adjustment)) { in kvm_arch_vcpu_load()
4072 adjust_tsc_offset_host(vcpu, vcpu->arch.tsc_offset_adjustment); in kvm_arch_vcpu_load()
4073 vcpu->arch.tsc_offset_adjustment = 0; in kvm_arch_vcpu_load()
4077 if (unlikely(vcpu->cpu != cpu) || kvm_check_tsc_unstable()) { in kvm_arch_vcpu_load()
4078 s64 tsc_delta = !vcpu->arch.last_host_tsc ? 0 : in kvm_arch_vcpu_load()
4079 rdtsc() - vcpu->arch.last_host_tsc; in kvm_arch_vcpu_load()
4085 vcpu->arch.last_guest_tsc); in kvm_arch_vcpu_load()
4087 vcpu->arch.tsc_catchup = 1; in kvm_arch_vcpu_load()
4095 * kvmclock on vcpu->cpu migration in kvm_arch_vcpu_load()
4097 if (!vcpu->kvm->arch.use_master_clock || vcpu->cpu == -1) in kvm_arch_vcpu_load()
4099 if (vcpu->cpu != cpu) in kvm_arch_vcpu_load()
4101 vcpu->cpu = cpu; in kvm_arch_vcpu_load()
4109 struct gfn_to_hva_cache *ghc = &vcpu->arch.st.cache; in kvm_steal_time_set_preempted()
4113 gpa_t gpa = vcpu->arch.st.msr_val & KVM_STEAL_VALID_BITS; in kvm_steal_time_set_preempted()
4116 * The vCPU can be marked preempted if and only if the VM-Exit was on in kvm_steal_time_set_preempted()
4120 * preempted if and only if the VM-Exit was due to a host interrupt. in kvm_steal_time_set_preempted()
4122 if (!vcpu->arch.at_instruction_boundary) { in kvm_steal_time_set_preempted()
4123 vcpu->stat.preemption_other++; in kvm_steal_time_set_preempted()
4127 vcpu->stat.preemption_reported++; in kvm_steal_time_set_preempted()
4128 if (!(vcpu->arch.st.msr_val & KVM_MSR_ENABLED)) in kvm_steal_time_set_preempted()
4131 if (vcpu->arch.st.preempted) in kvm_steal_time_set_preempted()
4135 if (unlikely(current->mm != vcpu->kvm->mm)) in kvm_steal_time_set_preempted()
4138 slots = kvm_memslots(vcpu->kvm); in kvm_steal_time_set_preempted()
4140 if (unlikely(slots->generation != ghc->generation || in kvm_steal_time_set_preempted()
4141 gpa != ghc->gpa || in kvm_steal_time_set_preempted()
4142 kvm_is_error_hva(ghc->hva) || !ghc->memslot)) in kvm_steal_time_set_preempted()
4145 st = (struct kvm_steal_time __user *)ghc->hva; in kvm_steal_time_set_preempted()
4146 BUILD_BUG_ON(sizeof(st->preempted) != sizeof(preempted)); in kvm_steal_time_set_preempted()
4148 if (!copy_to_user_nofault(&st->preempted, &preempted, sizeof(preempted))) in kvm_steal_time_set_preempted()
4149 vcpu->arch.st.preempted = KVM_VCPU_PREEMPTED; in kvm_steal_time_set_preempted()
4151 mark_page_dirty_in_slot(ghc->memslot, gpa_to_gfn(ghc->gpa)); in kvm_steal_time_set_preempted()
4158 if (vcpu->preempted) { in kvm_arch_vcpu_put()
4159 vcpu->arch.preempted_in_kernel = !kvm_x86_ops.get_cpl(vcpu); in kvm_arch_vcpu_put()
4165 idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_put()
4167 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_put()
4171 vcpu->arch.last_host_tsc = rdtsc(); in kvm_arch_vcpu_put()
4183 if (vcpu->arch.apicv_active) in kvm_vcpu_ioctl_get_lapic()
4225 * instruction boundary and with no events half-injected. in kvm_vcpu_ready_for_interrupt_injection()
4230 !vcpu->arch.exception.pending); in kvm_vcpu_ready_for_interrupt_injection()
4236 if (irq->irq >= KVM_NR_INTERRUPTS) in kvm_vcpu_ioctl_interrupt()
4237 return -EINVAL; in kvm_vcpu_ioctl_interrupt()
4239 if (!irqchip_in_kernel(vcpu->kvm)) { in kvm_vcpu_ioctl_interrupt()
4240 kvm_queue_interrupt(vcpu, irq->irq, false); in kvm_vcpu_ioctl_interrupt()
4246 * With in-kernel LAPIC, we only use this to inject EXTINT, so in kvm_vcpu_ioctl_interrupt()
4247 * fail for in-kernel 8259. in kvm_vcpu_ioctl_interrupt()
4249 if (pic_in_kernel(vcpu->kvm)) in kvm_vcpu_ioctl_interrupt()
4250 return -ENXIO; in kvm_vcpu_ioctl_interrupt()
4252 if (vcpu->arch.pending_external_vector != -1) in kvm_vcpu_ioctl_interrupt()
4253 return -EEXIST; in kvm_vcpu_ioctl_interrupt()
4255 vcpu->arch.pending_external_vector = irq->irq; in kvm_vcpu_ioctl_interrupt()
4277 if (tac->flags) in vcpu_ioctl_tpr_access_reporting()
4278 return -EINVAL; in vcpu_ioctl_tpr_access_reporting()
4279 vcpu->arch.tpr_access_reporting = !!tac->enabled; in vcpu_ioctl_tpr_access_reporting()
4289 r = -EINVAL; in kvm_vcpu_ioctl_x86_setup_mce()
4295 vcpu->arch.mcg_cap = mcg_cap; in kvm_vcpu_ioctl_x86_setup_mce()
4298 vcpu->arch.mcg_ctl = ~(u64)0; in kvm_vcpu_ioctl_x86_setup_mce()
4301 vcpu->arch.mce_banks[bank*4] = ~(u64)0; in kvm_vcpu_ioctl_x86_setup_mce()
4311 u64 mcg_cap = vcpu->arch.mcg_cap; in kvm_vcpu_ioctl_x86_set_mce()
4313 u64 *banks = vcpu->arch.mce_banks; in kvm_vcpu_ioctl_x86_set_mce()
4315 if (mce->bank >= bank_num || !(mce->status & MCI_STATUS_VAL)) in kvm_vcpu_ioctl_x86_set_mce()
4316 return -EINVAL; in kvm_vcpu_ioctl_x86_set_mce()
4321 if ((mce->status & MCI_STATUS_UC) && (mcg_cap & MCG_CTL_P) && in kvm_vcpu_ioctl_x86_set_mce()
4322 vcpu->arch.mcg_ctl != ~(u64)0) in kvm_vcpu_ioctl_x86_set_mce()
4324 banks += 4 * mce->bank; in kvm_vcpu_ioctl_x86_set_mce()
4329 if ((mce->status & MCI_STATUS_UC) && banks[0] != ~(u64)0) in kvm_vcpu_ioctl_x86_set_mce()
4331 if (mce->status & MCI_STATUS_UC) { in kvm_vcpu_ioctl_x86_set_mce()
4332 if ((vcpu->arch.mcg_status & MCG_STATUS_MCIP) || in kvm_vcpu_ioctl_x86_set_mce()
4338 mce->status |= MCI_STATUS_OVER; in kvm_vcpu_ioctl_x86_set_mce()
4339 banks[2] = mce->addr; in kvm_vcpu_ioctl_x86_set_mce()
4340 banks[3] = mce->misc; in kvm_vcpu_ioctl_x86_set_mce()
4341 vcpu->arch.mcg_status = mce->mcg_status; in kvm_vcpu_ioctl_x86_set_mce()
4342 banks[1] = mce->status; in kvm_vcpu_ioctl_x86_set_mce()
4347 mce->status |= MCI_STATUS_OVER; in kvm_vcpu_ioctl_x86_set_mce()
4348 banks[2] = mce->addr; in kvm_vcpu_ioctl_x86_set_mce()
4349 banks[3] = mce->misc; in kvm_vcpu_ioctl_x86_set_mce()
4350 banks[1] = mce->status; in kvm_vcpu_ioctl_x86_set_mce()
4368 * modified under nVMX). Unless the per-VM capability, in kvm_vcpu_ioctl_x86_get_vcpu_events()
4375 if (!vcpu->kvm->arch.exception_payload_enabled && in kvm_vcpu_ioctl_x86_get_vcpu_events()
4376 vcpu->arch.exception.pending && vcpu->arch.exception.has_payload) in kvm_vcpu_ioctl_x86_get_vcpu_events()
4385 if (kvm_exception_is_soft(vcpu->arch.exception.nr)) { in kvm_vcpu_ioctl_x86_get_vcpu_events()
4386 events->exception.injected = 0; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4387 events->exception.pending = 0; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4389 events->exception.injected = vcpu->arch.exception.injected; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4390 events->exception.pending = vcpu->arch.exception.pending; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4396 if (!vcpu->kvm->arch.exception_payload_enabled) in kvm_vcpu_ioctl_x86_get_vcpu_events()
4397 events->exception.injected |= in kvm_vcpu_ioctl_x86_get_vcpu_events()
4398 vcpu->arch.exception.pending; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4400 events->exception.nr = vcpu->arch.exception.nr; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4401 events->exception.has_error_code = vcpu->arch.exception.has_error_code; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4402 events->exception.error_code = vcpu->arch.exception.error_code; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4403 events->exception_has_payload = vcpu->arch.exception.has_payload; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4404 events->exception_payload = vcpu->arch.exception.payload; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4406 events->interrupt.injected = in kvm_vcpu_ioctl_x86_get_vcpu_events()
4407 vcpu->arch.interrupt.injected && !vcpu->arch.interrupt.soft; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4408 events->interrupt.nr = vcpu->arch.interrupt.nr; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4409 events->interrupt.soft = 0; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4410 events->interrupt.shadow = kvm_x86_ops.get_interrupt_shadow(vcpu); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4412 events->nmi.injected = vcpu->arch.nmi_injected; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4413 events->nmi.pending = vcpu->arch.nmi_pending != 0; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4414 events->nmi.masked = kvm_x86_ops.get_nmi_mask(vcpu); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4415 events->nmi.pad = 0; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4417 events->sipi_vector = 0; /* never valid when reporting to user space */ in kvm_vcpu_ioctl_x86_get_vcpu_events()
4419 events->smi.smm = is_smm(vcpu); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4420 events->smi.pending = vcpu->arch.smi_pending; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4421 events->smi.smm_inside_nmi = in kvm_vcpu_ioctl_x86_get_vcpu_events()
4422 !!(vcpu->arch.hflags & HF_SMM_INSIDE_NMI_MASK); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4423 events->smi.latched_init = kvm_lapic_latched_init(vcpu); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4425 events->flags = (KVM_VCPUEVENT_VALID_NMI_PENDING in kvm_vcpu_ioctl_x86_get_vcpu_events()
4428 if (vcpu->kvm->arch.exception_payload_enabled) in kvm_vcpu_ioctl_x86_get_vcpu_events()
4429 events->flags |= KVM_VCPUEVENT_VALID_PAYLOAD; in kvm_vcpu_ioctl_x86_get_vcpu_events()
4431 memset(&events->reserved, 0, sizeof(events->reserved)); in kvm_vcpu_ioctl_x86_get_vcpu_events()
4439 if (events->flags & ~(KVM_VCPUEVENT_VALID_NMI_PENDING in kvm_vcpu_ioctl_x86_set_vcpu_events()
4444 return -EINVAL; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4446 if (events->flags & KVM_VCPUEVENT_VALID_PAYLOAD) { in kvm_vcpu_ioctl_x86_set_vcpu_events()
4447 if (!vcpu->kvm->arch.exception_payload_enabled) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4448 return -EINVAL; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4449 if (events->exception.pending) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4450 events->exception.injected = 0; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4452 events->exception_has_payload = 0; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4454 events->exception.pending = 0; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4455 events->exception_has_payload = 0; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4458 if ((events->exception.injected || events->exception.pending) && in kvm_vcpu_ioctl_x86_set_vcpu_events()
4459 (events->exception.nr > 31 || events->exception.nr == NMI_VECTOR)) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4460 return -EINVAL; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4463 if (events->flags & KVM_VCPUEVENT_VALID_SMM && in kvm_vcpu_ioctl_x86_set_vcpu_events()
4464 (events->smi.smm || events->smi.pending) && in kvm_vcpu_ioctl_x86_set_vcpu_events()
4465 vcpu->arch.mp_state == KVM_MP_STATE_INIT_RECEIVED) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4466 return -EINVAL; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4469 vcpu->arch.exception.injected = events->exception.injected; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4470 vcpu->arch.exception.pending = events->exception.pending; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4471 vcpu->arch.exception.nr = events->exception.nr; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4472 vcpu->arch.exception.has_error_code = events->exception.has_error_code; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4473 vcpu->arch.exception.error_code = events->exception.error_code; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4474 vcpu->arch.exception.has_payload = events->exception_has_payload; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4475 vcpu->arch.exception.payload = events->exception_payload; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4477 vcpu->arch.interrupt.injected = events->interrupt.injected; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4478 vcpu->arch.interrupt.nr = events->interrupt.nr; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4479 vcpu->arch.interrupt.soft = events->interrupt.soft; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4480 if (events->flags & KVM_VCPUEVENT_VALID_SHADOW) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4482 events->interrupt.shadow); in kvm_vcpu_ioctl_x86_set_vcpu_events()
4484 vcpu->arch.nmi_injected = events->nmi.injected; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4485 if (events->flags & KVM_VCPUEVENT_VALID_NMI_PENDING) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4486 vcpu->arch.nmi_pending = events->nmi.pending; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4487 kvm_x86_ops.set_nmi_mask(vcpu, events->nmi.masked); in kvm_vcpu_ioctl_x86_set_vcpu_events()
4489 if (events->flags & KVM_VCPUEVENT_VALID_SIPI_VECTOR && in kvm_vcpu_ioctl_x86_set_vcpu_events()
4491 vcpu->arch.apic->sipi_vector = events->sipi_vector; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4493 if (events->flags & KVM_VCPUEVENT_VALID_SMM) { in kvm_vcpu_ioctl_x86_set_vcpu_events()
4494 if (!!(vcpu->arch.hflags & HF_SMM_MASK) != events->smi.smm) { in kvm_vcpu_ioctl_x86_set_vcpu_events()
4495 if (events->smi.smm) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4496 vcpu->arch.hflags |= HF_SMM_MASK; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4498 vcpu->arch.hflags &= ~HF_SMM_MASK; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4500 kvm_x86_ops.nested_ops->leave_nested(vcpu); in kvm_vcpu_ioctl_x86_set_vcpu_events()
4504 vcpu->arch.smi_pending = events->smi.pending; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4506 if (events->smi.smm) { in kvm_vcpu_ioctl_x86_set_vcpu_events()
4507 if (events->smi.smm_inside_nmi) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4508 vcpu->arch.hflags |= HF_SMM_INSIDE_NMI_MASK; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4510 vcpu->arch.hflags &= ~HF_SMM_INSIDE_NMI_MASK; in kvm_vcpu_ioctl_x86_set_vcpu_events()
4514 if (events->smi.latched_init) in kvm_vcpu_ioctl_x86_set_vcpu_events()
4515 set_bit(KVM_APIC_INIT, &vcpu->arch.apic->pending_events); in kvm_vcpu_ioctl_x86_set_vcpu_events()
4517 clear_bit(KVM_APIC_INIT, &vcpu->arch.apic->pending_events); in kvm_vcpu_ioctl_x86_set_vcpu_events()
4532 memcpy(dbgregs->db, vcpu->arch.db, sizeof(vcpu->arch.db)); in kvm_vcpu_ioctl_x86_get_debugregs()
4534 dbgregs->dr6 = val; in kvm_vcpu_ioctl_x86_get_debugregs()
4535 dbgregs->dr7 = vcpu->arch.dr7; in kvm_vcpu_ioctl_x86_get_debugregs()
4541 if (dbgregs->flags) in kvm_vcpu_ioctl_x86_set_debugregs()
4542 return -EINVAL; in kvm_vcpu_ioctl_x86_set_debugregs()
4544 if (dbgregs->dr6 & ~0xffffffffull) in kvm_vcpu_ioctl_x86_set_debugregs()
4545 return -EINVAL; in kvm_vcpu_ioctl_x86_set_debugregs()
4546 if (dbgregs->dr7 & ~0xffffffffull) in kvm_vcpu_ioctl_x86_set_debugregs()
4547 return -EINVAL; in kvm_vcpu_ioctl_x86_set_debugregs()
4549 memcpy(vcpu->arch.db, dbgregs->db, sizeof(vcpu->arch.db)); in kvm_vcpu_ioctl_x86_set_debugregs()
4551 vcpu->arch.dr6 = dbgregs->dr6; in kvm_vcpu_ioctl_x86_set_debugregs()
4552 vcpu->arch.dr7 = dbgregs->dr7; in kvm_vcpu_ioctl_x86_set_debugregs()
4562 struct xregs_state *xsave = &vcpu->arch.guest_fpu->state.xsave; in fill_xsave()
4563 u64 xstate_bv = xsave->header.xfeatures; in fill_xsave()
4573 xstate_bv &= vcpu->arch.guest_supported_xcr0 | XFEATURE_MASK_FPSSE; in fill_xsave()
4578 * non-compacted offset. in fill_xsave()
4582 u64 xfeature_mask = valid & -valid; in fill_xsave()
4583 int xfeature_nr = fls64(xfeature_mask) - 1; in fill_xsave()
4591 memcpy(dest + offset, &vcpu->arch.pkru, in fill_xsave()
4592 sizeof(vcpu->arch.pkru)); in fill_xsave()
4598 valid -= xfeature_mask; in fill_xsave()
4604 struct xregs_state *xsave = &vcpu->arch.guest_fpu->state.xsave; in load_xsave()
4615 xsave->header.xfeatures = xstate_bv; in load_xsave()
4617 xsave->header.xcomp_bv = host_xcr0 | XSTATE_COMPACTION_ENABLED; in load_xsave()
4620 * Copy each region from the non-compacted offset to the in load_xsave()
4625 u64 xfeature_mask = valid & -valid; in load_xsave()
4626 int xfeature_nr = fls64(xfeature_mask) - 1; in load_xsave()
4634 memcpy(&vcpu->arch.pkru, src + offset, in load_xsave()
4635 sizeof(vcpu->arch.pkru)); in load_xsave()
4640 valid -= xfeature_mask; in load_xsave()
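
fill_xsave()/load_xsave() above walk the valid-feature mask one bit at a time: valid & -valid isolates the lowest set bit, and fls64() - 1 turns that single-bit mask into an xfeature number so the matching state region can be copied between compacted and non-compacted layouts. The idiom, extracted as a sketch (with the GCC builtin standing in for fls64()):

    static void for_each_xfeature(unsigned long long valid)
    {
            while (valid) {
                    unsigned long long mask = valid & -valid; /* lowest bit */
                    int xfeature_nr = 63 - __builtin_clzll(mask);

                    /* ... copy the region for xfeature_nr ... */
                    valid -= mask;
            }
    }
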
4649 fill_xsave((u8 *) guest_xsave->region, vcpu); in kvm_vcpu_ioctl_x86_get_xsave()
4651 memcpy(guest_xsave->region, in kvm_vcpu_ioctl_x86_get_xsave()
4652 &vcpu->arch.guest_fpu->state.fxsave, in kvm_vcpu_ioctl_x86_get_xsave()
4654 *(u64 *)&guest_xsave->region[XSAVE_HDR_OFFSET / sizeof(u32)] = in kvm_vcpu_ioctl_x86_get_xsave()
4665 *(u64 *)&guest_xsave->region[XSAVE_HDR_OFFSET / sizeof(u32)]; in kvm_vcpu_ioctl_x86_set_xsave()
4666 u32 mxcsr = *(u32 *)&guest_xsave->region[XSAVE_MXCSR_OFFSET / sizeof(u32)]; in kvm_vcpu_ioctl_x86_set_xsave()
4675 return -EINVAL; in kvm_vcpu_ioctl_x86_set_xsave()
4676 load_xsave(vcpu, (u8 *)guest_xsave->region); in kvm_vcpu_ioctl_x86_set_xsave()
4680 return -EINVAL; in kvm_vcpu_ioctl_x86_set_xsave()
4681 memcpy(&vcpu->arch.guest_fpu->state.fxsave, in kvm_vcpu_ioctl_x86_set_xsave()
4682 guest_xsave->region, sizeof(struct fxregs_state)); in kvm_vcpu_ioctl_x86_set_xsave()
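fill_xsave()/load_xsave() translate between the kernel's compacted xsave image and the non-compacted layout exposed through KVM_GET_XSAVE / KVM_SET_XSAVE, which is what lets the blob move between hosts with different XSAVE-compaction support. A hedged sketch of the usual save/restore round trip (copy_guest_xsave() is hypothetical; both fds assumed open):

#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: round-trip the guest FPU/XSAVE image, e.g. for checkpointing. */
static int copy_guest_xsave(int src_vcpu_fd, int dst_vcpu_fd)
{
	struct kvm_xsave xs;	/* 4 KiB non-compacted XSAVE area */

	if (ioctl(src_vcpu_fd, KVM_GET_XSAVE, &xs) < 0)
		return -1;
	return ioctl(dst_vcpu_fd, KVM_SET_XSAVE, &xs);
}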
4691 guest_xcrs->nr_xcrs = 0; in kvm_vcpu_ioctl_x86_get_xcrs()
4695 guest_xcrs->nr_xcrs = 1; in kvm_vcpu_ioctl_x86_get_xcrs()
4696 guest_xcrs->flags = 0; in kvm_vcpu_ioctl_x86_get_xcrs()
4697 guest_xcrs->xcrs[0].xcr = XCR_XFEATURE_ENABLED_MASK; in kvm_vcpu_ioctl_x86_get_xcrs()
4698 guest_xcrs->xcrs[0].value = vcpu->arch.xcr0; in kvm_vcpu_ioctl_x86_get_xcrs()
4707 return -EINVAL; in kvm_vcpu_ioctl_x86_set_xcrs()
4709 if (guest_xcrs->nr_xcrs > KVM_MAX_XCRS || guest_xcrs->flags) in kvm_vcpu_ioctl_x86_set_xcrs()
4710 return -EINVAL; in kvm_vcpu_ioctl_x86_set_xcrs()
4712 for (i = 0; i < guest_xcrs->nr_xcrs; i++) in kvm_vcpu_ioctl_x86_set_xcrs()
4714 if (guest_xcrs->xcrs[i].xcr == XCR_XFEATURE_ENABLED_MASK) { in kvm_vcpu_ioctl_x86_set_xcrs()
4716 guest_xcrs->xcrs[i].value); in kvm_vcpu_ioctl_x86_set_xcrs()
4720 r = -EINVAL; in kvm_vcpu_ioctl_x86_set_xcrs()
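Only XCR0 (XCR_XFEATURE_ENABLED_MASK) can be set through this path, and the underlying __kvm_set_xcr() still refuses feature bits the guest's CPUID does not advertise. A sketch of setting it from userspace, assuming vcpu_fd is open and the struct kvm_xcrs layout from the UAPI header:

#include <string.h>
#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: enable x87 + SSE + AVX state in guest XCR0. */
static int enable_avx_xcr0(int vcpu_fd)
{
	struct kvm_xcrs xcrs;

	memset(&xcrs, 0, sizeof(xcrs));	/* flags must stay zero */
	xcrs.nr_xcrs = 1;
	xcrs.xcrs[0].xcr = 0;		/* XCR_XFEATURE_ENABLED_MASK */
	xcrs.xcrs[0].value = 0x7;	/* x87 | SSE | AVX */
	return ioctl(vcpu_fd, KVM_SET_XCRS, &xcrs);
}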
4732 if (!vcpu->arch.pv_time_enabled) in kvm_set_guest_paused()
4733 return -EINVAL; in kvm_set_guest_paused()
4734 vcpu->arch.pvclock_set_guest_stopped_request = true; in kvm_set_guest_paused()
4746 if (cap->flags) in kvm_vcpu_ioctl_enable_cap()
4747 return -EINVAL; in kvm_vcpu_ioctl_enable_cap()
4749 switch (cap->cap) { in kvm_vcpu_ioctl_enable_cap()
4751 if (cap->args[0]) in kvm_vcpu_ioctl_enable_cap()
4752 return -EINVAL; in kvm_vcpu_ioctl_enable_cap()
4756 if (!irqchip_in_kernel(vcpu->kvm)) in kvm_vcpu_ioctl_enable_cap()
4757 return -EINVAL; in kvm_vcpu_ioctl_enable_cap()
4758 return kvm_hv_activate_synic(vcpu, cap->cap == in kvm_vcpu_ioctl_enable_cap()
4761 if (!kvm_x86_ops.nested_ops->enable_evmcs) in kvm_vcpu_ioctl_enable_cap()
4762 return -ENOTTY; in kvm_vcpu_ioctl_enable_cap()
4763 r = kvm_x86_ops.nested_ops->enable_evmcs(vcpu, &vmcs_version); in kvm_vcpu_ioctl_enable_cap()
4765 user_ptr = (void __user *)(uintptr_t)cap->args[0]; in kvm_vcpu_ioctl_enable_cap()
4768 r = -EFAULT; in kvm_vcpu_ioctl_enable_cap()
4773 return -ENOTTY; in kvm_vcpu_ioctl_enable_cap()
4778 vcpu->arch.pv_cpuid.enforce = cap->args[0]; in kvm_vcpu_ioctl_enable_cap()
4779 if (vcpu->arch.pv_cpuid.enforce) in kvm_vcpu_ioctl_enable_cap()
4785 return -EINVAL; in kvm_vcpu_ioctl_enable_cap()
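This is the per-vCPU KVM_ENABLE_CAP path; cap->flags must be zero for every capability. For example, turning on PV-feature CPUID enforcement (cap name as in the UAPI headers of this era; sketch only, vcpu_fd assumed open):

#include <string.h>
#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: have KVM filter PV CPUID features the VMM didn't enable. */
static int enforce_pv_cpuid(int vcpu_fd)
{
	struct kvm_enable_cap cap;

	memset(&cap, 0, sizeof(cap));
	cap.cap = KVM_CAP_ENFORCE_PV_FEATURE_CPUID;
	cap.args[0] = 1;
	return ioctl(vcpu_fd, KVM_ENABLE_CAP, &cap);
}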
4792 struct kvm_vcpu *vcpu = filp->private_data; in kvm_arch_vcpu_ioctl()
4807 r = -EINVAL; in kvm_arch_vcpu_ioctl()
4813 r = -ENOMEM; in kvm_arch_vcpu_ioctl()
4819 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4826 r = -EINVAL; in kvm_arch_vcpu_ioctl()
4841 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4859 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4862 r = kvm_vcpu_ioctl_set_cpuid(vcpu, &cpuid, cpuid_arg->entries); in kvm_arch_vcpu_ioctl()
4869 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4873 cpuid_arg->entries); in kvm_arch_vcpu_ioctl()
4880 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4884 cpuid_arg->entries); in kvm_arch_vcpu_ioctl()
4887 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4894 int idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_ioctl()
4896 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_ioctl()
4900 int idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_ioctl()
4902 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_ioctl()
4908 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4914 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4924 r = -EINVAL; in kvm_arch_vcpu_ioctl()
4927 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4930 idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_ioctl()
4932 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_ioctl()
4938 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4947 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4958 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4967 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4979 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4989 r = -EFAULT; in kvm_arch_vcpu_ioctl()
4999 r = -ENOMEM; in kvm_arch_vcpu_ioctl()
5005 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5023 r = -ENOMEM; in kvm_arch_vcpu_ioctl()
5029 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5049 r = -EINVAL; in kvm_arch_vcpu_ioctl()
5065 r = vcpu->arch.virtual_tsc_khz; in kvm_arch_vcpu_ioctl()
5075 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5085 r = -EINVAL; in kvm_arch_vcpu_ioctl()
5086 if (!kvm_x86_ops.nested_ops->get_state) in kvm_arch_vcpu_ioctl()
5089 BUILD_BUG_ON(sizeof(user_data_size) != sizeof(user_kvm_nested_state->size)); in kvm_arch_vcpu_ioctl()
5090 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5091 if (get_user(user_data_size, &user_kvm_nested_state->size)) in kvm_arch_vcpu_ioctl()
5094 r = kvm_x86_ops.nested_ops->get_state(vcpu, user_kvm_nested_state, in kvm_arch_vcpu_ioctl()
5100 if (put_user(r, &user_kvm_nested_state->size)) in kvm_arch_vcpu_ioctl()
5101 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5103 r = -E2BIG; in kvm_arch_vcpu_ioctl()
5115 r = -EINVAL; in kvm_arch_vcpu_ioctl()
5116 if (!kvm_x86_ops.nested_ops->set_state) in kvm_arch_vcpu_ioctl()
5119 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5123 r = -EINVAL; in kvm_arch_vcpu_ioctl()
5138 idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_ioctl()
5139 r = kvm_x86_ops.nested_ops->set_state(vcpu, user_kvm_nested_state, &kvm_state); in kvm_arch_vcpu_ioctl()
5140 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_ioctl()
5147 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5152 cpuid_arg->entries); in kvm_arch_vcpu_ioctl()
5156 r = -EFAULT; in kvm_arch_vcpu_ioctl()
5163 r = -EINVAL; in kvm_arch_vcpu_ioctl()
5181 if (addr > (unsigned int)(-3 * PAGE_SIZE)) in kvm_vm_ioctl_set_tss_addr()
5182 return -EINVAL; in kvm_vm_ioctl_set_tss_addr()
5197 return -EINVAL; in kvm_vm_ioctl_set_nr_mmu_pages()
5199 mutex_lock(&kvm->slots_lock); in kvm_vm_ioctl_set_nr_mmu_pages()
5202 kvm->arch.n_requested_mmu_pages = kvm_nr_mmu_pages; in kvm_vm_ioctl_set_nr_mmu_pages()
5204 mutex_unlock(&kvm->slots_lock); in kvm_vm_ioctl_set_nr_mmu_pages()
5210 return kvm->arch.n_max_mmu_pages; in kvm_vm_ioctl_get_nr_mmu_pages()
5215 struct kvm_pic *pic = kvm->arch.vpic; in kvm_vm_ioctl_get_irqchip()
5219 switch (chip->chip_id) { in kvm_vm_ioctl_get_irqchip()
5221 memcpy(&chip->chip.pic, &pic->pics[0], in kvm_vm_ioctl_get_irqchip()
5225 memcpy(&chip->chip.pic, &pic->pics[1], in kvm_vm_ioctl_get_irqchip()
5229 kvm_get_ioapic(kvm, &chip->chip.ioapic); in kvm_vm_ioctl_get_irqchip()
5232 r = -EINVAL; in kvm_vm_ioctl_get_irqchip()
5240 struct kvm_pic *pic = kvm->arch.vpic; in kvm_vm_ioctl_set_irqchip()
5244 switch (chip->chip_id) { in kvm_vm_ioctl_set_irqchip()
5246 spin_lock(&pic->lock); in kvm_vm_ioctl_set_irqchip()
5247 memcpy(&pic->pics[0], &chip->chip.pic, in kvm_vm_ioctl_set_irqchip()
5249 spin_unlock(&pic->lock); in kvm_vm_ioctl_set_irqchip()
5252 spin_lock(&pic->lock); in kvm_vm_ioctl_set_irqchip()
5253 memcpy(&pic->pics[1], &chip->chip.pic, in kvm_vm_ioctl_set_irqchip()
5255 spin_unlock(&pic->lock); in kvm_vm_ioctl_set_irqchip()
5258 kvm_set_ioapic(kvm, &chip->chip.ioapic); in kvm_vm_ioctl_set_irqchip()
5261 r = -EINVAL; in kvm_vm_ioctl_set_irqchip()
5264 kvm_pic_update_irq(pic); in kvm_vm_ioctl_set_irqchip()
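These two handlers implement KVM_GET_IRQCHIP / KVM_SET_IRQCHIP, copying kvm_pic_state or kvm_ioapic_state in and out under pic->lock. A hedged userspace sketch that masks every pin on the master PIC (mask_pic_master() is hypothetical; vm_fd must already have an in-kernel irqchip from KVM_CREATE_IRQCHIP):

#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: read-modify-write the master PIC's interrupt mask register. */
static int mask_pic_master(int vm_fd)
{
	struct kvm_irqchip chip;

	chip.chip_id = KVM_IRQCHIP_PIC_MASTER;	/* 0; 1 = slave, 2 = IOAPIC */
	if (ioctl(vm_fd, KVM_GET_IRQCHIP, &chip) < 0)
		return -1;
	chip.chip.pic.imr = 0xff;		/* mask all eight pins */
	return ioctl(vm_fd, KVM_SET_IRQCHIP, &chip);
}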
5270 struct kvm_kpit_state *kps = &kvm->arch.vpit->pit_state; in kvm_vm_ioctl_get_pit()
5272 BUILD_BUG_ON(sizeof(*ps) != sizeof(kps->channels)); in kvm_vm_ioctl_get_pit()
5274 mutex_lock(&kps->lock); in kvm_vm_ioctl_get_pit()
5275 memcpy(ps, &kps->channels, sizeof(*ps)); in kvm_vm_ioctl_get_pit()
5276 mutex_unlock(&kps->lock); in kvm_vm_ioctl_get_pit()
5283 struct kvm_pit *pit = kvm->arch.vpit; in kvm_vm_ioctl_set_pit()
5285 mutex_lock(&pit->pit_state.lock); in kvm_vm_ioctl_set_pit()
5286 memcpy(&pit->pit_state.channels, ps, sizeof(*ps)); in kvm_vm_ioctl_set_pit()
5288 kvm_pit_load_count(pit, i, ps->channels[i].count, 0); in kvm_vm_ioctl_set_pit()
5289 mutex_unlock(&pit->pit_state.lock); in kvm_vm_ioctl_set_pit()
5295 mutex_lock(&kvm->arch.vpit->pit_state.lock); in kvm_vm_ioctl_get_pit2()
5296 memcpy(ps->channels, &kvm->arch.vpit->pit_state.channels, in kvm_vm_ioctl_get_pit2()
5297 sizeof(ps->channels)); in kvm_vm_ioctl_get_pit2()
5298 ps->flags = kvm->arch.vpit->pit_state.flags; in kvm_vm_ioctl_get_pit2()
5299 mutex_unlock(&kvm->arch.vpit->pit_state.lock); in kvm_vm_ioctl_get_pit2()
5300 memset(&ps->reserved, 0, sizeof(ps->reserved)); in kvm_vm_ioctl_get_pit2()
5309 struct kvm_pit *pit = kvm->arch.vpit; in kvm_vm_ioctl_set_pit2()
5311 mutex_lock(&pit->pit_state.lock); in kvm_vm_ioctl_set_pit2()
5312 prev_legacy = pit->pit_state.flags & KVM_PIT_FLAGS_HPET_LEGACY; in kvm_vm_ioctl_set_pit2()
5313 cur_legacy = ps->flags & KVM_PIT_FLAGS_HPET_LEGACY; in kvm_vm_ioctl_set_pit2()
5316 memcpy(&pit->pit_state.channels, &ps->channels, in kvm_vm_ioctl_set_pit2()
5317 sizeof(pit->pit_state.channels)); in kvm_vm_ioctl_set_pit2()
5318 pit->pit_state.flags = ps->flags; in kvm_vm_ioctl_set_pit2()
5320 kvm_pit_load_count(pit, i, pit->pit_state.channels[i].count, in kvm_vm_ioctl_set_pit2()
5322 mutex_unlock(&pit->pit_state.lock); in kvm_vm_ioctl_set_pit2()
5329 struct kvm_pit *pit = kvm->arch.vpit; in kvm_vm_ioctl_reinject()
5331 /* pit->pit_state.lock was overloaded to prevent userspace from getting in kvm_vm_ioctl_reinject()
5335 mutex_lock(&pit->pit_state.lock); in kvm_vm_ioctl_reinject()
5336 kvm_pit_set_reinject(pit, control->pit_reinject); in kvm_vm_ioctl_reinject()
5337 mutex_unlock(&pit->pit_state.lock); in kvm_vm_ioctl_reinject()
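kvm_vm_ioctl_reinject() is the backend of KVM_REINJECT_CONTROL; modern VMMs normally turn reinjection off and let lost ticks be handled by the guest. A sketch, assuming vm_fd already has an in-kernel PIT:

#include <string.h>
#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: disable PIT tick reinjection for this VM. */
static int pit_no_reinject(int vm_fd)
{
	struct kvm_reinject_control ctl;

	memset(&ctl, 0, sizeof(ctl));
	ctl.pit_reinject = 0;
	return ioctl(vm_fd, KVM_REINJECT_CONTROL, &ctl);
}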
5345 * Flush potentially hardware-cached dirty pages to dirty_bitmap. in kvm_arch_sync_dirty_log()
5355 return -ENXIO; in kvm_vm_ioctl_irq_line()
5357 irq_event->status = kvm_set_irq(kvm, KVM_USERSPACE_IRQ_SOURCE_ID, in kvm_vm_ioctl_irq_line()
5358 irq_event->irq, irq_event->level, in kvm_vm_ioctl_irq_line()
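kvm_vm_ioctl_irq_line() services KVM_IRQ_LINE (and KVM_IRQ_LINE_STATUS) and fails with -ENXIO when there is no in-kernel irqchip. Asserting and then deasserting a GSI from userspace might look like this sketch (pulse_gsi() is hypothetical):

#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: edge-trigger a GSI on the in-kernel irqchip. */
static int pulse_gsi(int vm_fd, unsigned int gsi)
{
	struct kvm_irq_level irq = { .irq = gsi, .level = 1 };

	if (ioctl(vm_fd, KVM_IRQ_LINE, &irq) < 0)
		return -1;
	irq.level = 0;
	return ioctl(vm_fd, KVM_IRQ_LINE, &irq);
}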
5368 if (cap->flags) in kvm_vm_ioctl_enable_cap()
5369 return -EINVAL; in kvm_vm_ioctl_enable_cap()
5371 switch (cap->cap) { in kvm_vm_ioctl_enable_cap()
5373 kvm->arch.disabled_quirks = cap->args[0]; in kvm_vm_ioctl_enable_cap()
5377 mutex_lock(&kvm->lock); in kvm_vm_ioctl_enable_cap()
5378 r = -EINVAL; in kvm_vm_ioctl_enable_cap()
5379 if (cap->args[0] > MAX_NR_RESERVED_IOAPIC_PINS) in kvm_vm_ioctl_enable_cap()
5381 r = -EEXIST; in kvm_vm_ioctl_enable_cap()
5384 if (kvm->created_vcpus) in kvm_vm_ioctl_enable_cap()
5391 kvm->arch.irqchip_mode = KVM_IRQCHIP_SPLIT; in kvm_vm_ioctl_enable_cap()
5392 kvm->arch.nr_reserved_ioapic_pins = cap->args[0]; in kvm_vm_ioctl_enable_cap()
5395 mutex_unlock(&kvm->lock); in kvm_vm_ioctl_enable_cap()
5399 r = -EINVAL; in kvm_vm_ioctl_enable_cap()
5400 if (cap->args[0] & ~KVM_X2APIC_API_VALID_FLAGS) in kvm_vm_ioctl_enable_cap()
5403 if (cap->args[0] & KVM_X2APIC_API_USE_32BIT_IDS) in kvm_vm_ioctl_enable_cap()
5404 kvm->arch.x2apic_format = true; in kvm_vm_ioctl_enable_cap()
5405 if (cap->args[0] & KVM_X2APIC_API_DISABLE_BROADCAST_QUIRK) in kvm_vm_ioctl_enable_cap()
5406 kvm->arch.x2apic_broadcast_quirk_disabled = true; in kvm_vm_ioctl_enable_cap()
5411 r = -EINVAL; in kvm_vm_ioctl_enable_cap()
5412 if (cap->args[0] & ~KVM_X86_DISABLE_VALID_EXITS) in kvm_vm_ioctl_enable_cap()
5415 if ((cap->args[0] & KVM_X86_DISABLE_EXITS_MWAIT) && in kvm_vm_ioctl_enable_cap()
5417 kvm->arch.mwait_in_guest = true; in kvm_vm_ioctl_enable_cap()
5418 if (cap->args[0] & KVM_X86_DISABLE_EXITS_HLT) in kvm_vm_ioctl_enable_cap()
5419 kvm->arch.hlt_in_guest = true; in kvm_vm_ioctl_enable_cap()
5420 if (cap->args[0] & KVM_X86_DISABLE_EXITS_PAUSE) in kvm_vm_ioctl_enable_cap()
5421 kvm->arch.pause_in_guest = true; in kvm_vm_ioctl_enable_cap()
5422 if (cap->args[0] & KVM_X86_DISABLE_EXITS_CSTATE) in kvm_vm_ioctl_enable_cap()
5423 kvm->arch.cstate_in_guest = true; in kvm_vm_ioctl_enable_cap()
5427 kvm->arch.guest_can_read_msr_platform_info = cap->args[0]; in kvm_vm_ioctl_enable_cap()
5431 kvm->arch.exception_payload_enabled = cap->args[0]; in kvm_vm_ioctl_enable_cap()
5435 r = -EINVAL; in kvm_vm_ioctl_enable_cap()
5436 if (cap->args[0] & ~(KVM_MSR_EXIT_REASON_INVAL | in kvm_vm_ioctl_enable_cap()
5440 kvm->arch.user_space_msr_mask = cap->args[0]; in kvm_vm_ioctl_enable_cap()
5444 r = -EINVAL; in kvm_vm_ioctl_enable_cap()
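The VM-level KVM_ENABLE_CAP cases above configure per-VM behavior; KVM_CAP_X86_DISABLE_EXITS, for instance, keeps HLT/PAUSE/MWAIT/C-state transitions inside the guest instead of exiting. A sketch of enabling two of them (best done before vCPUs are created; vm_fd assumed open):

#include <string.h>
#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: let the guest execute HLT and PAUSE without a VM exit. */
static int disable_hlt_pause_exits(int vm_fd)
{
	struct kvm_enable_cap cap;

	memset(&cap, 0, sizeof(cap));
	cap.cap = KVM_CAP_X86_DISABLE_EXITS;
	cap.args[0] = KVM_X86_DISABLE_EXITS_HLT | KVM_X86_DISABLE_EXITS_PAUSE;
	return ioctl(vm_fd, KVM_ENABLE_CAP, &cap);
}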
5458 msr_filter->default_allow = default_allow; in kvm_alloc_msr_filter()
5469 for (i = 0; i < msr_filter->count; i++) in kvm_free_msr_filter()
5470 kfree(msr_filter->ranges[i].bitmap); in kvm_free_msr_filter()
5483 if (!user_range->nmsrs) in kvm_add_msr_filter()
5486 bitmap_size = BITS_TO_LONGS(user_range->nmsrs) * sizeof(long); in kvm_add_msr_filter()
5488 return -EINVAL; in kvm_add_msr_filter()
5490 bitmap = memdup_user((__user u8*)user_range->bitmap, bitmap_size); in kvm_add_msr_filter()
5495 .flags = user_range->flags, in kvm_add_msr_filter()
5496 .base = user_range->base, in kvm_add_msr_filter()
5497 .nmsrs = user_range->nmsrs, in kvm_add_msr_filter()
5502 r = -EINVAL; in kvm_add_msr_filter()
5507 r = -EINVAL; in kvm_add_msr_filter()
5512 msr_filter->ranges[msr_filter->count] = range; in kvm_add_msr_filter()
5513 msr_filter->count++; in kvm_add_msr_filter()
5530 if (filter->flags & ~KVM_MSR_FILTER_DEFAULT_DENY) in kvm_vm_ioctl_set_msr_filter()
5531 return -EINVAL; in kvm_vm_ioctl_set_msr_filter()
5533 for (i = 0; i < ARRAY_SIZE(filter->ranges); i++) in kvm_vm_ioctl_set_msr_filter()
5534 empty &= !filter->ranges[i].nmsrs; in kvm_vm_ioctl_set_msr_filter()
5536 default_allow = !(filter->flags & KVM_MSR_FILTER_DEFAULT_DENY); in kvm_vm_ioctl_set_msr_filter()
5538 return -EINVAL; in kvm_vm_ioctl_set_msr_filter()
5542 return -ENOMEM; in kvm_vm_ioctl_set_msr_filter()
5544 for (i = 0; i < ARRAY_SIZE(filter->ranges); i++) { in kvm_vm_ioctl_set_msr_filter()
5545 r = kvm_add_msr_filter(new_filter, &filter->ranges[i]); in kvm_vm_ioctl_set_msr_filter()
5552 mutex_lock(&kvm->lock); in kvm_vm_ioctl_set_msr_filter()
5554 /* The per-VM filter is protected by kvm->lock... */ in kvm_vm_ioctl_set_msr_filter()
5555 old_filter = srcu_dereference_check(kvm->arch.msr_filter, &kvm->srcu, 1); in kvm_vm_ioctl_set_msr_filter()
5557 rcu_assign_pointer(kvm->arch.msr_filter, new_filter); in kvm_vm_ioctl_set_msr_filter()
5558 synchronize_srcu(&kvm->srcu); in kvm_vm_ioctl_set_msr_filter()
5563 mutex_unlock(&kvm->lock); in kvm_vm_ioctl_set_msr_filter()
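The new filter is published with rcu_assign_pointer() and readers are flushed with synchronize_srcu() before the old filter is freed, so MSR intercepts never see a half-installed filter. Building a deny-by-default filter from userspace could look like this sketch (the range chosen is purely illustrative; requires a kernel with KVM_X86_SET_MSR_FILTER):

#include <string.h>
#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: deny all MSRs except the x2APIC range. */
static int install_msr_filter(int vm_fd)
{
	static __u8 bitmap[0x100 / 8];		/* one bit per MSR in the range */
	struct kvm_msr_filter filter;

	memset(bitmap, 0xff, sizeof(bitmap));	/* 1 = allow */
	memset(&filter, 0, sizeof(filter));
	filter.flags = KVM_MSR_FILTER_DEFAULT_DENY;
	filter.ranges[0].flags = KVM_MSR_FILTER_READ | KVM_MSR_FILTER_WRITE;
	filter.ranges[0].base = 0x800;		/* x2APIC MSRs */
	filter.ranges[0].nmsrs = 0x100;
	filter.ranges[0].bitmap = bitmap;
	return ioctl(vm_fd, KVM_X86_SET_MSR_FILTER, &filter);
}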
5573 __u32 base;
5588 struct kvm *kvm = filp->private_data; in kvm_arch_vm_compat_ioctl()
5589 long r = -ENOTTY; in kvm_arch_vm_compat_ioctl()
5600 return -EFAULT; in kvm_arch_vm_compat_ioctl()
5608 .flags = cr->flags, in kvm_arch_vm_compat_ioctl()
5609 .nmsrs = cr->nmsrs, in kvm_arch_vm_compat_ioctl()
5610 .base = cr->base, in kvm_arch_vm_compat_ioctl()
5611 .bitmap = (__u8 *)(ulong)cr->bitmap, in kvm_arch_vm_compat_ioctl()
5627 struct kvm *kvm = filp->private_data; in kvm_arch_vm_ioctl()
5629 int r = -ENOTTY; in kvm_arch_vm_ioctl()
5631 * This union makes it completely explicit to gcc-3.x in kvm_arch_vm_ioctl()
5648 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5649 r = -EINVAL; in kvm_arch_vm_ioctl()
5650 if (kvm->created_vcpus) in kvm_arch_vm_ioctl()
5652 r = -EFAULT; in kvm_arch_vm_ioctl()
5657 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5667 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5669 r = -EEXIST; in kvm_arch_vm_ioctl()
5673 r = -EINVAL; in kvm_arch_vm_ioctl()
5674 if (kvm->created_vcpus) in kvm_arch_vm_ioctl()
5693 /* Write kvm->irq_routing before enabling irqchip_in_kernel. */ in kvm_arch_vm_ioctl()
5695 kvm->arch.irqchip_mode = KVM_IRQCHIP_KERNEL; in kvm_arch_vm_ioctl()
5697 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5704 r = -EFAULT; in kvm_arch_vm_ioctl()
5709 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5710 r = -EEXIST; in kvm_arch_vm_ioctl()
5711 if (kvm->arch.vpit) in kvm_arch_vm_ioctl()
5713 r = -ENOMEM; in kvm_arch_vm_ioctl()
5714 kvm->arch.vpit = kvm_create_pit(kvm, u.pit_config.flags); in kvm_arch_vm_ioctl()
5715 if (kvm->arch.vpit) in kvm_arch_vm_ioctl()
5718 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5721 /* 0: PIC master, 1: PIC slave, 2: IOAPIC */ in kvm_arch_vm_ioctl()
5730 r = -ENXIO; in kvm_arch_vm_ioctl()
5736 r = -EFAULT; in kvm_arch_vm_ioctl()
5745 /* 0: PIC master, 1: PIC slave, 2: IOAPIC */ in kvm_arch_vm_ioctl()
5754 r = -ENXIO; in kvm_arch_vm_ioctl()
5763 r = -EFAULT; in kvm_arch_vm_ioctl()
5766 r = -ENXIO; in kvm_arch_vm_ioctl()
5767 if (!kvm->arch.vpit) in kvm_arch_vm_ioctl()
5772 r = -EFAULT; in kvm_arch_vm_ioctl()
5779 r = -EFAULT; in kvm_arch_vm_ioctl()
5782 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5783 r = -ENXIO; in kvm_arch_vm_ioctl()
5784 if (!kvm->arch.vpit) in kvm_arch_vm_ioctl()
5788 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5792 r = -ENXIO; in kvm_arch_vm_ioctl()
5793 if (!kvm->arch.vpit) in kvm_arch_vm_ioctl()
5798 r = -EFAULT; in kvm_arch_vm_ioctl()
5805 r = -EFAULT; in kvm_arch_vm_ioctl()
5808 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5809 r = -ENXIO; in kvm_arch_vm_ioctl()
5810 if (!kvm->arch.vpit) in kvm_arch_vm_ioctl()
5814 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5819 r = -EFAULT; in kvm_arch_vm_ioctl()
5822 r = -ENXIO; in kvm_arch_vm_ioctl()
5823 if (!kvm->arch.vpit) in kvm_arch_vm_ioctl()
5830 mutex_lock(&kvm->lock); in kvm_arch_vm_ioctl()
5831 if (kvm->created_vcpus) in kvm_arch_vm_ioctl()
5832 r = -EBUSY; in kvm_arch_vm_ioctl()
5834 kvm->arch.bsp_vcpu_id = arg; in kvm_arch_vm_ioctl()
5835 mutex_unlock(&kvm->lock); in kvm_arch_vm_ioctl()
5839 r = -EFAULT; in kvm_arch_vm_ioctl()
5842 r = -EINVAL; in kvm_arch_vm_ioctl()
5845 memcpy(&kvm->arch.xen_hvm_config, &xhc, sizeof(xhc)); in kvm_arch_vm_ioctl()
5853 r = -EFAULT; in kvm_arch_vm_ioctl()
5857 r = -EINVAL; in kvm_arch_vm_ioctl()
5869 kvm->arch.kvmclock_offset += user_ns.clock - now_ns; in kvm_arch_vm_ioctl()
5879 user_ns.flags = kvm->arch.use_master_clock ? KVM_CLOCK_TSC_STABLE : 0; in kvm_arch_vm_ioctl()
5882 r = -EFAULT; in kvm_arch_vm_ioctl()
5889 r = -ENOTTY; in kvm_arch_vm_ioctl()
5897 r = -EFAULT; in kvm_arch_vm_ioctl()
5901 r = -ENOTTY; in kvm_arch_vm_ioctl()
5909 r = -EFAULT; in kvm_arch_vm_ioctl()
5913 r = -ENOTTY; in kvm_arch_vm_ioctl()
5921 r = -EFAULT; in kvm_arch_vm_ioctl()
5935 return -EFAULT; in kvm_arch_vm_ioctl()
5941 r = -ENOTTY; in kvm_arch_vm_ioctl()
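Among the cases above, KVM_GET_CLOCK / KVM_SET_CLOCK move the kvmclock offset, which is how live migration keeps guest time monotonic. A sketch of the save/restore pair (note that in this tree KVM_CLOCK_TSC_STABLE is reported by GET but any nonzero flags are rejected by SET):

#include <sys/ioctl.h>
#include <linux/kvm.h>

/* Hypothetical: carry kvmclock from a source VM to its migration target. */
static int migrate_clock(int src_vm_fd, int dst_vm_fd)
{
	struct kvm_clock_data clock;

	if (ioctl(src_vm_fd, KVM_GET_CLOCK, &clock) < 0)
		return -1;
	clock.flags = 0;	/* KVM_CLOCK_TSC_STABLE is output-only */
	return ioctl(dst_vm_fd, KVM_SET_CLOCK, &clock);
}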
6002 msrs_to_save_all[i] - MSR_IA32_RTIT_ADDR0_A >= in kvm_init_msr_list()
6007 if (msrs_to_save_all[i] - MSR_ARCH_PERFMON_PERFCTR0 >= in kvm_init_msr_list()
6012 if (msrs_to_save_all[i] - MSR_ARCH_PERFMON_EVENTSEL0 >= in kvm_init_msr_list()
6050 !kvm_iodevice_write(vcpu, &vcpu->arch.apic->dev, addr, n, v)) in vcpu_mmio_write()
6055 len -= n; in vcpu_mmio_write()
6070 !kvm_iodevice_read(vcpu, &vcpu->arch.apic->dev, in vcpu_mmio_read()
6077 len -= n; in vcpu_mmio_read()
6103 /* NPT walks are always user-walks */ in translate_nested_gpa()
6105 t_gpa = vcpu->arch.mmu->gva_to_gpa(vcpu, gpa, access, exception); in translate_nested_gpa()
6114 return vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, access, exception); in kvm_mmu_gva_to_gpa_read()
6122 return vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, access, exception); in kvm_mmu_gva_to_gpa_fetch()
6130 return vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, access, exception); in kvm_mmu_gva_to_gpa_write()
6137 return vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, 0, exception); in kvm_mmu_gva_to_gpa_system()
6148 gpa_t gpa = vcpu->arch.walk_mmu->gva_to_gpa(vcpu, addr, access, in kvm_read_guest_virt_helper()
6150 unsigned offset = addr & (PAGE_SIZE-1); in kvm_read_guest_virt_helper()
6151 unsigned toread = min(bytes, (unsigned)PAGE_SIZE - offset); in kvm_read_guest_virt_helper()
6163 bytes -= toread; in kvm_read_guest_virt_helper()
6182 gpa_t gpa = vcpu->arch.walk_mmu->gva_to_gpa(vcpu, addr, access|PFERR_FETCH_MASK, in kvm_fetch_guest_virt()
6187 offset = addr & (PAGE_SIZE-1); in kvm_fetch_guest_virt()
6189 bytes = (unsigned)PAGE_SIZE - offset; in kvm_fetch_guest_virt()
6246 gpa_t gpa = vcpu->arch.walk_mmu->gva_to_gpa(vcpu, addr, in kvm_write_guest_virt_helper()
6249 unsigned offset = addr & (PAGE_SIZE-1); in kvm_write_guest_virt_helper()
6250 unsigned towrite = min(bytes, (unsigned)PAGE_SIZE - offset); in kvm_write_guest_virt_helper()
6261 bytes -= towrite; in kvm_write_guest_virt_helper()
6287 vcpu->arch.l1tf_flush_l1d = true; in kvm_write_guest_virt_system()
6344 && !permission_fault(vcpu, vcpu->arch.walk_mmu, in vcpu_mmio_gva_to_gpa()
6345 vcpu->arch.mmio_access, 0, access)) { in vcpu_mmio_gva_to_gpa()
6346 *gpa = vcpu->arch.mmio_gfn << PAGE_SHIFT | in vcpu_mmio_gva_to_gpa()
6347 (gva & (PAGE_SIZE - 1)); in vcpu_mmio_gva_to_gpa()
6352 *gpa = vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, access, exception); in vcpu_mmio_gva_to_gpa()
6355 return -1; in vcpu_mmio_gva_to_gpa()
6386 if (vcpu->mmio_read_completed) { in read_prepare()
6388 vcpu->mmio_fragments[0].gpa, val); in read_prepare()
6389 vcpu->mmio_read_completed = 0; in read_prepare()
6424 struct kvm_mmio_fragment *frag = &vcpu->mmio_fragments[0]; in write_exit_mmio()
6426 memcpy(vcpu->run->mmio.data, frag->data, min(8u, frag->len)); in write_exit_mmio()
6452 bool write = ops->write; in emulator_read_write_onepage()
6454 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in emulator_read_write_onepage()
6463 if (ctxt->gpa_available && emulator_can_use_gpa(ctxt) && in emulator_read_write_onepage()
6464 (addr & ~PAGE_MASK) == (ctxt->gpa_val & ~PAGE_MASK)) { in emulator_read_write_onepage()
6465 gpa = ctxt->gpa_val; in emulator_read_write_onepage()
6473 if (!ret && ops->read_write_emulate(vcpu, gpa, val, bytes)) in emulator_read_write_onepage()
6479 handled = ops->read_write_mmio(vcpu, gpa, bytes, val); in emulator_read_write_onepage()
6484 bytes -= handled; in emulator_read_write_onepage()
6487 WARN_ON(vcpu->mmio_nr_fragments >= KVM_MAX_MMIO_FRAGMENTS); in emulator_read_write_onepage()
6488 frag = &vcpu->mmio_fragments[vcpu->mmio_nr_fragments++]; in emulator_read_write_onepage()
6489 frag->gpa = gpa; in emulator_read_write_onepage()
6490 frag->data = val; in emulator_read_write_onepage()
6491 frag->len = bytes; in emulator_read_write_onepage()
6505 if (ops->read_write_prepare && in emulator_read_write()
6506 ops->read_write_prepare(vcpu, val, bytes)) in emulator_read_write()
6509 vcpu->mmio_nr_fragments = 0; in emulator_read_write()
6512 if (((addr + bytes - 1) ^ addr) & PAGE_MASK) { in emulator_read_write()
6515 now = -addr & ~PAGE_MASK; in emulator_read_write()
6522 if (ctxt->mode != X86EMUL_MODE_PROT64) in emulator_read_write()
6525 bytes -= now; in emulator_read_write()
6533 if (!vcpu->mmio_nr_fragments) in emulator_read_write()
6536 gpa = vcpu->mmio_fragments[0].gpa; in emulator_read_write()
6538 vcpu->mmio_needed = 1; in emulator_read_write()
6539 vcpu->mmio_cur_fragment = 0; in emulator_read_write()
6541 vcpu->run->mmio.len = min(8u, vcpu->mmio_fragments[0].len); in emulator_read_write()
6542 vcpu->run->mmio.is_write = vcpu->mmio_is_write = ops->write; in emulator_read_write()
6543 vcpu->run->exit_reason = KVM_EXIT_MMIO; in emulator_read_write()
6544 vcpu->run->mmio.phys_addr = gpa; in emulator_read_write()
6546 return ops->read_write_exit_mmio(vcpu, gpa, val, bytes); in emulator_read_write()
6594 if (bytes > 8 || (bytes & (bytes - 1))) in emulator_cmpxchg_emulated()
6608 page_line_mask = ~(cache_line_size() - 1); in emulator_cmpxchg_emulated()
6612 if (((gpa + bytes - 1) & page_line_mask) != (gpa & page_line_mask)) in emulator_cmpxchg_emulated()
6656 for (i = 0; i < vcpu->arch.pio.count; i++) { in kernel_pio()
6657 if (vcpu->arch.pio.in) in kernel_pio()
6658 r = kvm_io_bus_read(vcpu, KVM_PIO_BUS, vcpu->arch.pio.port, in kernel_pio()
6659 vcpu->arch.pio.size, pd); in kernel_pio()
6662 vcpu->arch.pio.port, vcpu->arch.pio.size, in kernel_pio()
6666 pd += vcpu->arch.pio.size; in kernel_pio()
6675 vcpu->arch.pio.port = port; in emulator_pio_in_out()
6676 vcpu->arch.pio.in = in; in emulator_pio_in_out()
6677 vcpu->arch.pio.count = count; in emulator_pio_in_out()
6678 vcpu->arch.pio.size = size; in emulator_pio_in_out()
6680 if (!kernel_pio(vcpu, vcpu->arch.pio_data)) { in emulator_pio_in_out()
6681 vcpu->arch.pio.count = 0; in emulator_pio_in_out()
6685 vcpu->run->exit_reason = KVM_EXIT_IO; in emulator_pio_in_out()
6686 vcpu->run->io.direction = in ? KVM_EXIT_IO_IN : KVM_EXIT_IO_OUT; in emulator_pio_in_out()
6687 vcpu->run->io.size = size; in emulator_pio_in_out()
6688 vcpu->run->io.data_offset = KVM_PIO_PAGE_OFFSET * PAGE_SIZE; in emulator_pio_in_out()
6689 vcpu->run->io.count = count; in emulator_pio_in_out()
6690 vcpu->run->io.port = port; in emulator_pio_in_out()
6700 if (vcpu->arch.pio.count) in emulator_pio_in()
6703 memset(vcpu->arch.pio_data, 0, size * count); in emulator_pio_in()
6708 memcpy(val, vcpu->arch.pio_data, size * count); in emulator_pio_in()
6709 trace_kvm_pio(KVM_PIO_IN, port, size, count, vcpu->arch.pio_data); in emulator_pio_in()
6710 vcpu->arch.pio.count = 0; in emulator_pio_in()
6729 memcpy(vcpu->arch.pio_data, val, size * count); in emulator_pio_out()
6730 trace_kvm_pio(KVM_PIO_OUT, port, size, count, vcpu->arch.pio_data); in emulator_pio_out()
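When kernel_pio() finds no in-kernel device, emulator_pio_in_out() parks the transfer state in vcpu->arch.pio and exits to userspace with KVM_EXIT_IO; the payload lives inside the shared kvm_run page at io.data_offset. A userspace completion sketch, assuming one-byte ports (handle_inb()/handle_outb() are hypothetical device-model hooks; real code would also switch on run->io.size):

#include <stdint.h>
#include <linux/kvm.h>

extern uint8_t handle_inb(uint16_t port);		/* hypothetical */
extern void handle_outb(uint16_t port, uint8_t val);	/* hypothetical */

/* Complete one KVM_EXIT_IO; run points at the mmap()ed kvm_run page. */
static void handle_pio_exit(struct kvm_run *run)
{
	uint8_t *data = (uint8_t *)run + run->io.data_offset;
	uint32_t i;

	for (i = 0; i < run->io.count; i++, data += run->io.size) {
		if (run->io.direction == KVM_EXIT_IO_IN)
			*data = handle_inb(run->io.port);	/* fill for the guest */
		else
			handle_outb(run->io.port, *data);	/* consume guest write */
	}
}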
6759 cpumask_set_cpu(cpu, vcpu->arch.wbinvd_dirty_mask); in kvm_emulate_wbinvd_noskip()
6760 smp_call_function_many(vcpu->arch.wbinvd_dirty_mask, in kvm_emulate_wbinvd_noskip()
6763 cpumask_clear(vcpu->arch.wbinvd_dirty_mask); in kvm_emulate_wbinvd_noskip()
6798 return (curr_cr & ~((1ULL << 32) - 1)) | new_val; in mk_cr_64()
6811 value = vcpu->arch.cr2; in emulator_get_cr()
6840 vcpu->arch.cr2 = val; in emulator_set_cr()
6853 res = -1; in emulator_set_cr()
6909 set_desc_base(desc, (unsigned long)var.base); in emulator_get_segment()
6912 *base3 = var.base >> 32; in emulator_get_segment()
6914 desc->type = var.type; in emulator_get_segment()
6915 desc->s = var.s; in emulator_get_segment()
6916 desc->dpl = var.dpl; in emulator_get_segment()
6917 desc->p = var.present; in emulator_get_segment()
6918 desc->avl = var.avl; in emulator_get_segment()
6919 desc->l = var.l; in emulator_get_segment()
6920 desc->d = var.db; in emulator_get_segment()
6921 desc->g = var.g; in emulator_get_segment()
6934 var.base = get_desc_base(desc); in emulator_set_segment()
6936 var.base |= ((u64)base3) << 32; in emulator_set_segment()
6939 if (desc->g) in emulator_set_segment()
6941 var.type = desc->type; in emulator_set_segment()
6942 var.dpl = desc->dpl; in emulator_set_segment()
6943 var.db = desc->d; in emulator_set_segment()
6944 var.s = desc->s; in emulator_set_segment()
6945 var.l = desc->l; in emulator_set_segment()
6946 var.g = desc->g; in emulator_set_segment()
6947 var.avl = desc->avl; in emulator_set_segment()
6948 var.present = desc->p; in emulator_set_segment()
6992 return vcpu->arch.smbase; in emulator_get_smbase()
6999 vcpu->arch.smbase = smbase; in emulator_set_smbase()
7016 emul_to_vcpu(ctxt)->arch.halt_request = 1; in emulator_halt()
7024 &ctxt->exception); in emulator_intercept()
7071 return emul_to_vcpu(ctxt)->arch.hflags; in emulator_get_hflags()
7078 vcpu->arch.hflags = emul_flags; in emulator_set_hflags()
7167 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in inject_emulated_exception()
7168 if (ctxt->exception.vector == PF_VECTOR) in inject_emulated_exception()
7169 return kvm_inject_emulated_page_fault(vcpu, &ctxt->exception); in inject_emulated_exception()
7171 if (ctxt->exception.error_code_valid) in inject_emulated_exception()
7172 kvm_queue_exception_e(vcpu, ctxt->exception.vector, in inject_emulated_exception()
7173 ctxt->exception.error_code); in inject_emulated_exception()
7175 kvm_queue_exception(vcpu, ctxt->exception.vector); in inject_emulated_exception()
7189 ctxt->vcpu = vcpu; in alloc_emulate_ctxt()
7190 ctxt->ops = &emulate_ops; in alloc_emulate_ctxt()
7191 vcpu->arch.emulate_ctxt = ctxt; in alloc_emulate_ctxt()
7198 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in init_emulate_ctxt()
7203 ctxt->gpa_available = false; in init_emulate_ctxt()
7204 ctxt->eflags = kvm_get_rflags(vcpu); in init_emulate_ctxt()
7205 ctxt->tf = (ctxt->eflags & X86_EFLAGS_TF) != 0; in init_emulate_ctxt()
7207 ctxt->eip = kvm_rip_read(vcpu); in init_emulate_ctxt()
7208 ctxt->mode = (!is_protmode(vcpu)) ? X86EMUL_MODE_REAL : in init_emulate_ctxt()
7209 (ctxt->eflags & X86_EFLAGS_VM) ? X86EMUL_MODE_VM86 : in init_emulate_ctxt()
7217 ctxt->interruptibility = 0; in init_emulate_ctxt()
7218 ctxt->have_exception = false; in init_emulate_ctxt()
7219 ctxt->exception.vector = -1; in init_emulate_ctxt()
7220 ctxt->perm_ok = false; in init_emulate_ctxt()
7223 vcpu->arch.emulate_regs_need_sync_from_vcpu = false; in init_emulate_ctxt()
7228 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in kvm_inject_realmode_interrupt()
7233 ctxt->op_bytes = 2; in kvm_inject_realmode_interrupt()
7234 ctxt->ad_bytes = 2; in kvm_inject_realmode_interrupt()
7235 ctxt->_eip = ctxt->eip + inc_eip; in kvm_inject_realmode_interrupt()
7241 ctxt->eip = ctxt->_eip; in kvm_inject_realmode_interrupt()
7242 kvm_rip_write(vcpu, ctxt->eip); in kvm_inject_realmode_interrupt()
7243 kvm_set_rflags(vcpu, ctxt->eflags); in kvm_inject_realmode_interrupt()
7250 ++vcpu->stat.insn_emulation_fail; in handle_emulation_failure()
7259 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; in handle_emulation_failure()
7260 vcpu->run->internal.suberror = KVM_INTERNAL_ERROR_EMULATION; in handle_emulation_failure()
7261 vcpu->run->internal.ndata = 0; in handle_emulation_failure()
7268 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; in handle_emulation_failure()
7269 vcpu->run->internal.suberror = KVM_INTERNAL_ERROR_EMULATION; in handle_emulation_failure()
7270 vcpu->run->internal.ndata = 0; in handle_emulation_failure()
7291 if (!vcpu->arch.mmu->direct_map) { in reexecute_instruction()
7309 * retry instruction -> write #PF -> emulation fail -> retry in reexecute_instruction()
7310 * instruction -> ... in reexecute_instruction()
7312 pfn = gfn_to_pfn(vcpu->kvm, gpa_to_gfn(gpa)); in reexecute_instruction()
7323 /* The instructions are well-emulated on direct mmu. */ in reexecute_instruction()
7324 if (vcpu->arch.mmu->direct_map) { in reexecute_instruction()
7327 spin_lock(&vcpu->kvm->mmu_lock); in reexecute_instruction()
7328 indirect_shadow_pages = vcpu->kvm->arch.indirect_shadow_pages; in reexecute_instruction()
7329 spin_unlock(&vcpu->kvm->mmu_lock); in reexecute_instruction()
7332 kvm_mmu_unprotect_page(vcpu->kvm, gpa_to_gfn(gpa)); in reexecute_instruction()
7339 * and it failed try to unshadow page and re-enter the in reexecute_instruction()
7342 kvm_mmu_unprotect_page(vcpu->kvm, gpa_to_gfn(gpa)); in reexecute_instruction()
7358 last_retry_eip = vcpu->arch.last_retry_eip; in retry_instruction()
7359 last_retry_addr = vcpu->arch.last_retry_addr; in retry_instruction()
7362 * If the emulation is caused by #PF and it is non-page_table in retry_instruction()
7363 * writing instruction, it means the VM-EXIT is caused by shadow in retry_instruction()
7367 * Note: if the guest uses a non-page-table modifying instruction in retry_instruction()
7374 vcpu->arch.last_retry_eip = vcpu->arch.last_retry_addr = 0; in retry_instruction()
7386 if (ctxt->eip == last_retry_eip && last_retry_addr == cr2_or_gpa) in retry_instruction()
7389 vcpu->arch.last_retry_eip = ctxt->eip; in retry_instruction()
7390 vcpu->arch.last_retry_addr = cr2_or_gpa; in retry_instruction()
7392 if (!vcpu->arch.mmu->direct_map) in retry_instruction()
7395 kvm_mmu_unprotect_page(vcpu->kvm, gpa_to_gfn(gpa)); in retry_instruction()
7405 if (!(vcpu->arch.hflags & HF_SMM_MASK)) { in kvm_smm_changed()
7407 trace_kvm_enter_smm(vcpu->vcpu_id, vcpu->arch.smbase, false); in kvm_smm_changed()
7433 struct kvm_run *kvm_run = vcpu->run; in kvm_vcpu_do_singlestep()
7435 if (vcpu->guest_debug & KVM_GUESTDBG_SINGLESTEP) { in kvm_vcpu_do_singlestep()
7436 kvm_run->debug.arch.dr6 = DR6_BS | DR6_FIXED_1 | DR6_RTM; in kvm_vcpu_do_singlestep()
7437 kvm_run->debug.arch.pc = kvm_get_linear_rip(vcpu); in kvm_vcpu_do_singlestep()
7438 kvm_run->debug.arch.exception = DB_VECTOR; in kvm_vcpu_do_singlestep()
7439 kvm_run->exit_reason = KVM_EXIT_DEBUG; in kvm_vcpu_do_singlestep()
7471 if (unlikely(vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP) && in kvm_vcpu_check_code_breakpoint()
7472 (vcpu->arch.guest_debug_dr7 & DR7_BP_EN_MASK)) { in kvm_vcpu_check_code_breakpoint()
7473 struct kvm_run *kvm_run = vcpu->run; in kvm_vcpu_check_code_breakpoint()
7476 vcpu->arch.guest_debug_dr7, in kvm_vcpu_check_code_breakpoint()
7477 vcpu->arch.eff_db); in kvm_vcpu_check_code_breakpoint()
7480 kvm_run->debug.arch.dr6 = dr6 | DR6_FIXED_1 | DR6_RTM; in kvm_vcpu_check_code_breakpoint()
7481 kvm_run->debug.arch.pc = eip; in kvm_vcpu_check_code_breakpoint()
7482 kvm_run->debug.arch.exception = DB_VECTOR; in kvm_vcpu_check_code_breakpoint()
7483 kvm_run->exit_reason = KVM_EXIT_DEBUG; in kvm_vcpu_check_code_breakpoint()
7489 if (unlikely(vcpu->arch.dr7 & DR7_BP_EN_MASK) && in kvm_vcpu_check_code_breakpoint()
7493 vcpu->arch.dr7, in kvm_vcpu_check_code_breakpoint()
7494 vcpu->arch.db); in kvm_vcpu_check_code_breakpoint()
7508 switch (ctxt->opcode_len) { in is_vmware_backdoor_opcode()
7510 switch (ctxt->b) { in is_vmware_backdoor_opcode()
7527 switch (ctxt->b) { in is_vmware_backdoor_opcode()
7540 * (and wrong) when emulating on an intercepted fault-like exception[*], as
7550 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in x86_decode_emulated_instruction()
7555 ctxt->ud = emulation_type & EMULTYPE_TRAP_UD; in x86_decode_emulated_instruction()
7560 ++vcpu->stat.insn_emulation; in x86_decode_emulated_instruction()
7570 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in x86_emulate_instruction()
7577 vcpu->arch.l1tf_flush_l1d = true; in x86_emulate_instruction()
7583 write_fault_to_spt = vcpu->arch.write_fault_to_shadow_pgtable; in x86_emulate_instruction()
7584 vcpu->arch.write_fault_to_shadow_pgtable = false; in x86_emulate_instruction()
7591 * are fault-like and are higher priority than any faults on in x86_emulate_instruction()
7611 if (ctxt->have_exception && in x86_emulate_instruction()
7614 * #UD should result in just EMULATION_FAILED, and trap-like in x86_emulate_instruction()
7617 WARN_ON_ONCE(ctxt->exception.vector == UD_VECTOR || in x86_emulate_instruction()
7618 exception_type(ctxt->exception.vector) == EXCPT_TRAP); in x86_emulate_instruction()
7635 * updating interruptibility state and injecting single-step #DBs. in x86_emulate_instruction()
7638 kvm_rip_write(vcpu, ctxt->_eip); in x86_emulate_instruction()
7639 if (ctxt->eflags & X86_EFLAGS_RF) in x86_emulate_instruction()
7640 kvm_set_rflags(vcpu, ctxt->eflags & ~X86_EFLAGS_RF); in x86_emulate_instruction()
7649 if (vcpu->arch.emulate_regs_need_sync_from_vcpu) { in x86_emulate_instruction()
7650 vcpu->arch.emulate_regs_need_sync_from_vcpu = false; in x86_emulate_instruction()
7657 ctxt->exception.address = cr2_or_gpa; in x86_emulate_instruction()
7660 if (vcpu->arch.mmu->direct_map) { in x86_emulate_instruction()
7661 ctxt->gpa_available = true; in x86_emulate_instruction()
7662 ctxt->gpa_val = cr2_or_gpa; in x86_emulate_instruction()
7666 ctxt->exception.address = 0; in x86_emulate_instruction()
7682 if (ctxt->have_exception) { in x86_emulate_instruction()
7686 } else if (vcpu->arch.pio.count) { in x86_emulate_instruction()
7687 if (!vcpu->arch.pio.in) { in x86_emulate_instruction()
7688 /* FIXME: return into emulator if single-stepping. */ in x86_emulate_instruction()
7689 vcpu->arch.pio.count = 0; in x86_emulate_instruction()
7692 vcpu->arch.complete_userspace_io = complete_emulated_pio; in x86_emulate_instruction()
7695 } else if (vcpu->mmio_needed) { in x86_emulate_instruction()
7696 ++vcpu->stat.mmio_exits; in x86_emulate_instruction()
7698 if (!vcpu->mmio_is_write) in x86_emulate_instruction()
7701 vcpu->arch.complete_userspace_io = complete_emulated_mmio; in x86_emulate_instruction()
7709 toggle_interruptibility(vcpu, ctxt->interruptibility); in x86_emulate_instruction()
7710 vcpu->arch.emulate_regs_need_sync_to_vcpu = false; in x86_emulate_instruction()
7713 * Note, EXCPT_DB is assumed to be fault-like as the emulator in x86_emulate_instruction()
7715 * of which are fault-like. in x86_emulate_instruction()
7717 if (!ctxt->have_exception || in x86_emulate_instruction()
7718 exception_type(ctxt->exception.vector) == EXCPT_TRAP) { in x86_emulate_instruction()
7719 kvm_rip_write(vcpu, ctxt->eip); in x86_emulate_instruction()
7720 if (r && (ctxt->tf || (vcpu->guest_debug & KVM_GUESTDBG_SINGLESTEP))) in x86_emulate_instruction()
7724 __kvm_set_rflags(vcpu, ctxt->eflags); in x86_emulate_instruction()
7733 if (unlikely((ctxt->eflags & ~rflags) & X86_EFLAGS_IF)) in x86_emulate_instruction()
7736 vcpu->arch.emulate_regs_need_sync_to_vcpu = true; in x86_emulate_instruction()
7756 vcpu->arch.pio.count = 0; in complete_fast_pio_out_port_0x7e()
7762 vcpu->arch.pio.count = 0; in complete_fast_pio_out()
7764 if (unlikely(!kvm_is_linear_rip(vcpu, vcpu->arch.pio.linear_rip))) in complete_fast_pio_out()
7784 kvm_check_has_quirk(vcpu->kvm, KVM_X86_QUIRK_OUT_7E_INC_RIP)) { in kvm_fast_pio_out()
7785 vcpu->arch.complete_userspace_io = in kvm_fast_pio_out()
7789 vcpu->arch.pio.linear_rip = kvm_get_linear_rip(vcpu); in kvm_fast_pio_out()
7790 vcpu->arch.complete_userspace_io = complete_fast_pio_out; in kvm_fast_pio_out()
7800 BUG_ON(vcpu->arch.pio.count != 1); in complete_fast_pio_in()
7802 if (unlikely(!kvm_is_linear_rip(vcpu, vcpu->arch.pio.linear_rip))) { in complete_fast_pio_in()
7803 vcpu->arch.pio.count = 0; in complete_fast_pio_in()
7808 val = (vcpu->arch.pio.size < 4) ? kvm_rax_read(vcpu) : 0; in complete_fast_pio_in()
7811 * Since vcpu->arch.pio.count == 1 let emulator_pio_in perform in complete_fast_pio_in()
7814 emulator_pio_in(vcpu, vcpu->arch.pio.size, vcpu->arch.pio.port, &val, 1); in complete_fast_pio_in()
7835 vcpu->arch.pio.linear_rip = kvm_get_linear_rip(vcpu); in kvm_fast_pio_in()
7836 vcpu->arch.complete_userspace_io = complete_fast_pio_in; in kvm_fast_pio_in()
7865 khz = freq->new; in tsc_khz_changed()
7886 /* TSC frequency always matches when on Hyper-V */ in kvm_hyperv_tsc_notifier()
7892 struct kvm_arch *ka = &kvm->arch; in kvm_hyperv_tsc_notifier()
7894 spin_lock(&ka->pvclock_gtod_sync_lock); in kvm_hyperv_tsc_notifier()
7904 spin_unlock(&ka->pvclock_gtod_sync_lock); in kvm_hyperv_tsc_notifier()
7960 if (vcpu->cpu != cpu) in __kvmclock_cpufreq_notifier()
7963 if (vcpu->cpu != raw_smp_processor_id()) in __kvmclock_cpufreq_notifier()
7969 if (freq->old < freq->new && send_ipi) { in __kvmclock_cpufreq_notifier()
7992 if (val == CPUFREQ_PRECHANGE && freq->old > freq->new) in kvmclock_cpufreq_notifier()
7994 if (val == CPUFREQ_POSTCHANGE && freq->old < freq->new) in kvmclock_cpufreq_notifier()
7997 for_each_cpu(cpu, freq->policy->cpus) in kvmclock_cpufreq_notifier()
8025 if (policy->cpuinfo.max_freq) in kvm_timer_init()
8026 max_tsc_khz = policy->cpuinfo.max_freq; in kvm_timer_init()
8073 (unsigned long *)&vcpu->arch.pmu.global_status); in kvm_handle_intel_pt_intr()
8129 if (!gtod_is_based_on_tsc(gtod->clock.vclock_mode) && in pvclock_gtod_notify()
8147 r = -EEXIST; in kvm_arch_init()
8151 if (!ops->cpu_has_kvm_support()) { in kvm_arch_init()
8153 r = -EOPNOTSUPP; in kvm_arch_init()
8156 if (ops->disabled_by_bios()) { in kvm_arch_init()
8158 r = -EOPNOTSUPP; in kvm_arch_init()
8169 r = -EOPNOTSUPP; in kvm_arch_init()
8173 r = -ENOMEM; in kvm_arch_init()
8203 if (ops->intel_pt_intr_in_guest && ops->intel_pt_intr_in_guest()) in kvm_arch_init()
8213 if (pi_inject_timer == -1) in kvm_arch_init()
8262 ++vcpu->stat.halt_exits; in kvm_vcpu_halt()
8264 vcpu->arch.mp_state = KVM_MP_STATE_HALTED; in kvm_vcpu_halt()
8267 vcpu->run->exit_reason = KVM_EXIT_HLT; in kvm_vcpu_halt()
8277 * TODO: we might be squashing a GUESTDBG_SINGLESTEP-triggered in kvm_emulate_halt()
8294 return -KVM_EOPNOTSUPP; in kvm_pv_clock_pairing()
8297 return -KVM_EOPNOTSUPP; in kvm_pv_clock_pairing()
8306 if (kvm_write_guest(vcpu->kvm, paddr, &clock_pairing, in kvm_pv_clock_pairing()
8308 ret = -KVM_EFAULT; in kvm_pv_clock_pairing()
8317 * @apicid - apicid of vcpu to be kicked.
8337 return (READ_ONCE(kvm->arch.apicv_inhibit_reasons) == 0); in kvm_apicv_activated()
8345 &kvm->arch.apicv_inhibit_reasons); in kvm_apicv_init()
8348 &kvm->arch.apicv_inhibit_reasons); in kvm_apicv_init()
8358 map = rcu_dereference(kvm->arch.apic_map); in kvm_sched_yield()
8360 if (likely(map) && dest_id <= map->max_apic_id && map->phys_map[dest_id]) in kvm_sched_yield()
8361 target = map->phys_map[dest_id]->vcpu; in kvm_sched_yield()
8365 if (target && READ_ONCE(target->ready)) in kvm_sched_yield()
8374 if (kvm_hv_hypercall_enabled(vcpu->kvm)) in kvm_emulate_hypercall()
8395 ret = -KVM_EPERM; in kvm_emulate_hypercall()
8399 ret = -KVM_ENOSYS; in kvm_emulate_hypercall()
8409 kvm_pv_kick_cpu_op(vcpu->kvm, a0, a1); in kvm_emulate_hypercall()
8410 kvm_sched_yield(vcpu->kvm, a1); in kvm_emulate_hypercall()
8422 ret = kvm_pv_send_ipi(vcpu->kvm, a0, a1, a2, a3, op_64_bit); in kvm_emulate_hypercall()
8428 kvm_sched_yield(vcpu->kvm, a0); in kvm_emulate_hypercall()
8432 ret = -KVM_ENOSYS; in kvm_emulate_hypercall()
8440 ++vcpu->stat.hypercalls; in kvm_emulate_hypercall()
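The guest side of this dispatcher is a VMCALL (VMMCALL on AMD) with the hypercall number in RAX and up to four arguments in RBX/RCX/RDX/RSI; CPL0 is required, or KVM returns -KVM_EPERM as checked above. A sketch of a one-argument wrapper as a guest kernel might write it for a VMX host:

#include <linux/kvm_para.h>	/* KVM_HC_* hypercall numbers */

/* Sketch: nr in RAX, first arg in RBX, result back in RAX. */
static inline long kvm_hypercall1(unsigned int nr, unsigned long a0)
{
	long ret;

	asm volatile("vmcall"
		     : "=a" (ret)
		     : "a" (nr), "b" (a0)
		     : "memory");
	return ret;
}

/* e.g. donate this vCPU's timeslice to the vCPU with a given APIC ID: */
/* kvm_hypercall1(KVM_HC_SCHED_YIELD, dest_apicid); */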
8454 &ctxt->exception); in emulator_fix_hypercall()
8459 return vcpu->run->request_interrupt_window && in dm_request_for_irq_injection()
8460 likely(!pic_in_kernel(vcpu->kvm)); in dm_request_for_irq_injection()
8465 struct kvm_run *kvm_run = vcpu->run; in post_kvm_run_save()
8467 kvm_run->if_flag = (kvm_get_rflags(vcpu) & X86_EFLAGS_IF) != 0; in post_kvm_run_save()
8468 kvm_run->flags = is_smm(vcpu) ? KVM_RUN_X86_SMM : 0; in post_kvm_run_save()
8469 kvm_run->cr8 = kvm_get_cr8(vcpu); in post_kvm_run_save()
8470 kvm_run->apic_base = kvm_get_apic_base(vcpu); in post_kvm_run_save()
8471 kvm_run->ready_for_interrupt_injection = in post_kvm_run_save()
8472 pic_in_kernel(vcpu->kvm) || in post_kvm_run_save()
8486 if (vcpu->arch.apicv_active) in update_cr8_intercept()
8489 if (!vcpu->arch.apic->vapic_addr) in update_cr8_intercept()
8492 max_irr = -1; in update_cr8_intercept()
8494 if (max_irr != -1) in update_cr8_intercept()
8504 trace_kvm_inj_exception(vcpu->arch.exception.nr, in kvm_inject_exception()
8505 vcpu->arch.exception.has_error_code, in kvm_inject_exception()
8506 vcpu->arch.exception.error_code, in kvm_inject_exception()
8507 vcpu->arch.exception.injected); in kvm_inject_exception()
8509 if (vcpu->arch.exception.error_code && !is_protmode(vcpu)) in kvm_inject_exception()
8510 vcpu->arch.exception.error_code = false; in kvm_inject_exception()
8521 if (vcpu->arch.exception.injected) { in inject_pending_event()
8529 * Trap-like exceptions, e.g. #DB, have higher priority than in inject_pending_event()
8532 * Fault-like exceptions, e.g. #GP and #PF, are the lowest in inject_pending_event()
8534 * execution, i.e. a pending fault-like exception means the in inject_pending_event()
8539 else if (!vcpu->arch.exception.pending) { in inject_pending_event()
8540 if (vcpu->arch.nmi_injected) { in inject_pending_event()
8543 } else if (vcpu->arch.interrupt.injected) { in inject_pending_event()
8549 WARN_ON_ONCE(vcpu->arch.exception.injected && in inject_pending_event()
8550 vcpu->arch.exception.pending); in inject_pending_event()
8554 * in order for caller to determine if it should require immediate-exit in inject_pending_event()
8559 r = kvm_x86_ops.nested_ops->check_events(vcpu); in inject_pending_event()
8565 if (vcpu->arch.exception.pending) { in inject_pending_event()
8567 * Fault-class exceptions, except #DBs, set RF=1 in the RFLAGS in inject_pending_event()
8568 * value pushed on the stack. Trap-like exception and all #DBs in inject_pending_event()
8569 * leave RF as-is (KVM follows Intel's behavior in this regard; in inject_pending_event()
8574 * fault-like. They do _not_ set RF, a la code breakpoints. in inject_pending_event()
8576 if (exception_type(vcpu->arch.exception.nr) == EXCPT_FAULT) in inject_pending_event()
8580 if (vcpu->arch.exception.nr == DB_VECTOR) { in inject_pending_event()
8582 if (vcpu->arch.dr7 & DR7_GD) { in inject_pending_event()
8583 vcpu->arch.dr7 &= ~DR7_GD; in inject_pending_event()
8590 vcpu->arch.exception.pending = false; in inject_pending_event()
8591 vcpu->arch.exception.injected = true; in inject_pending_event()
8598 * due to architectural conditions (e.g. IF=0) a window-open exit in inject_pending_event()
8599 * will re-request KVM_REQ_EVENT. Sometimes however an event is pending in inject_pending_event()
8605 * The kvm_x86_ops hooks communicate this by returning -EBUSY. in inject_pending_event()
8607 if (vcpu->arch.smi_pending) { in inject_pending_event()
8608 r = can_inject ? kvm_x86_ops.smi_allowed(vcpu, true) : -EBUSY; in inject_pending_event()
8612 vcpu->arch.smi_pending = false; in inject_pending_event()
8613 ++vcpu->arch.smi_count; in inject_pending_event()
8620 if (vcpu->arch.nmi_pending) { in inject_pending_event()
8621 r = can_inject ? kvm_x86_ops.nmi_allowed(vcpu, true) : -EBUSY; in inject_pending_event()
8625 --vcpu->arch.nmi_pending; in inject_pending_event()
8626 vcpu->arch.nmi_injected = true; in inject_pending_event()
8631 if (vcpu->arch.nmi_pending) in inject_pending_event()
8636 r = can_inject ? kvm_x86_ops.interrupt_allowed(vcpu, true) : -EBUSY; in inject_pending_event()
8649 kvm_x86_ops.nested_ops->hv_timer_pending && in inject_pending_event()
8650 kvm_x86_ops.nested_ops->hv_timer_pending(vcpu)) in inject_pending_event()
8653 WARN_ON(vcpu->arch.exception.pending); in inject_pending_event()
8670 if (kvm_x86_ops.get_nmi_mask(vcpu) || vcpu->arch.nmi_injected) in process_nmi()
8673 vcpu->arch.nmi_pending += atomic_xchg(&vcpu->arch.nmi_queued, 0); in process_nmi()
8674 vcpu->arch.nmi_pending = min(vcpu->arch.nmi_pending, limit); in process_nmi()
8681 flags |= seg->g << 23; in enter_smm_get_segment_flags()
8682 flags |= seg->db << 22; in enter_smm_get_segment_flags()
8683 flags |= seg->l << 21; in enter_smm_get_segment_flags()
8684 flags |= seg->avl << 20; in enter_smm_get_segment_flags()
8685 flags |= seg->present << 15; in enter_smm_get_segment_flags()
8686 flags |= seg->dpl << 13; in enter_smm_get_segment_flags()
8687 flags |= seg->s << 12; in enter_smm_get_segment_flags()
8688 flags |= seg->type << 8; in enter_smm_get_segment_flags()
8703 offset = 0x7f2c + (n - 3) * 12; in enter_smm_save_seg_32()
8705 put_smstate(u32, buf, offset + 8, seg.base); in enter_smm_save_seg_32()
8724 put_smstate(u64, buf, offset + 8, seg.base); in enter_smm_save_seg_64()
8750 put_smstate(u32, buf, 0x7f64, seg.base); in enter_smm_save_state_32()
8756 put_smstate(u32, buf, 0x7f80, seg.base); in enter_smm_save_state_32()
8775 put_smstate(u32, buf, 0x7ef8, vcpu->arch.smbase); in enter_smm_save_state_32()
8787 put_smstate(u64, buf, 0x7ff8 - i * 8, kvm_register_read(vcpu, i)); in enter_smm_save_state_64()
8801 put_smstate(u32, buf, 0x7f00, vcpu->arch.smbase); in enter_smm_save_state_64()
8806 put_smstate(u64, buf, 0x7ed0, vcpu->arch.efer); in enter_smm_save_state_64()
8812 put_smstate(u64, buf, 0x7e98, seg.base); in enter_smm_save_state_64()
8822 put_smstate(u64, buf, 0x7e78, seg.base); in enter_smm_save_state_64()
8840 trace_kvm_enter_smm(vcpu->vcpu_id, vcpu->arch.smbase, true); in enter_smm()
8850 * Give pre_enter_smm() a chance to make ISA-specific changes to the in enter_smm()
8852 * the SMM state-save area. in enter_smm()
8856 vcpu->arch.hflags |= HF_SMM_MASK; in enter_smm()
8857 kvm_vcpu_write_guest(vcpu, vcpu->arch.smbase + 0xfe00, buf, sizeof(buf)); in enter_smm()
8860 vcpu->arch.hflags |= HF_SMM_INSIDE_NMI_MASK; in enter_smm()
8867 cr0 = vcpu->arch.cr0 & ~(X86_CR0_PE | X86_CR0_EM | X86_CR0_TS | X86_CR0_PG); in enter_smm()
8869 vcpu->arch.cr0 = cr0; in enter_smm()
8879 cs.selector = (vcpu->arch.smbase >> 4) & 0xffff; in enter_smm()
8880 cs.base = vcpu->arch.smbase; in enter_smm()
8883 ds.base = 0; in enter_smm()
8915 vcpu->arch.smi_pending = true; in process_smi()
8942 vcpu->arch.apicv_active = kvm_apicv_activated(vcpu->kvm); in kvm_vcpu_update_apicv()
8951 * In particular, kvm_request_apicv_update() expects kvm->srcu not to be
8953 * synchronize_srcu(&kvm->srcu).
8964 old = READ_ONCE(kvm->arch.apicv_inhibit_reasons); in kvm_request_apicv_update()
8973 old = cmpxchg(&kvm->arch.apicv_inhibit_reasons, expected, new); in kvm_request_apicv_update()
9001 bitmap_zero(vcpu->arch.ioapic_handled_vectors, 256); in vcpu_scan_ioapic()
9003 if (irqchip_split(vcpu->kvm)) in vcpu_scan_ioapic()
9004 kvm_scan_ioapic_routes(vcpu, vcpu->arch.ioapic_handled_vectors); in vcpu_scan_ioapic()
9006 if (vcpu->arch.apicv_active) in vcpu_scan_ioapic()
9008 if (ioapic_in_kernel(vcpu->kvm)) in vcpu_scan_ioapic()
9009 kvm_ioapic_scan_entry(vcpu, vcpu->arch.ioapic_handled_vectors); in vcpu_scan_ioapic()
9013 vcpu->arch.load_eoi_exitmap_pending = true; in vcpu_scan_ioapic()
9022 if (!kvm_apic_hw_enabled(vcpu->arch.apic)) in vcpu_load_eoi_exitmap()
9025 bitmap_or((ulong *)eoi_exit_bitmap, vcpu->arch.ioapic_handled_vectors, in vcpu_load_eoi_exitmap()
9026 vcpu_to_synic(vcpu)->vec_bitmap, 256); in vcpu_load_eoi_exitmap()
9063 smp_send_reschedule(vcpu->cpu); in __kvm_request_immediate_exit()
9084 if (unlikely(!kvm_x86_ops.nested_ops->get_nested_state_pages(vcpu))) { in vcpu_enter_guest()
9094 kvm_gen_update_masterclock(vcpu->kvm); in vcpu_enter_guest()
9118 vcpu->run->exit_reason = KVM_EXIT_TPR_ACCESS; in vcpu_enter_guest()
9123 vcpu->run->exit_reason = KVM_EXIT_SHUTDOWN; in vcpu_enter_guest()
9124 vcpu->mmio_needed = 0; in vcpu_enter_guest()
9130 vcpu->arch.apf.halted = true; in vcpu_enter_guest()
9145 BUG_ON(vcpu->arch.pending_ioapic_eoi > 255); in vcpu_enter_guest()
9146 if (test_bit(vcpu->arch.pending_ioapic_eoi, in vcpu_enter_guest()
9147 vcpu->arch.ioapic_handled_vectors)) { in vcpu_enter_guest()
9148 vcpu->run->exit_reason = KVM_EXIT_IOAPIC_EOI; in vcpu_enter_guest()
9149 vcpu->run->eoi.vector = in vcpu_enter_guest()
9150 vcpu->arch.pending_ioapic_eoi; in vcpu_enter_guest()
9162 vcpu->run->exit_reason = KVM_EXIT_SYSTEM_EVENT; in vcpu_enter_guest()
9163 vcpu->run->system_event.type = KVM_SYSTEM_EVENT_CRASH; in vcpu_enter_guest()
9168 vcpu->run->exit_reason = KVM_EXIT_SYSTEM_EVENT; in vcpu_enter_guest()
9169 vcpu->run->system_event.type = KVM_SYSTEM_EVENT_RESET; in vcpu_enter_guest()
9174 vcpu->run->exit_reason = KVM_EXIT_HYPERV; in vcpu_enter_guest()
9175 vcpu->run->hyperv = vcpu->arch.hyperv.exit; in vcpu_enter_guest()
9182 * KVM_REQ_CLOCK_UPDATE, because Hyper-V SynIC timers in vcpu_enter_guest()
9183 * depend on the guest clock being up-to-date in vcpu_enter_guest()
9196 ++vcpu->stat.req_event; in vcpu_enter_guest()
9198 if (vcpu->arch.mp_state == KVM_MP_STATE_INIT_RECEIVED) { in vcpu_enter_guest()
9228 vcpu->mode = IN_GUEST_MODE; in vcpu_enter_guest()
9230 srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx); in vcpu_enter_guest()
9233 * 1) We should set ->mode before checking ->requests. Please see in vcpu_enter_guest()
9236 * 2) For APICv, we should set ->mode before checking PID.ON. This in vcpu_enter_guest()
9250 if (kvm_lapic_enabled(vcpu) && vcpu->arch.apicv_active) in vcpu_enter_guest()
9254 vcpu->mode = OUTSIDE_GUEST_MODE; in vcpu_enter_guest()
9258 vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu); in vcpu_enter_guest()
9274 if (unlikely(vcpu->arch.switch_db_regs)) { in vcpu_enter_guest()
9276 set_debugreg(vcpu->arch.eff_db[0], 0); in vcpu_enter_guest()
9277 set_debugreg(vcpu->arch.eff_db[1], 1); in vcpu_enter_guest()
9278 set_debugreg(vcpu->arch.eff_db[2], 2); in vcpu_enter_guest()
9279 set_debugreg(vcpu->arch.eff_db[3], 3); in vcpu_enter_guest()
9280 set_debugreg(vcpu->arch.dr6, 6); in vcpu_enter_guest()
9281 vcpu->arch.switch_db_regs &= ~KVM_DEBUGREG_RELOAD; in vcpu_enter_guest()
9294 if (unlikely(vcpu->arch.switch_db_regs & KVM_DEBUGREG_WONT_EXIT)) { in vcpu_enter_guest()
9295 WARN_ON(vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP); in vcpu_enter_guest()
9299 vcpu->arch.switch_db_regs &= ~KVM_DEBUGREG_RELOAD; in vcpu_enter_guest()
9312 vcpu->arch.last_vmentry_cpu = vcpu->cpu; in vcpu_enter_guest()
9313 vcpu->arch.last_guest_tsc = kvm_read_l1_tsc(vcpu, rdtsc()); in vcpu_enter_guest()
9315 vcpu->mode = OUTSIDE_GUEST_MODE; in vcpu_enter_guest()
9322 * VM-Exit on SVM and any ticks that occur between VM-Exit and now. in vcpu_enter_guest()
9329 ++vcpu->stat.exits; in vcpu_enter_guest()
9343 s64 delta = vcpu->arch.apic->lapic_timer.advance_expire_delta; in vcpu_enter_guest()
9345 trace_kvm_wait_lapic_expire(vcpu->vcpu_id, delta); in vcpu_enter_guest()
9346 vcpu->arch.apic->lapic_timer.advance_expire_delta = S64_MIN; in vcpu_enter_guest()
9353 vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu); in vcpu_enter_guest()
9363 if (unlikely(vcpu->arch.tsc_always_catchup)) in vcpu_enter_guest()
9366 if (vcpu->arch.apic_attention) in vcpu_enter_guest()
9376 if (unlikely(vcpu->arch.apic_attention)) in vcpu_enter_guest()
9386 srcu_read_unlock(&kvm->srcu, vcpu->srcu_idx); in vcpu_block()
9388 vcpu->srcu_idx = srcu_read_lock(&kvm->srcu); in vcpu_block()
9398 switch(vcpu->arch.mp_state) { in vcpu_block()
9400 vcpu->arch.pv.pv_unhalted = false; in vcpu_block()
9401 vcpu->arch.mp_state = in vcpu_block()
9405 vcpu->arch.apf.halted = false; in vcpu_block()
9410 return -EINTR; in vcpu_block()
9418 kvm_x86_ops.nested_ops->check_events(vcpu); in kvm_vcpu_running()
9420 return (vcpu->arch.mp_state == KVM_MP_STATE_RUNNABLE && in kvm_vcpu_running()
9421 !vcpu->arch.apf.halted); in kvm_vcpu_running()
9427 struct kvm *kvm = vcpu->kvm; in vcpu_run()
9429 vcpu->srcu_idx = srcu_read_lock(&kvm->srcu); in vcpu_run()
9430 vcpu->arch.l1tf_flush_l1d = true; in vcpu_run()
9439 vcpu->arch.at_instruction_boundary = false; in vcpu_run()
9456 vcpu->run->exit_reason = KVM_EXIT_IRQ_WINDOW_OPEN; in vcpu_run()
9457 ++vcpu->stat.request_irq_exits; in vcpu_run()
9462 srcu_read_unlock(&kvm->srcu, vcpu->srcu_idx); in vcpu_run()
9466 vcpu->srcu_idx = srcu_read_lock(&kvm->srcu); in vcpu_run()
9470 srcu_read_unlock(&kvm->srcu, vcpu->srcu_idx); in vcpu_run()
9479 vcpu->srcu_idx = srcu_read_lock(&vcpu->kvm->srcu); in complete_emulated_io()
9481 srcu_read_unlock(&vcpu->kvm->srcu, vcpu->srcu_idx); in complete_emulated_io()
9487 BUG_ON(!vcpu->arch.pio.count); in complete_emulated_pio()
9512 struct kvm_run *run = vcpu->run; in complete_emulated_mmio()
9516 BUG_ON(!vcpu->mmio_needed); in complete_emulated_mmio()
9519 frag = &vcpu->mmio_fragments[vcpu->mmio_cur_fragment]; in complete_emulated_mmio()
9520 len = min(8u, frag->len); in complete_emulated_mmio()
9521 if (!vcpu->mmio_is_write) in complete_emulated_mmio()
9522 memcpy(frag->data, run->mmio.data, len); in complete_emulated_mmio()
9524 if (frag->len <= 8) { in complete_emulated_mmio()
9527 vcpu->mmio_cur_fragment++; in complete_emulated_mmio()
9530 frag->data += len; in complete_emulated_mmio()
9531 frag->gpa += len; in complete_emulated_mmio()
9532 frag->len -= len; in complete_emulated_mmio()
9535 if (vcpu->mmio_cur_fragment >= vcpu->mmio_nr_fragments) { in complete_emulated_mmio()
9536 vcpu->mmio_needed = 0; in complete_emulated_mmio()
9538 /* FIXME: return into emulator if single-stepping. */ in complete_emulated_mmio()
9539 if (vcpu->mmio_is_write) in complete_emulated_mmio()
9541 vcpu->mmio_read_completed = 1; in complete_emulated_mmio()
9545 run->exit_reason = KVM_EXIT_MMIO; in complete_emulated_mmio()
9546 run->mmio.phys_addr = frag->gpa; in complete_emulated_mmio()
9547 if (vcpu->mmio_is_write) in complete_emulated_mmio()
9548 memcpy(run->mmio.data, frag->data, min(8u, frag->len)); in complete_emulated_mmio()
9549 run->mmio.len = min(8u, frag->len); in complete_emulated_mmio()
9550 run->mmio.is_write = vcpu->mmio_is_write; in complete_emulated_mmio()
9551 vcpu->arch.complete_userspace_io = complete_emulated_mmio; in complete_emulated_mmio()
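Each fragment bounces through userspace as a KVM_EXIT_MMIO exit; for reads, userspace fills run->mmio.data and, as seen above, the copy back into frag->data happens on re-entry. A sketch of the userspace half (mmio_read()/mmio_write() are hypothetical device-model hooks):

#include <stdint.h>
#include <linux/kvm.h>

extern void mmio_read(uint64_t gpa, void *data, uint32_t len);	/* hypothetical */
extern void mmio_write(uint64_t gpa, const void *data, uint32_t len);

/* Complete one KVM_EXIT_MMIO before the next KVM_RUN. */
static void handle_mmio_exit(struct kvm_run *run)
{
	if (run->mmio.is_write)
		mmio_write(run->mmio.phys_addr, run->mmio.data, run->mmio.len);
	else
		mmio_read(run->mmio.phys_addr, run->mmio.data, run->mmio.len);
}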
9562 memcpy(&fpu->state, &current->thread.fpu.state, in kvm_save_current_fpu()
9573 kvm_save_current_fpu(vcpu->arch.user_fpu); in kvm_load_guest_fpu()
9576 __copy_kernel_to_fpregs(&vcpu->arch.guest_fpu->state, in kvm_load_guest_fpu()
9590 kvm_save_current_fpu(vcpu->arch.guest_fpu); in kvm_put_guest_fpu()
9592 copy_kernel_to_fpregs(&vcpu->arch.user_fpu->state); in kvm_put_guest_fpu()
9597 ++vcpu->stat.fpu_reload; in kvm_put_guest_fpu()
9603 struct kvm_run *kvm_run = vcpu->run; in kvm_arch_vcpu_ioctl_run()
9610 if (unlikely(vcpu->arch.mp_state == KVM_MP_STATE_UNINITIALIZED)) { in kvm_arch_vcpu_ioctl_run()
9611 if (kvm_run->immediate_exit) { in kvm_arch_vcpu_ioctl_run()
9612 r = -EINTR; in kvm_arch_vcpu_ioctl_run()
9618 r = -EAGAIN; in kvm_arch_vcpu_ioctl_run()
9620 r = -EINTR; in kvm_arch_vcpu_ioctl_run()
9621 kvm_run->exit_reason = KVM_EXIT_INTR; in kvm_arch_vcpu_ioctl_run()
9622 ++vcpu->stat.signal_exits; in kvm_arch_vcpu_ioctl_run()
9627 if (kvm_run->kvm_valid_regs & ~KVM_SYNC_X86_VALID_FIELDS) { in kvm_arch_vcpu_ioctl_run()
9628 r = -EINVAL; in kvm_arch_vcpu_ioctl_run()
9632 if (kvm_run->kvm_dirty_regs) { in kvm_arch_vcpu_ioctl_run()
9638 /* re-sync apic's tpr */ in kvm_arch_vcpu_ioctl_run()
9640 if (kvm_set_cr8(vcpu, kvm_run->cr8) != 0) { in kvm_arch_vcpu_ioctl_run()
9641 r = -EINVAL; in kvm_arch_vcpu_ioctl_run()
9646 if (unlikely(vcpu->arch.complete_userspace_io)) { in kvm_arch_vcpu_ioctl_run()
9647 int (*cui)(struct kvm_vcpu *) = vcpu->arch.complete_userspace_io; in kvm_arch_vcpu_ioctl_run()
9648 vcpu->arch.complete_userspace_io = NULL; in kvm_arch_vcpu_ioctl_run()
9653 WARN_ON(vcpu->arch.pio.count || vcpu->mmio_needed); in kvm_arch_vcpu_ioctl_run()
9655 if (kvm_run->immediate_exit) in kvm_arch_vcpu_ioctl_run()
9656 r = -EINTR; in kvm_arch_vcpu_ioctl_run()
9662 if (kvm_run->kvm_valid_regs) in kvm_arch_vcpu_ioctl_run()
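
kvm_run->immediate_exit gives userspace a race-free way to bounce a vCPU out of (or keep it from entering) the guest: kvm_arch_vcpu_ioctl_run() checks it on the UNINITIALIZED path and again after a completed complete_userspace_io callback, returning -EINTR without entering the guest. A sketch of the usual kick pattern; kick_vcpu()/run_once() are illustrative names:

#include <linux/kvm.h>
#include <errno.h>
#include <sys/ioctl.h>

/* Another thread sets this before signalling the vCPU thread;
 * the next KVM_RUN then fails with EINTR before guest entry. */
static void kick_vcpu(struct kvm_run *run)
{
        run->immediate_exit = 1;
}

static int run_once(int vcpu_fd, struct kvm_run *run)
{
        int r = ioctl(vcpu_fd, KVM_RUN, 0);

        if (r < 0 && errno == EINTR) {
                run->immediate_exit = 0;        /* re-arm normal entry */
                return 0;                       /* kicked, not an error */
        }
        return r;
}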
9673 if (vcpu->arch.emulate_regs_need_sync_to_vcpu) { in __get_regs()
9681 emulator_writeback_register_cache(vcpu->arch.emulate_ctxt); in __get_regs()
9682 vcpu->arch.emulate_regs_need_sync_to_vcpu = false; in __get_regs()
9684 regs->rax = kvm_rax_read(vcpu); in __get_regs()
9685 regs->rbx = kvm_rbx_read(vcpu); in __get_regs()
9686 regs->rcx = kvm_rcx_read(vcpu); in __get_regs()
9687 regs->rdx = kvm_rdx_read(vcpu); in __get_regs()
9688 regs->rsi = kvm_rsi_read(vcpu); in __get_regs()
9689 regs->rdi = kvm_rdi_read(vcpu); in __get_regs()
9690 regs->rsp = kvm_rsp_read(vcpu); in __get_regs()
9691 regs->rbp = kvm_rbp_read(vcpu); in __get_regs()
9693 regs->r8 = kvm_r8_read(vcpu); in __get_regs()
9694 regs->r9 = kvm_r9_read(vcpu); in __get_regs()
9695 regs->r10 = kvm_r10_read(vcpu); in __get_regs()
9696 regs->r11 = kvm_r11_read(vcpu); in __get_regs()
9697 regs->r12 = kvm_r12_read(vcpu); in __get_regs()
9698 regs->r13 = kvm_r13_read(vcpu); in __get_regs()
9699 regs->r14 = kvm_r14_read(vcpu); in __get_regs()
9700 regs->r15 = kvm_r15_read(vcpu); in __get_regs()
9703 regs->rip = kvm_rip_read(vcpu); in __get_regs()
9704 regs->rflags = kvm_get_rflags(vcpu); in __get_regs()
9717 vcpu->arch.emulate_regs_need_sync_from_vcpu = true; in __set_regs()
9718 vcpu->arch.emulate_regs_need_sync_to_vcpu = false; in __set_regs()
9720 kvm_rax_write(vcpu, regs->rax); in __set_regs()
9721 kvm_rbx_write(vcpu, regs->rbx); in __set_regs()
9722 kvm_rcx_write(vcpu, regs->rcx); in __set_regs()
9723 kvm_rdx_write(vcpu, regs->rdx); in __set_regs()
9724 kvm_rsi_write(vcpu, regs->rsi); in __set_regs()
9725 kvm_rdi_write(vcpu, regs->rdi); in __set_regs()
9726 kvm_rsp_write(vcpu, regs->rsp); in __set_regs()
9727 kvm_rbp_write(vcpu, regs->rbp); in __set_regs()
9729 kvm_r8_write(vcpu, regs->r8); in __set_regs()
9730 kvm_r9_write(vcpu, regs->r9); in __set_regs()
9731 kvm_r10_write(vcpu, regs->r10); in __set_regs()
9732 kvm_r11_write(vcpu, regs->r11); in __set_regs()
9733 kvm_r12_write(vcpu, regs->r12); in __set_regs()
9734 kvm_r13_write(vcpu, regs->r13); in __set_regs()
9735 kvm_r14_write(vcpu, regs->r14); in __set_regs()
9736 kvm_r15_write(vcpu, regs->r15); in __set_regs()
9739 kvm_rip_write(vcpu, regs->rip); in __set_regs()
9740 kvm_set_rflags(vcpu, regs->rflags | X86_EFLAGS_FIXED); in __set_regs()
9742 vcpu->arch.exception.pending = false; in __set_regs()
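
__get_regs()/__set_regs() back the KVM_GET_REGS/KVM_SET_REGS ioctls. Two side effects of the set path are worth noting: X86_EFLAGS_FIXED (bit 1, always-one) is forced on, and any pending exception is dropped. A small roundtrip sketch, e.g. to step over a one-byte instruction:

#include <linux/kvm.h>
#include <sys/ioctl.h>

/* Read the GPRs, step RIP over a one-byte instruction (say, HLT),
 * and write them back.  KVM ORs in X86_EFLAGS_FIXED and clears any
 * pending exception on the set side, as seen above. */
static int skip_one_byte_insn(int vcpu_fd)
{
        struct kvm_regs regs;

        if (ioctl(vcpu_fd, KVM_GET_REGS, &regs) < 0)
                return -1;
        regs.rip += 1;
        return ioctl(vcpu_fd, KVM_SET_REGS, &regs);
}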
9769 kvm_get_segment(vcpu, &sregs->cs, VCPU_SREG_CS); in __get_sregs()
9770 kvm_get_segment(vcpu, &sregs->ds, VCPU_SREG_DS); in __get_sregs()
9771 kvm_get_segment(vcpu, &sregs->es, VCPU_SREG_ES); in __get_sregs()
9772 kvm_get_segment(vcpu, &sregs->fs, VCPU_SREG_FS); in __get_sregs()
9773 kvm_get_segment(vcpu, &sregs->gs, VCPU_SREG_GS); in __get_sregs()
9774 kvm_get_segment(vcpu, &sregs->ss, VCPU_SREG_SS); in __get_sregs()
9776 kvm_get_segment(vcpu, &sregs->tr, VCPU_SREG_TR); in __get_sregs()
9777 kvm_get_segment(vcpu, &sregs->ldt, VCPU_SREG_LDTR); in __get_sregs()
9780 sregs->idt.limit = dt.size; in __get_sregs()
9781 sregs->idt.base = dt.address; in __get_sregs()
9783 sregs->gdt.limit = dt.size; in __get_sregs()
9784 sregs->gdt.base = dt.address; in __get_sregs()
9786 sregs->cr0 = kvm_read_cr0(vcpu); in __get_sregs()
9787 sregs->cr2 = vcpu->arch.cr2; in __get_sregs()
9788 sregs->cr3 = kvm_read_cr3(vcpu); in __get_sregs()
9789 sregs->cr4 = kvm_read_cr4(vcpu); in __get_sregs()
9790 sregs->cr8 = kvm_get_cr8(vcpu); in __get_sregs()
9791 sregs->efer = vcpu->arch.efer; in __get_sregs()
9792 sregs->apic_base = kvm_get_apic_base(vcpu); in __get_sregs()
9794 memset(sregs->interrupt_bitmap, 0, sizeof(sregs->interrupt_bitmap)); in __get_sregs()
9796 if (vcpu->arch.interrupt.injected && !vcpu->arch.interrupt.soft) in __get_sregs()
9797 set_bit(vcpu->arch.interrupt.nr, in __get_sregs()
9798 (unsigned long *)sregs->interrupt_bitmap); in __get_sregs()
9818 if (vcpu->arch.mp_state == KVM_MP_STATE_HALTED && in kvm_arch_vcpu_ioctl_get_mpstate()
9819 vcpu->arch.pv.pv_unhalted) in kvm_arch_vcpu_ioctl_get_mpstate()
9820 mp_state->mp_state = KVM_MP_STATE_RUNNABLE; in kvm_arch_vcpu_ioctl_get_mpstate()
9822 mp_state->mp_state = vcpu->arch.mp_state; in kvm_arch_vcpu_ioctl_get_mpstate()
9833 int ret = -EINVAL; in kvm_arch_vcpu_ioctl_set_mpstate()
9838 mp_state->mp_state != KVM_MP_STATE_RUNNABLE) in kvm_arch_vcpu_ioctl_set_mpstate()
9846 if ((kvm_vcpu_latch_init(vcpu) || vcpu->arch.smi_pending) && in kvm_arch_vcpu_ioctl_set_mpstate()
9847 (mp_state->mp_state == KVM_MP_STATE_SIPI_RECEIVED || in kvm_arch_vcpu_ioctl_set_mpstate()
9848 mp_state->mp_state == KVM_MP_STATE_INIT_RECEIVED)) in kvm_arch_vcpu_ioctl_set_mpstate()
9851 if (mp_state->mp_state == KVM_MP_STATE_SIPI_RECEIVED) { in kvm_arch_vcpu_ioctl_set_mpstate()
9852 vcpu->arch.mp_state = KVM_MP_STATE_INIT_RECEIVED; in kvm_arch_vcpu_ioctl_set_mpstate()
9853 set_bit(KVM_APIC_SIPI, &vcpu->arch.apic->pending_events); in kvm_arch_vcpu_ioctl_set_mpstate()
9855 vcpu->arch.mp_state = mp_state->mp_state; in kvm_arch_vcpu_ioctl_set_mpstate()
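
Note the two translations above: a HALTED vCPU with pv_unhalted reads back as RUNNABLE, and a stored KVM_MP_STATE_SIPI_RECEIVED is converted into INIT_RECEIVED plus a pending KVM_APIC_SIPI event rather than kept verbatim. A minimal userspace sketch of the set side:

#include <linux/kvm.h>
#include <sys/ioctl.h>

/* Force a vCPU back to RUNNABLE, e.g. when restoring saved state. */
static int make_runnable(int vcpu_fd)
{
        struct kvm_mp_state st = { .mp_state = KVM_MP_STATE_RUNNABLE };

        return ioctl(vcpu_fd, KVM_SET_MP_STATE, &st);
}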
9867 struct x86_emulate_ctxt *ctxt = vcpu->arch.emulate_ctxt; in kvm_task_switch()
9875 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; in kvm_task_switch()
9876 vcpu->run->internal.suberror = KVM_INTERNAL_ERROR_EMULATION; in kvm_task_switch()
9877 vcpu->run->internal.ndata = 0; in kvm_task_switch()
9881 kvm_rip_write(vcpu, ctxt->eip); in kvm_task_switch()
9882 kvm_set_rflags(vcpu, ctxt->eflags); in kvm_task_switch()
9889 if ((sregs->efer & EFER_LME) && (sregs->cr0 & X86_CR0_PG)) { in kvm_valid_sregs()
9892 * 64-bit mode (though maybe in a 32-bit code segment). in kvm_valid_sregs()
9895 if (!(sregs->cr4 & X86_CR4_PAE) in kvm_valid_sregs()
9896 || !(sregs->efer & EFER_LMA)) in kvm_valid_sregs()
9897 return -EINVAL; in kvm_valid_sregs()
9898 if (sregs->cr3 & vcpu->arch.cr3_lm_rsvd_bits) in kvm_valid_sregs()
9899 return -EINVAL; in kvm_valid_sregs()
9902 * Not in 64-bit mode: EFER.LMA is clear and the code in kvm_valid_sregs()
9903 * segment cannot be 64-bit. in kvm_valid_sregs()
9905 if (sregs->efer & EFER_LMA || sregs->cs.l) in kvm_valid_sregs()
9906 return -EINVAL; in kvm_valid_sregs()
9909 return kvm_valid_cr4(vcpu, sregs->cr4); in kvm_valid_sregs()
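
kvm_valid_sregs() enforces the architectural long-mode invariants before __set_sregs() applies anything. A userspace pre-check mirroring the same rules; the MAXPHYADDR-dependent CR3 reserved-bit mask is omitted, and the bit masks are defined locally since they are not in the uapi header:

#include <linux/kvm.h>

#define X86_CR0_PG      (1ULL << 31)
#define X86_CR4_PAE     (1ULL << 5)
#define EFER_LME        (1ULL << 8)
#define EFER_LMA        (1ULL << 10)

/* Paged long mode requires PAE and LMA; outside long mode, LMA
 * and CS.L must both be clear.  Returns 1 if consistent. */
static int sregs_look_valid(const struct kvm_sregs *s)
{
        if ((s->efer & EFER_LME) && (s->cr0 & X86_CR0_PG))
                return (s->cr4 & X86_CR4_PAE) && (s->efer & EFER_LMA);
        return !(s->efer & EFER_LMA) && !s->cs.l;
}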
9919 int ret = -EINVAL; in __set_sregs()
9924 apic_base_msr.data = sregs->apic_base; in __set_sregs()
9929 dt.size = sregs->idt.limit; in __set_sregs()
9930 dt.address = sregs->idt.base; in __set_sregs()
9932 dt.size = sregs->gdt.limit; in __set_sregs()
9933 dt.address = sregs->gdt.base; in __set_sregs()
9936 vcpu->arch.cr2 = sregs->cr2; in __set_sregs()
9937 mmu_reset_needed |= kvm_read_cr3(vcpu) != sregs->cr3; in __set_sregs()
9938 vcpu->arch.cr3 = sregs->cr3; in __set_sregs()
9941 kvm_set_cr8(vcpu, sregs->cr8); in __set_sregs()
9943 mmu_reset_needed |= vcpu->arch.efer != sregs->efer; in __set_sregs()
9944 kvm_x86_ops.set_efer(vcpu, sregs->efer); in __set_sregs()
9946 mmu_reset_needed |= kvm_read_cr0(vcpu) != sregs->cr0; in __set_sregs()
9947 kvm_x86_ops.set_cr0(vcpu, sregs->cr0); in __set_sregs()
9948 vcpu->arch.cr0 = sregs->cr0; in __set_sregs()
9950 mmu_reset_needed |= kvm_read_cr4(vcpu) != sregs->cr4; in __set_sregs()
9951 cpuid_update_needed |= ((kvm_read_cr4(vcpu) ^ sregs->cr4) & in __set_sregs()
9953 kvm_x86_ops.set_cr4(vcpu, sregs->cr4); in __set_sregs()
9957 idx = srcu_read_lock(&vcpu->kvm->srcu); in __set_sregs()
9959 load_pdptrs(vcpu, vcpu->arch.walk_mmu, kvm_read_cr3(vcpu)); in __set_sregs()
9962 srcu_read_unlock(&vcpu->kvm->srcu, idx); in __set_sregs()
9969 (const unsigned long *)sregs->interrupt_bitmap, max_bits); in __set_sregs()
9975 kvm_set_segment(vcpu, &sregs->cs, VCPU_SREG_CS); in __set_sregs()
9976 kvm_set_segment(vcpu, &sregs->ds, VCPU_SREG_DS); in __set_sregs()
9977 kvm_set_segment(vcpu, &sregs->es, VCPU_SREG_ES); in __set_sregs()
9978 kvm_set_segment(vcpu, &sregs->fs, VCPU_SREG_FS); in __set_sregs()
9979 kvm_set_segment(vcpu, &sregs->gs, VCPU_SREG_GS); in __set_sregs()
9980 kvm_set_segment(vcpu, &sregs->ss, VCPU_SREG_SS); in __set_sregs()
9982 kvm_set_segment(vcpu, &sregs->tr, VCPU_SREG_TR); in __set_sregs()
9983 kvm_set_segment(vcpu, &sregs->ldt, VCPU_SREG_LDTR); in __set_sregs()
9989 sregs->cs.selector == 0xf000 && sregs->cs.base == 0xffff0000 && in __set_sregs()
9991 vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE; in __set_sregs()
10019 if (dbg->control & (KVM_GUESTDBG_INJECT_DB | KVM_GUESTDBG_INJECT_BP)) { in kvm_arch_vcpu_ioctl_set_guest_debug()
10020 r = -EBUSY; in kvm_arch_vcpu_ioctl_set_guest_debug()
10021 if (vcpu->arch.exception.pending) in kvm_arch_vcpu_ioctl_set_guest_debug()
10023 if (dbg->control & KVM_GUESTDBG_INJECT_DB) in kvm_arch_vcpu_ioctl_set_guest_debug()
10035 vcpu->guest_debug = dbg->control; in kvm_arch_vcpu_ioctl_set_guest_debug()
10036 if (!(vcpu->guest_debug & KVM_GUESTDBG_ENABLE)) in kvm_arch_vcpu_ioctl_set_guest_debug()
10037 vcpu->guest_debug = 0; in kvm_arch_vcpu_ioctl_set_guest_debug()
10039 if (vcpu->guest_debug & KVM_GUESTDBG_USE_HW_BP) { in kvm_arch_vcpu_ioctl_set_guest_debug()
10041 vcpu->arch.eff_db[i] = dbg->arch.debugreg[i]; in kvm_arch_vcpu_ioctl_set_guest_debug()
10042 vcpu->arch.guest_debug_dr7 = dbg->arch.debugreg[7]; in kvm_arch_vcpu_ioctl_set_guest_debug()
10045 vcpu->arch.eff_db[i] = vcpu->arch.db[i]; in kvm_arch_vcpu_ioctl_set_guest_debug()
10049 if (vcpu->guest_debug & KVM_GUESTDBG_SINGLESTEP) in kvm_arch_vcpu_ioctl_set_guest_debug()
10050 vcpu->arch.singlestep_rip = kvm_rip_read(vcpu) + in kvm_arch_vcpu_ioctl_set_guest_debug()
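
KVM_SET_GUEST_DEBUG drives this path; with KVM_GUESTDBG_SINGLESTEP, the recorded singlestep_rip lets the rflags code distinguish a completed step from a re-entry at the same instruction. Enabling single-stepping from userspace looks like this:

#include <linux/kvm.h>
#include <string.h>
#include <sys/ioctl.h>

/* After this, every retired guest instruction produces a
 * KVM_EXIT_DEBUG exit instead of running freely. */
static int enable_singlestep(int vcpu_fd)
{
        struct kvm_guest_debug dbg;

        memset(&dbg, 0, sizeof(dbg));
        dbg.control = KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP;
        return ioctl(vcpu_fd, KVM_SET_GUEST_DEBUG, &dbg);
}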
10074 unsigned long vaddr = tr->linear_address; in kvm_arch_vcpu_ioctl_translate()
10080 idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_ioctl_translate()
10082 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_ioctl_translate()
10083 tr->physical_address = gpa; in kvm_arch_vcpu_ioctl_translate()
10084 tr->valid = gpa != UNMAPPED_GVA; in kvm_arch_vcpu_ioctl_translate()
10085 tr->writeable = 1; in kvm_arch_vcpu_ioctl_translate()
10086 tr->usermode = 0; in kvm_arch_vcpu_ioctl_translate()
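
kvm_arch_vcpu_ioctl_translate() services KVM_TRANSLATE by walking the vCPU's current page tables; note that writeable and usermode are hardwired stubs here (1 and 0), so only valid and physical_address carry information. A usage sketch:

#include <linux/kvm.h>
#include <string.h>
#include <sys/ioctl.h>

/* Walk the guest's page tables for one linear address;
 * tr.valid is 0 if the walk hit an unmapped hole. */
static int gva_to_gpa(int vcpu_fd, __u64 gva, __u64 *gpa)
{
        struct kvm_translation tr;

        memset(&tr, 0, sizeof(tr));
        tr.linear_address = gva;
        if (ioctl(vcpu_fd, KVM_TRANSLATE, &tr) < 0 || !tr.valid)
                return -1;
        *gpa = tr.physical_address;
        return 0;
}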
10098 fxsave = &vcpu->arch.guest_fpu->state.fxsave; in kvm_arch_vcpu_ioctl_get_fpu()
10099 memcpy(fpu->fpr, fxsave->st_space, 128); in kvm_arch_vcpu_ioctl_get_fpu()
10100 fpu->fcw = fxsave->cwd; in kvm_arch_vcpu_ioctl_get_fpu()
10101 fpu->fsw = fxsave->swd; in kvm_arch_vcpu_ioctl_get_fpu()
10102 fpu->ftwx = fxsave->twd; in kvm_arch_vcpu_ioctl_get_fpu()
10103 fpu->last_opcode = fxsave->fop; in kvm_arch_vcpu_ioctl_get_fpu()
10104 fpu->last_ip = fxsave->rip; in kvm_arch_vcpu_ioctl_get_fpu()
10105 fpu->last_dp = fxsave->rdp; in kvm_arch_vcpu_ioctl_get_fpu()
10106 memcpy(fpu->xmm, fxsave->xmm_space, sizeof(fxsave->xmm_space)); in kvm_arch_vcpu_ioctl_get_fpu()
10118 fxsave = &vcpu->arch.guest_fpu->state.fxsave; in kvm_arch_vcpu_ioctl_set_fpu()
10120 memcpy(fxsave->st_space, fpu->fpr, 128); in kvm_arch_vcpu_ioctl_set_fpu()
10121 fxsave->cwd = fpu->fcw; in kvm_arch_vcpu_ioctl_set_fpu()
10122 fxsave->swd = fpu->fsw; in kvm_arch_vcpu_ioctl_set_fpu()
10123 fxsave->twd = fpu->ftwx; in kvm_arch_vcpu_ioctl_set_fpu()
10124 fxsave->fop = fpu->last_opcode; in kvm_arch_vcpu_ioctl_set_fpu()
10125 fxsave->rip = fpu->last_ip; in kvm_arch_vcpu_ioctl_set_fpu()
10126 fxsave->rdp = fpu->last_dp; in kvm_arch_vcpu_ioctl_set_fpu()
10127 memcpy(fxsave->xmm_space, fpu->xmm, sizeof(fxsave->xmm_space)); in kvm_arch_vcpu_ioctl_set_fpu()
10137 if (vcpu->run->kvm_valid_regs & KVM_SYNC_X86_REGS) in store_regs()
10138 __get_regs(vcpu, &vcpu->run->s.regs.regs); in store_regs()
10140 if (vcpu->run->kvm_valid_regs & KVM_SYNC_X86_SREGS) in store_regs()
10141 __get_sregs(vcpu, &vcpu->run->s.regs.sregs); in store_regs()
10143 if (vcpu->run->kvm_valid_regs & KVM_SYNC_X86_EVENTS) in store_regs()
10145 vcpu, &vcpu->run->s.regs.events); in store_regs()
10150 if (vcpu->run->kvm_dirty_regs & ~KVM_SYNC_X86_VALID_FIELDS) in sync_regs()
10151 return -EINVAL; in sync_regs()
10153 if (vcpu->run->kvm_dirty_regs & KVM_SYNC_X86_REGS) { in sync_regs()
10154 __set_regs(vcpu, &vcpu->run->s.regs.regs); in sync_regs()
10155 vcpu->run->kvm_dirty_regs &= ~KVM_SYNC_X86_REGS; in sync_regs()
10157 if (vcpu->run->kvm_dirty_regs & KVM_SYNC_X86_SREGS) { in sync_regs()
10158 if (__set_sregs(vcpu, &vcpu->run->s.regs.sregs)) in sync_regs()
10159 return -EINVAL; in sync_regs()
10160 vcpu->run->kvm_dirty_regs &= ~KVM_SYNC_X86_SREGS; in sync_regs()
10162 if (vcpu->run->kvm_dirty_regs & KVM_SYNC_X86_EVENTS) { in sync_regs()
10164 vcpu, &vcpu->run->s.regs.events)) in sync_regs()
10165 return -EINVAL; in sync_regs()
10166 vcpu->run->kvm_dirty_regs &= ~KVM_SYNC_X86_EVENTS; in sync_regs()
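
store_regs()/sync_regs() implement KVM_CAP_SYNC_REGS: whichever register sets the VMM lists in kvm_valid_regs are mirrored into kvm_run->s.regs on exit, and anything flagged in kvm_dirty_regs is pulled back in on the next entry, saving a pair of ioctls per exit. A sketch, assuming the capability was probed with KVM_CHECK_EXTENSION:

#include <linux/kvm.h>
#include <sys/ioctl.h>

/* One exit with the shared-page register mirror: no KVM_GET_REGS /
 * KVM_SET_REGS ioctls needed to inspect and patch the GPRs. */
static int run_with_sync_regs(int vcpu_fd, struct kvm_run *run)
{
        run->kvm_valid_regs = KVM_SYNC_X86_REGS;  /* mirror GPRs on exit */
        if (ioctl(vcpu_fd, KVM_RUN, 0) < 0)
                return -1;
        run->s.regs.regs.rip += 1;                /* patch in place */
        run->kvm_dirty_regs = KVM_SYNC_X86_REGS;  /* apply on next entry */
        return 0;
}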
10174 fpstate_init(&vcpu->arch.guest_fpu->state); in fx_init()
10176 vcpu->arch.guest_fpu->state.xsave.header.xcomp_bv = in fx_init()
10182 vcpu->arch.xcr0 = XFEATURE_MASK_FP; in fx_init()
10184 vcpu->arch.cr0 |= X86_CR0_ET; in fx_init()
10189 if (kvm_check_tsc_unstable() && atomic_read(&kvm->online_vcpus) != 0) in kvm_arch_vcpu_precreate()
10201 if (!irqchip_in_kernel(vcpu->kvm) || kvm_vcpu_is_reset_bsp(vcpu)) in kvm_arch_vcpu_create()
10202 vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE; in kvm_arch_vcpu_create()
10204 vcpu->arch.mp_state = KVM_MP_STATE_UNINITIALIZED; in kvm_arch_vcpu_create()
10212 if (irqchip_in_kernel(vcpu->kvm)) { in kvm_arch_vcpu_create()
10216 if (kvm_apicv_activated(vcpu->kvm)) in kvm_arch_vcpu_create()
10217 vcpu->arch.apicv_active = true; in kvm_arch_vcpu_create()
10221 r = -ENOMEM; in kvm_arch_vcpu_create()
10226 vcpu->arch.pio_data = page_address(page); in kvm_arch_vcpu_create()
10228 vcpu->arch.mce_banks = kzalloc(KVM_MAX_MCE_BANKS * sizeof(u64) * 4, in kvm_arch_vcpu_create()
10230 if (!vcpu->arch.mce_banks) in kvm_arch_vcpu_create()
10232 vcpu->arch.mcg_cap = KVM_MAX_MCE_BANKS; in kvm_arch_vcpu_create()
10234 if (!zalloc_cpumask_var(&vcpu->arch.wbinvd_dirty_mask, in kvm_arch_vcpu_create()
10241 vcpu->arch.user_fpu = kmem_cache_zalloc(x86_fpu_cache, in kvm_arch_vcpu_create()
10243 if (!vcpu->arch.user_fpu) { in kvm_arch_vcpu_create()
10248 vcpu->arch.guest_fpu = kmem_cache_zalloc(x86_fpu_cache, in kvm_arch_vcpu_create()
10250 if (!vcpu->arch.guest_fpu) { in kvm_arch_vcpu_create()
10256 vcpu->arch.maxphyaddr = cpuid_query_maxphyaddr(vcpu); in kvm_arch_vcpu_create()
10257 vcpu->arch.cr3_lm_rsvd_bits = rsvd_bits(cpuid_maxphyaddr(vcpu), 63); in kvm_arch_vcpu_create()
10259 vcpu->arch.pat = MSR_IA32_CR_PAT_DEFAULT; in kvm_arch_vcpu_create()
10264 vcpu->arch.pending_external_vector = -1; in kvm_arch_vcpu_create()
10265 vcpu->arch.preempted_in_kernel = false; in kvm_arch_vcpu_create()
10273 vcpu->arch.arch_capabilities = kvm_get_arch_capabilities(); in kvm_arch_vcpu_create()
10274 vcpu->arch.msr_platform_info = MSR_PLATFORM_INFO_CPUID_FAULT; in kvm_arch_vcpu_create()
10283 kmem_cache_free(x86_fpu_cache, vcpu->arch.guest_fpu); in kvm_arch_vcpu_create()
10285 kmem_cache_free(x86_fpu_cache, vcpu->arch.user_fpu); in kvm_arch_vcpu_create()
10287 kmem_cache_free(x86_emulator_cache, vcpu->arch.emulate_ctxt); in kvm_arch_vcpu_create()
10289 free_cpumask_var(vcpu->arch.wbinvd_dirty_mask); in kvm_arch_vcpu_create()
10291 kfree(vcpu->arch.mce_banks); in kvm_arch_vcpu_create()
10293 free_page((unsigned long)vcpu->arch.pio_data); in kvm_arch_vcpu_create()
10303 struct kvm *kvm = vcpu->kvm; in kvm_arch_vcpu_postcreate()
10307 if (mutex_lock_killable(&vcpu->mutex)) in kvm_arch_vcpu_postcreate()
10314 vcpu->arch.msr_kvm_poll_control = 1; in kvm_arch_vcpu_postcreate()
10316 mutex_unlock(&vcpu->mutex); in kvm_arch_vcpu_postcreate()
10318 if (kvmclock_periodic_sync && vcpu->vcpu_idx == 0) in kvm_arch_vcpu_postcreate()
10319 schedule_delayed_work(&kvm->arch.kvmclock_sync_work, in kvm_arch_vcpu_postcreate()
10331 kmem_cache_free(x86_emulator_cache, vcpu->arch.emulate_ctxt); in kvm_arch_vcpu_destroy()
10332 free_cpumask_var(vcpu->arch.wbinvd_dirty_mask); in kvm_arch_vcpu_destroy()
10333 kmem_cache_free(x86_fpu_cache, vcpu->arch.user_fpu); in kvm_arch_vcpu_destroy()
10334 kmem_cache_free(x86_fpu_cache, vcpu->arch.guest_fpu); in kvm_arch_vcpu_destroy()
10338 kfree(vcpu->arch.mce_banks); in kvm_arch_vcpu_destroy()
10340 idx = srcu_read_lock(&vcpu->kvm->srcu); in kvm_arch_vcpu_destroy()
10342 srcu_read_unlock(&vcpu->kvm->srcu, idx); in kvm_arch_vcpu_destroy()
10343 free_page((unsigned long)vcpu->arch.pio_data); in kvm_arch_vcpu_destroy()
10344 kvfree(vcpu->arch.cpuid_entries); in kvm_arch_vcpu_destroy()
10353 vcpu->arch.hflags = 0; in kvm_vcpu_reset()
10355 vcpu->arch.smi_pending = 0; in kvm_vcpu_reset()
10356 vcpu->arch.smi_count = 0; in kvm_vcpu_reset()
10357 atomic_set(&vcpu->arch.nmi_queued, 0); in kvm_vcpu_reset()
10358 vcpu->arch.nmi_pending = 0; in kvm_vcpu_reset()
10359 vcpu->arch.nmi_injected = false; in kvm_vcpu_reset()
10363 memset(vcpu->arch.db, 0, sizeof(vcpu->arch.db)); in kvm_vcpu_reset()
10365 vcpu->arch.dr6 = DR6_INIT; in kvm_vcpu_reset()
10366 vcpu->arch.dr7 = DR7_FIXED_1; in kvm_vcpu_reset()
10369 vcpu->arch.cr2 = 0; in kvm_vcpu_reset()
10372 vcpu->arch.apf.msr_en_val = 0; in kvm_vcpu_reset()
10373 vcpu->arch.apf.msr_int_val = 0; in kvm_vcpu_reset()
10374 vcpu->arch.st.msr_val = 0; in kvm_vcpu_reset()
10380 vcpu->arch.apf.halted = false; in kvm_vcpu_reset()
10391 mpx_state_buffer = get_xsave_addr(&vcpu->arch.guest_fpu->state.xsave, in kvm_vcpu_reset()
10395 mpx_state_buffer = get_xsave_addr(&vcpu->arch.guest_fpu->state.xsave, in kvm_vcpu_reset()
10405 vcpu->arch.smbase = 0x30000; in kvm_vcpu_reset()
10407 vcpu->arch.msr_misc_features_enables = 0; in kvm_vcpu_reset()
10409 vcpu->arch.xcr0 = XFEATURE_MASK_FP; in kvm_vcpu_reset()
10412 memset(vcpu->arch.regs, 0, sizeof(vcpu->arch.regs)); in kvm_vcpu_reset()
10413 vcpu->arch.regs_avail = ~0; in kvm_vcpu_reset()
10414 vcpu->arch.regs_dirty = ~0; in kvm_vcpu_reset()
10416 vcpu->arch.ia32_xss = 0; in kvm_vcpu_reset()
10427 cs.base = vector << 12; in kvm_vcpu_deliver_sipi_vector()
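
kvm_vcpu_deliver_sipi_vector() turns the 8-bit SIPI vector into a real-mode start: CS.base = vector << 12 (paired in the full source with CS.selector = vector << 8 and RIP = 0), so the AP begins executing at physical address vector * 4 KiB. As a helper:

/* Real mode, CS.base = vector << 12, IP = 0, so the AP's first
 * instruction is fetched at vector * 4 KiB. */
static unsigned long sipi_start_addr(unsigned char vector)
{
        return (unsigned long)vector << 12;     /* 0x9a -> 0x9a000 */
}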
10451 if (!stable && vcpu->cpu == smp_processor_id()) in kvm_arch_hardware_enable()
10453 if (stable && vcpu->arch.last_host_tsc > local_tsc) { in kvm_arch_hardware_enable()
10455 if (vcpu->arch.last_host_tsc > max_tsc) in kvm_arch_hardware_enable()
10456 max_tsc = vcpu->arch.last_host_tsc; in kvm_arch_hardware_enable()
10486 * N.B. - this code below runs only on platforms with reliable TSC, in kvm_arch_hardware_enable()
10500 u64 delta_cyc = max_tsc - local_tsc; in kvm_arch_hardware_enable()
10502 kvm->arch.backwards_tsc_observed = true; in kvm_arch_hardware_enable()
10504 vcpu->arch.tsc_offset_adjustment += delta_cyc; in kvm_arch_hardware_enable()
10505 vcpu->arch.last_host_tsc = local_tsc; in kvm_arch_hardware_enable()
10515 kvm->arch.last_tsc_nsec = 0; in kvm_arch_hardware_enable()
10516 kvm->arch.last_tsc_write = 0; in kvm_arch_hardware_enable()
10539 r = ops->hardware_setup(); in kvm_arch_hardware_setup()
10543 memcpy(&kvm_x86_ops, ops->runtime_ops, sizeof(kvm_x86_ops)); in kvm_arch_hardware_setup()
10584 return -EIO; in kvm_arch_check_processor_compat()
10586 return ops->check_processor_compatibility(); in kvm_arch_check_processor_compat()
10591 return vcpu->kvm->arch.bsp_vcpu_id == vcpu->vcpu_id; in kvm_vcpu_is_reset_bsp()
10597 return (vcpu->arch.apic_base & MSR_IA32_APICBASE_BSP) != 0; in kvm_vcpu_is_bsp()
10607 vcpu->arch.l1tf_flush_l1d = true; in kvm_arch_sched_in()
10608 if (pmu->version && unlikely(pmu->event_count)) { in kvm_arch_sched_in()
10609 pmu->need_cleanup = true; in kvm_arch_sched_in()
10617 kfree(kvm->arch.hyperv.hv_pa_pg); in kvm_arch_free_vm()
10627 return -EINVAL; in kvm_arch_init_vm()
10633 INIT_HLIST_HEAD(&kvm->arch.mask_notifier_list); in kvm_arch_init_vm()
10634 INIT_LIST_HEAD(&kvm->arch.active_mmu_pages); in kvm_arch_init_vm()
10635 INIT_LIST_HEAD(&kvm->arch.zapped_obsolete_pages); in kvm_arch_init_vm()
10636 INIT_LIST_HEAD(&kvm->arch.lpage_disallowed_mmu_pages); in kvm_arch_init_vm()
10637 INIT_LIST_HEAD(&kvm->arch.assigned_dev_head); in kvm_arch_init_vm()
10638 atomic_set(&kvm->arch.noncoherent_dma_count, 0); in kvm_arch_init_vm()
10641 set_bit(KVM_USERSPACE_IRQ_SOURCE_ID, &kvm->arch.irq_sources_bitmap); in kvm_arch_init_vm()
10642 /* Reserve bit 1 of irq_sources_bitmap for irqfd-resampler */ in kvm_arch_init_vm()
10644 &kvm->arch.irq_sources_bitmap); in kvm_arch_init_vm()
10646 raw_spin_lock_init(&kvm->arch.tsc_write_lock); in kvm_arch_init_vm()
10647 mutex_init(&kvm->arch.apic_map_lock); in kvm_arch_init_vm()
10648 spin_lock_init(&kvm->arch.pvclock_gtod_sync_lock); in kvm_arch_init_vm()
10650 kvm->arch.kvmclock_offset = -get_kvmclock_base_ns(); in kvm_arch_init_vm()
10653 kvm->arch.guest_can_read_msr_platform_info = true; in kvm_arch_init_vm()
10655 INIT_DELAYED_WORK(&kvm->arch.kvmclock_update_work, kvmclock_update_fn); in kvm_arch_init_vm()
10656 INIT_DELAYED_WORK(&kvm->arch.kvmclock_sync_work, kvmclock_sync_fn); in kvm_arch_init_vm()
10691 mutex_lock(&kvm->lock); in kvm_free_vcpus()
10692 for (i = 0; i < atomic_read(&kvm->online_vcpus); i++) in kvm_free_vcpus()
10693 kvm->vcpus[i] = NULL; in kvm_free_vcpus()
10695 atomic_set(&kvm->online_vcpus, 0); in kvm_free_vcpus()
10696 mutex_unlock(&kvm->lock); in kvm_free_vcpus()
10701 cancel_delayed_work_sync(&kvm->arch.kvmclock_sync_work); in kvm_arch_sync_events()
10702 cancel_delayed_work_sync(&kvm->arch.kvmclock_update_work); in kvm_arch_sync_events()
10713 /* Called with kvm->slots_lock held. */ in __x86_set_memory_region()
10715 return -EINVAL; in __x86_set_memory_region()
10719 if (slot && slot->npages) in __x86_set_memory_region()
10720 return -EEXIST; in __x86_set_memory_region()
10731 if (!slot || !slot->npages) in __x86_set_memory_region()
10734 old_npages = slot->npages; in __x86_set_memory_region()
10765 if (current->mm == kvm->mm) { in kvm_arch_destroy_vm()
10771 mutex_lock(&kvm->slots_lock); in kvm_arch_destroy_vm()
10777 mutex_unlock(&kvm->slots_lock); in kvm_arch_destroy_vm()
10781 kvm_free_msr_filter(srcu_dereference_check(kvm->arch.msr_filter, &kvm->srcu, 1)); in kvm_arch_destroy_vm()
10785 kvfree(rcu_dereference_check(kvm->arch.apic_map, 1)); in kvm_arch_destroy_vm()
10786 kfree(srcu_dereference_check(kvm->arch.pmu_event_filter, &kvm->srcu, 1)); in kvm_arch_destroy_vm()
10797 kvfree(slot->arch.rmap[i]); in kvm_arch_free_memslot()
10798 slot->arch.rmap[i] = NULL; in kvm_arch_free_memslot()
10803 kvfree(slot->arch.lpage_info[i - 1]); in kvm_arch_free_memslot()
10804 slot->arch.lpage_info[i - 1] = NULL; in kvm_arch_free_memslot()
10820 memset(&slot->arch, 0, sizeof(slot->arch)); in kvm_alloc_memslot_metadata()
10828 lpages = gfn_to_index(slot->base_gfn + npages - 1, in kvm_alloc_memslot_metadata()
10829 slot->base_gfn, level) + 1; in kvm_alloc_memslot_metadata()
10831 slot->arch.rmap[i] = in kvm_alloc_memslot_metadata()
10832 __vcalloc(lpages, sizeof(*slot->arch.rmap[i]), in kvm_alloc_memslot_metadata()
10834 if (!slot->arch.rmap[i]) in kvm_alloc_memslot_metadata()
10843 slot->arch.lpage_info[i - 1] = linfo; in kvm_alloc_memslot_metadata()
10845 if (slot->base_gfn & (KVM_PAGES_PER_HPAGE(level) - 1)) in kvm_alloc_memslot_metadata()
10847 if ((slot->base_gfn + npages) & (KVM_PAGES_PER_HPAGE(level) - 1)) in kvm_alloc_memslot_metadata()
10848 linfo[lpages - 1].disallow_lpage = 1; in kvm_alloc_memslot_metadata()
10849 ugfn = slot->userspace_addr >> PAGE_SHIFT; in kvm_alloc_memslot_metadata()
10854 if ((slot->base_gfn ^ ugfn) & (KVM_PAGES_PER_HPAGE(level) - 1)) { in kvm_alloc_memslot_metadata()
10869 kvfree(slot->arch.rmap[i]); in kvm_alloc_memslot_metadata()
10870 slot->arch.rmap[i] = NULL; in kvm_alloc_memslot_metadata()
10874 kvfree(slot->arch.lpage_info[i - 1]); in kvm_alloc_memslot_metadata()
10875 slot->arch.lpage_info[i - 1] = NULL; in kvm_alloc_memslot_metadata()
10877 return -ENOMEM; in kvm_alloc_memslot_metadata()
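
kvm_alloc_memslot_metadata() sizes one rmap array and one lpage_info array per mapping level, and pre-poisons disallow_lpage wherever a huge mapping cannot work: at a slot head or tail that only partially covers a huge page, and, per the ugfn check, when the slot's gfn and hva are misaligned relative to each other. A standalone model of the sizing and edge rules, assuming x86's 4K base pages and 9 bits per level:

typedef unsigned long long u64;

#define PAGES_PER_HPAGE(level)  (1ULL << (((level) - 1) * 9))

/* Level-N entries a slot spans; mirrors gfn_to_index() + 1 above. */
static u64 nr_lpages(u64 base_gfn, u64 npages, int level)
{
        unsigned int shift = (level - 1) * 9;

        return ((base_gfn + npages - 1) >> shift) - (base_gfn >> shift) + 1;
}

/* A head or tail entry that only partially covers a huge page must
 * stay 4K-mapped: that is the disallow_lpage marking above. */
static int head_or_tail_disallowed(u64 base_gfn, u64 npages, int level)
{
        u64 mask = PAGES_PER_HPAGE(level) - 1;

        return (base_gfn & mask) || ((base_gfn + npages) & mask);
}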
10886 * memslots->generation has been incremented. in kvm_arch_memslots_updated()
10891 /* Force re-initialization of steal_time cache */ in kvm_arch_memslots_updated()
10903 mem->memory_size >> PAGE_SHIFT); in kvm_arch_prepare_memory_region()
10916 if ((change != KVM_MR_FLAGS_ONLY) || (new->flags & KVM_MEM_READONLY)) in kvm_mmu_slot_apply_flags()
10928 * which can be collapsed into a single large-page spte. Later in kvm_mmu_slot_apply_flags()
10929 * page faults will create the large-page sptes. in kvm_mmu_slot_apply_flags()
10936 if ((old->flags & KVM_MEM_LOG_DIRTY_PAGES) && in kvm_mmu_slot_apply_flags()
10937 !(new->flags & KVM_MEM_LOG_DIRTY_PAGES)) in kvm_mmu_slot_apply_flags()
10953 * When disabling dirty logging with PML enabled, the D-bit is set in kvm_mmu_slot_apply_flags()
10960 * When enabling dirty logging, large sptes are write-protected in kvm_mmu_slot_apply_flags()
10965 * initial-all-set state. Otherwise, depending on whether pml in kvm_mmu_slot_apply_flags()
10966 * is enabled the D-bit or the W-bit will be cleared. in kvm_mmu_slot_apply_flags()
10968 if (new->flags & KVM_MEM_LOG_DIRTY_PAGES) { in kvm_mmu_slot_apply_flags()
10977 * If we're with initial-all-set, we don't need in kvm_mmu_slot_apply_flags()
10980 * we still need to write-protect huge pages in kvm_mmu_slot_apply_flags()
10998 if (!kvm->arch.n_requested_mmu_pages) in kvm_arch_commit_memory_region()
11003 * FIXME: const-ify all uses of struct kvm_memory_slot. in kvm_arch_commit_memory_region()
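
The dirty-logging transitions above have a simple userspace counterpart: setting KVM_MEM_LOG_DIRTY_PAGES on a slot makes KVM write-protect (or, with PML, D-bit-clear) its sptes, and KVM_GET_DIRTY_LOG then harvests one bit per touched page, re-arming protection as it copies. A sketch, where guest_phys/host_addr/size describe an already-created slot 0 and are tracked by the VMM's own bookkeeping:

#include <linux/kvm.h>
#include <stdlib.h>
#include <sys/ioctl.h>

static int harvest_dirty(int vm_fd, __u64 guest_phys, void *host_addr,
                         __u64 size)
{
        struct kvm_userspace_memory_region r = {
                .slot = 0,
                .flags = KVM_MEM_LOG_DIRTY_PAGES,       /* start logging */
                .guest_phys_addr = guest_phys,
                .memory_size = size,
                .userspace_addr = (__u64)(unsigned long)host_addr,
        };
        struct kvm_dirty_log log = { .slot = 0 };

        if (ioctl(vm_fd, KVM_SET_USER_MEMORY_REGION, &r) < 0)
                return -1;
        /* One bit per 4K page, rounded up to whole 64-bit words. */
        log.dirty_bitmap = calloc((size / 4096 + 63) / 64, 8);
        if (!log.dirty_bitmap)
                return -1;
        return ioctl(vm_fd, KVM_GET_DIRTY_LOG, &log);
}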
11032 if (!list_empty_careful(&vcpu->async_pf.done)) in kvm_vcpu_has_events()
11038 if (vcpu->arch.pv.pv_unhalted) in kvm_vcpu_has_events()
11041 if (vcpu->arch.exception.pending) in kvm_vcpu_has_events()
11045 (vcpu->arch.nmi_pending && in kvm_vcpu_has_events()
11050 (vcpu->arch.smi_pending && in kvm_vcpu_has_events()
11063 kvm_x86_ops.nested_ops->hv_timer_pending && in kvm_vcpu_has_events()
11064 kvm_x86_ops.nested_ops->hv_timer_pending(vcpu)) in kvm_vcpu_has_events()
11077 if (READ_ONCE(vcpu->arch.pv.pv_unhalted)) in kvm_arch_dy_runnable()
11085 if (vcpu->arch.apicv_active && kvm_x86_ops.dy_apicv_has_pending_interrupt(vcpu)) in kvm_arch_dy_runnable()
11093 return vcpu->arch.preempted_in_kernel; in kvm_arch_vcpu_in_kernel()
11126 if (vcpu->guest_debug & KVM_GUESTDBG_SINGLESTEP) in kvm_get_rflags()
11134 if (vcpu->guest_debug & KVM_GUESTDBG_SINGLESTEP && in __kvm_set_rflags()
11135 kvm_is_linear_rip(vcpu, vcpu->arch.singlestep_rip)) in __kvm_set_rflags()
11151 if ((vcpu->arch.mmu->direct_map != work->arch.direct_map) || in kvm_arch_async_page_ready()
11152 work->wakeup_all) in kvm_arch_async_page_ready()
11159 if (!vcpu->arch.mmu->direct_map && in kvm_arch_async_page_ready()
11160 work->arch.cr3 != vcpu->arch.mmu->get_guest_pgd(vcpu)) in kvm_arch_async_page_ready()
11163 kvm_mmu_do_page_fault(vcpu, work->cr2_or_gpa, 0, true); in kvm_arch_async_page_ready()
11175 return (key + 1) & (ASYNC_PF_PER_VCPU - 1); in kvm_async_pf_next_probe()
11182 while (vcpu->arch.apf.gfns[key] != ~0) in kvm_add_async_pf_gfn()
11185 vcpu->arch.apf.gfns[key] = gfn; in kvm_add_async_pf_gfn()
11194 (vcpu->arch.apf.gfns[key] != gfn && in kvm_async_pf_gfn_slot()
11195 vcpu->arch.apf.gfns[key] != ~0); i++) in kvm_async_pf_gfn_slot()
11203 return vcpu->arch.apf.gfns[kvm_async_pf_gfn_slot(vcpu, gfn)] == gfn; in kvm_find_async_pf_gfn()
11212 if (WARN_ON_ONCE(vcpu->arch.apf.gfns[i] != gfn)) in kvm_del_async_pf_gfn()
11216 vcpu->arch.apf.gfns[i] = ~0; in kvm_del_async_pf_gfn()
11219 if (vcpu->arch.apf.gfns[j] == ~0) in kvm_del_async_pf_gfn()
11221 k = kvm_async_pf_hash_fn(vcpu->arch.apf.gfns[j]); in kvm_del_async_pf_gfn()
11228 vcpu->arch.apf.gfns[i] = vcpu->arch.apf.gfns[j]; in kvm_del_async_pf_gfn()
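
The apf.gfns table above is a small open-addressed hash with linear probing: ~0 marks a free slot, kvm_add_async_pf_gfn() probes forward from the gfn's home bucket, and kvm_del_async_pf_gfn() deletes by back-shifting, pulling forward any later entry whose home bucket would otherwise be cut off by the new hole. A standalone model; the multiplicative hash is a stand-in for the kernel's hash_32():

typedef unsigned long long u64;

#define NSLOTS  64                      /* ASYNC_PF_PER_VCPU */
#define EMPTY   (~0ULL)

static u64 slots[NSLOTS] = { [0 ... NSLOTS - 1] = EMPTY };

static unsigned int hashfn(u64 gfn)
{
        return (unsigned int)(gfn * 2654435761u) & (NSLOTS - 1);
}

static unsigned int next(unsigned int k)
{
        return (k + 1) & (NSLOTS - 1);  /* kvm_async_pf_next_probe() */
}

static void add_gfn(u64 gfn)
{
        unsigned int k = hashfn(gfn);

        while (slots[k] != EMPTY)       /* linear probing */
                k = next(k);
        slots[k] = gfn;
}

static void del_gfn(u64 gfn)            /* caller guarantees presence */
{
        unsigned int i, j, k;

        i = hashfn(gfn);
        while (slots[i] != gfn)
                i = next(i);
        j = i;
        for (;;) {
                slots[i] = EMPTY;
                do {
                        j = next(j);
                        if (slots[j] == EMPTY)
                                return;
                        k = hashfn(slots[j]);
                        /* Entries whose home bucket k lies cyclically in
                         * (i, j] are still reachable; skip them. */
                } while ((i <= j) ? (i < k && k <= j) : (i < k || k <= j));
                slots[i] = slots[j];    /* back-shift over the hole */
                i = j;
        }
}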
11237 return kvm_write_guest_cached(vcpu->kvm, &vcpu->arch.apf.data, &reason, in apf_put_user_notpresent()
11245 return kvm_write_guest_offset_cached(vcpu->kvm, &vcpu->arch.apf.data, in apf_put_user_ready()
11254 if (kvm_read_guest_offset_cached(vcpu->kvm, &vcpu->arch.apf.data, in apf_pageready_slot_free()
11263 if (!vcpu->arch.apf.delivery_as_pf_vmexit && is_guest_mode(vcpu)) in kvm_can_deliver_async_pf()
11267 (vcpu->arch.apf.send_user_only && kvm_x86_ops.get_cpl(vcpu) == 0)) in kvm_can_deliver_async_pf()
11277 vcpu->arch.exception.pending)) in kvm_can_do_async_pf()
11280 if (kvm_hlt_in_guest(vcpu->kvm) && !kvm_can_deliver_async_pf(vcpu)) in kvm_can_do_async_pf()
11295 trace_kvm_async_pf_not_present(work->arch.token, work->cr2_or_gpa); in kvm_arch_async_page_not_present()
11296 kvm_add_async_pf_gfn(vcpu, work->arch.gfn); in kvm_arch_async_page_not_present()
11304 fault.address = work->arch.token; in kvm_arch_async_page_not_present()
11327 .vector = vcpu->arch.apf.vec in kvm_arch_async_page_present()
11330 if (work->wakeup_all) in kvm_arch_async_page_present()
11331 work->arch.token = ~0; /* broadcast wakeup */ in kvm_arch_async_page_present()
11333 kvm_del_async_pf_gfn(vcpu, work->arch.gfn); in kvm_arch_async_page_present()
11334 trace_kvm_async_pf_ready(work->arch.token, work->cr2_or_gpa); in kvm_arch_async_page_present()
11336 if ((work->wakeup_all || work->notpresent_injected) && in kvm_arch_async_page_present()
11338 !apf_put_user_ready(vcpu, work->arch.token)) { in kvm_arch_async_page_present()
11339 vcpu->arch.apf.pageready_pending = true; in kvm_arch_async_page_present()
11343 vcpu->arch.apf.halted = false; in kvm_arch_async_page_present()
11344 vcpu->arch.mp_state = KVM_MP_STATE_RUNNABLE; in kvm_arch_async_page_present()
11350 if (!vcpu->arch.apf.pageready_pending) in kvm_arch_async_page_present_queued()
11364 atomic_inc(&kvm->arch.assigned_device_count); in kvm_arch_start_assignment()
11370 atomic_dec(&kvm->arch.assigned_device_count); in kvm_arch_end_assignment()
11376 return atomic_read(&kvm->arch.assigned_device_count); in kvm_arch_has_assigned_device()
11382 atomic_inc(&kvm->arch.noncoherent_dma_count); in kvm_arch_register_noncoherent_dma()
11388 atomic_dec(&kvm->arch.noncoherent_dma_count); in kvm_arch_unregister_noncoherent_dma()
11394 return atomic_read(&kvm->arch.noncoherent_dma_count); in kvm_arch_has_noncoherent_dma()
11410 irqfd->producer = prod; in kvm_arch_irq_bypass_add_producer()
11411 kvm_arch_start_assignment(irqfd->kvm); in kvm_arch_irq_bypass_add_producer()
11412 ret = kvm_x86_ops.update_pi_irte(irqfd->kvm, in kvm_arch_irq_bypass_add_producer()
11413 prod->irq, irqfd->gsi, 1); in kvm_arch_irq_bypass_add_producer()
11416 kvm_arch_end_assignment(irqfd->kvm); in kvm_arch_irq_bypass_add_producer()
11428 WARN_ON(irqfd->producer != prod); in kvm_arch_irq_bypass_del_producer()
11429 irqfd->producer = NULL; in kvm_arch_irq_bypass_del_producer()
11433 * remapped mode, so we can re-use the current implementation in kvm_arch_irq_bypass_del_producer()
11437 ret = kvm_x86_ops.update_pi_irte(irqfd->kvm, prod->irq, irqfd->gsi, 0); in kvm_arch_irq_bypass_del_producer()
11440 " fails: %d\n", irqfd->consumer.token, ret); in kvm_arch_irq_bypass_del_producer()
11442 kvm_arch_end_assignment(irqfd->kvm); in kvm_arch_irq_bypass_del_producer()
11458 return (vcpu->arch.msr_kvm_poll_control & 1) == 0; in kvm_arch_no_poll()
11496 vcpu->arch.walk_mmu->gva_to_gpa(vcpu, gva, access, &fault) != UNMAPPED_GVA) { in kvm_fixup_and_inject_pf_error()
11498 * If vcpu->arch.walk_mmu->gva_to_gpa succeeded, the page in kvm_fixup_and_inject_pf_error()
11508 vcpu->arch.walk_mmu->inject_page_fault(vcpu, &fault); in kvm_fixup_and_inject_pf_error()
11529 * doesn't seem to be a real use-case behind such requests, just return in kvm_handle_memory_failure()
11532 vcpu->run->exit_reason = KVM_EXIT_INTERNAL_ERROR; in kvm_handle_memory_failure()
11533 vcpu->run->internal.suberror = KVM_INTERNAL_ERROR_EMULATION; in kvm_handle_memory_failure()
11534 vcpu->run->internal.ndata = 0; in kvm_handle_memory_failure()
11585 if (kvm_get_pcid(vcpu, vcpu->arch.mmu->prev_roots[i].pgd) in kvm_handle_invpcid()
11589 kvm_mmu_free_roots(vcpu, vcpu->arch.mmu, roots_to_free); in kvm_handle_invpcid()
11601 * page tables, so a non-global flush just degenerates to a in kvm_handle_invpcid()