/* SPDX-License-Identifier: GPL-2.0 */
#ifndef ARCH_X86_KVM_X86_H
#define ARCH_X86_KVM_X86_H

#include <linux/kvm_host.h>

#include <asm/pvclock.h>
#include "kvm_cache_regs.h"
#include "kvm_emulate.h"

#define KVM_DEFAULT_PLE_GAP		128
#define KVM_VMX_DEFAULT_PLE_WINDOW	4096
#define KVM_DEFAULT_PLE_WINDOW_GROW	2
#define KVM_DEFAULT_PLE_WINDOW_SHRINK	0
#define KVM_VMX_DEFAULT_PLE_WINDOW_MAX	UINT_MAX
#define KVM_SVM_DEFAULT_PLE_WINDOW_MAX	USHRT_MAX
#define KVM_SVM_DEFAULT_PLE_WINDOW	3000

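/*
 * Helpers shared by VMX and SVM to grow/shrink the PLE (pause-loop exiting)
 * window: growth multiplies by the modifier when it is smaller than the base
 * and adds it otherwise, shrinking does the inverse, and the result is
 * clamped to the supplied max/min.
 */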
static inline unsigned int __grow_ple_window(unsigned int val,
		unsigned int base, unsigned int modifier, unsigned int max)
{
	u64 ret = val;

	if (modifier < 1)
		return base;

	if (modifier < base)
		ret *= modifier;
	else
		ret += modifier;

	return min(ret, (u64)max);
}

static inline unsigned int __shrink_ple_window(unsigned int val,
		unsigned int base, unsigned int modifier, unsigned int min)
{
	unsigned int ret;

	if (modifier < 1)
		return base;

	if (modifier < base)
		ret = val / modifier;
	else
		ret = val - modifier;

	return max(ret, min);
}

#define MSR_IA32_CR_PAT_DEFAULT  0x0007040600070406ULL

static inline void kvm_clear_exception_queue(struct kvm_vcpu *vcpu)
{
	vcpu->arch.exception.pending = false;
	vcpu->arch.exception.injected = false;
}

static inline void kvm_queue_interrupt(struct kvm_vcpu *vcpu, u8 vector,
				       bool soft)
{
	vcpu->arch.interrupt.injected = true;
	vcpu->arch.interrupt.soft = soft;
	vcpu->arch.interrupt.nr = vector;
}

static inline void kvm_clear_interrupt_queue(struct kvm_vcpu *vcpu)
{
	vcpu->arch.interrupt.injected = false;
}

static inline bool kvm_event_needs_reinjection(struct kvm_vcpu *vcpu)
{
	return vcpu->arch.exception.injected || vcpu->arch.interrupt.injected ||
		vcpu->arch.nmi_injected;
}

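/*
 * #BP and #OF are "soft" exceptions: they are synthesized by an instruction
 * (INT3/INTO) rather than signalled by a fault condition, which matters when
 * re-injecting them (e.g. the instruction length must be provided on VMX).
 */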
static inline bool kvm_exception_is_soft(unsigned int nr)
{
	return (nr == BP_VECTOR) || (nr == OF_VECTOR);
}

static inline bool is_protmode(struct kvm_vcpu *vcpu)
{
	return kvm_read_cr0_bits(vcpu, X86_CR0_PE);
}

static inline int is_long_mode(struct kvm_vcpu *vcpu)
{
#ifdef CONFIG_X86_64
	return vcpu->arch.efer & EFER_LMA;
#else
	return 0;
#endif
}

static inline bool is_64_bit_mode(struct kvm_vcpu *vcpu)
{
	int cs_db, cs_l;

	if (!is_long_mode(vcpu))
		return false;
	kvm_x86_ops.get_cs_db_l_bits(vcpu, &cs_db, &cs_l);
	return cs_l;
}

static inline bool is_la57_mode(struct kvm_vcpu *vcpu)
{
#ifdef CONFIG_X86_64
	return (vcpu->arch.efer & EFER_LMA) &&
		kvm_read_cr4_bits(vcpu, X86_CR4_LA57);
#else
	return 0;
#endif
}

static inline bool x86_exception_has_error_code(unsigned int vector)
{
	static u32 exception_has_error_code = BIT(DF_VECTOR) | BIT(TS_VECTOR) |
			BIT(NP_VECTOR) | BIT(SS_VECTOR) | BIT(GP_VECTOR) |
			BIT(PF_VECTOR) | BIT(AC_VECTOR);

	return (1U << vector) & exception_has_error_code;
}

static inline bool mmu_is_nested(struct kvm_vcpu *vcpu)
{
	return vcpu->arch.walk_mmu == &vcpu->arch.nested_mmu;
}

static inline void kvm_vcpu_flush_tlb_current(struct kvm_vcpu *vcpu)
{
	++vcpu->stat.tlb_flush;
	kvm_x86_ops.tlb_flush_current(vcpu);
}

static inline int is_pae(struct kvm_vcpu *vcpu)
{
	return kvm_read_cr4_bits(vcpu, X86_CR4_PAE);
}

static inline int is_pse(struct kvm_vcpu *vcpu)
{
	return kvm_read_cr4_bits(vcpu, X86_CR4_PSE);
}

static inline int is_paging(struct kvm_vcpu *vcpu)
{
	return likely(kvm_read_cr0_bits(vcpu, X86_CR0_PG));
}

static inline bool is_pae_paging(struct kvm_vcpu *vcpu)
{
	return !is_long_mode(vcpu) && is_pae(vcpu) && is_paging(vcpu);
}

static inline u8 vcpu_virt_addr_bits(struct kvm_vcpu *vcpu)
{
	return kvm_read_cr4_bits(vcpu, X86_CR4_LA57) ? 57 : 48;
}

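/*
 * A linear address is canonical when bits [63:vaddr_bits] are all copies of
 * bit (vaddr_bits - 1).  get_canonical() sign-extends from that bit, so
 * comparing the result with the original address detects non-canonical
 * values.
 */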
static inline u64 get_canonical(u64 la, u8 vaddr_bits)
{
	return ((int64_t)la << (64 - vaddr_bits)) >> (64 - vaddr_bits);
}

static inline bool is_noncanonical_address(u64 la, struct kvm_vcpu *vcpu)
{
	return get_canonical(la, vcpu_virt_addr_bits(vcpu)) != la;
}

static inline void vcpu_cache_mmio_info(struct kvm_vcpu *vcpu,
					gva_t gva, gfn_t gfn, unsigned access)
{
	u64 gen = kvm_memslots(vcpu->kvm)->generation;

	if (unlikely(gen & KVM_MEMSLOT_GEN_UPDATE_IN_PROGRESS))
		return;

	/*
	 * If this is a shadow nested page table, the "GVA" is
	 * actually a nGPA.
	 */
	vcpu->arch.mmio_gva = mmu_is_nested(vcpu) ? 0 : gva & PAGE_MASK;
	vcpu->arch.mmio_access = access;
	vcpu->arch.mmio_gfn = gfn;
	vcpu->arch.mmio_gen = gen;
}

static inline bool vcpu_match_mmio_gen(struct kvm_vcpu *vcpu)
{
	return vcpu->arch.mmio_gen == kvm_memslots(vcpu->kvm)->generation;
}

/*
 * Clear the mmio cache info for the given gva. If gva is MMIO_GVA_ANY, we
 * clear all mmio cache info.
 */
#define MMIO_GVA_ANY (~(gva_t)0)

static inline void vcpu_clear_mmio_info(struct kvm_vcpu *vcpu, gva_t gva)
{
	if (gva != MMIO_GVA_ANY && vcpu->arch.mmio_gva != (gva & PAGE_MASK))
		return;

	vcpu->arch.mmio_gva = 0;
}

static inline bool vcpu_match_mmio_gva(struct kvm_vcpu *vcpu, unsigned long gva)
{
	if (vcpu_match_mmio_gen(vcpu) && vcpu->arch.mmio_gva &&
	    vcpu->arch.mmio_gva == (gva & PAGE_MASK))
		return true;

	return false;
}

static inline bool vcpu_match_mmio_gpa(struct kvm_vcpu *vcpu, gpa_t gpa)
{
	if (vcpu_match_mmio_gen(vcpu) && vcpu->arch.mmio_gfn &&
	    vcpu->arch.mmio_gfn == gpa >> PAGE_SHIFT)
		return true;

	return false;
}

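/*
 * Register accessors for use outside 64-bit mode: reads and writes of
 * general-purpose registers are truncated to their low 32 bits when the vCPU
 * is not in 64-bit mode.
 */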
static inline unsigned long kvm_register_readl(struct kvm_vcpu *vcpu, int reg)
{
	unsigned long val = kvm_register_read(vcpu, reg);

	return is_64_bit_mode(vcpu) ? val : (u32)val;
}

static inline void kvm_register_writel(struct kvm_vcpu *vcpu,
				       int reg, unsigned long val)
{
	if (!is_64_bit_mode(vcpu))
		val = (u32)val;
	return kvm_register_write(vcpu, reg, val);
}

static inline bool kvm_check_has_quirk(struct kvm *kvm, u64 quirk)
{
	return !(kvm->arch.disabled_quirks & quirk);
}

static inline bool kvm_vcpu_latch_init(struct kvm_vcpu *vcpu)
{
	return is_smm(vcpu) || kvm_x86_ops.apic_init_signal_blocked(vcpu);
}

void kvm_inject_realmode_interrupt(struct kvm_vcpu *vcpu, int irq, int inc_eip);

void kvm_write_tsc(struct kvm_vcpu *vcpu, struct msr_data *msr);
u64 get_kvmclock_ns(struct kvm *kvm);

int kvm_read_guest_virt(struct kvm_vcpu *vcpu,
			gva_t addr, void *val, unsigned int bytes,
			struct x86_exception *exception);

int kvm_write_guest_virt_system(struct kvm_vcpu *vcpu,
				gva_t addr, void *val, unsigned int bytes,
				struct x86_exception *exception);

int handle_ud(struct kvm_vcpu *vcpu);

void kvm_deliver_exception_payload(struct kvm_vcpu *vcpu);

void kvm_vcpu_mtrr_init(struct kvm_vcpu *vcpu);
u8 kvm_mtrr_get_guest_memory_type(struct kvm_vcpu *vcpu, gfn_t gfn);
bool kvm_mtrr_valid(struct kvm_vcpu *vcpu, u32 msr, u64 data);
int kvm_mtrr_set_msr(struct kvm_vcpu *vcpu, u32 msr, u64 data);
int kvm_mtrr_get_msr(struct kvm_vcpu *vcpu, u32 msr, u64 *pdata);
bool kvm_mtrr_check_gfn_range_consistency(struct kvm_vcpu *vcpu, gfn_t gfn,
					  int page_num);
bool kvm_vector_hashing_enabled(void);
void kvm_fixup_and_inject_pf_error(struct kvm_vcpu *vcpu, gva_t gva, u16 error_code);
int x86_emulate_instruction(struct kvm_vcpu *vcpu, gpa_t cr2_or_gpa,
			    int emulation_type, void *insn, int insn_len);
fastpath_t handle_fastpath_set_msr_irqoff(struct kvm_vcpu *vcpu);

extern u64 host_xcr0;
extern u64 supported_xcr0;
extern u64 supported_xss;

static inline bool kvm_mpx_supported(void)
{
	return (supported_xcr0 & (XFEATURE_MASK_BNDREGS | XFEATURE_MASK_BNDCSR))
		== (XFEATURE_MASK_BNDREGS | XFEATURE_MASK_BNDCSR);
}

extern unsigned int min_timer_period_us;

extern bool enable_vmware_backdoor;

extern int pi_inject_timer;

extern struct static_key kvm_no_apic_vcpu;

static inline u64 nsec_to_cycles(struct kvm_vcpu *vcpu, u64 nsec)
{
	return pvclock_scale_delta(nsec, vcpu->arch.virtual_tsc_mult,
				   vcpu->arch.virtual_tsc_shift);
}

/* Same "calling convention" as do_div:
 * - divide (n << 32) by base
 * - put result in n
 * - return remainder
 */
#define do_shl32_div32(n, base)					\
	({							\
	    u32 __quot, __rem;					\
	    asm("divl %2" : "=a" (__quot), "=d" (__rem)		\
		: "rm" (base), "0" (0), "1" ((u32) n));		\
	    n = __quot;						\
	    __rem;						\
	 })

static inline bool kvm_mwait_in_guest(struct kvm *kvm)
{
	return kvm->arch.mwait_in_guest;
}

static inline bool kvm_hlt_in_guest(struct kvm *kvm)
{
	return kvm->arch.hlt_in_guest;
}

static inline bool kvm_pause_in_guest(struct kvm *kvm)
{
	return kvm->arch.pause_in_guest;
}

static inline bool kvm_cstate_in_guest(struct kvm *kvm)
{
	return kvm->arch.cstate_in_guest;
}

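/*
 * current_vcpu tracks the vCPU that is (or was just) running on this CPU
 * while host interrupts/NMIs are being handled, so that handlers such as
 * perf's guest callbacks can attribute the event to the guest.
 */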
DECLARE_PER_CPU(struct kvm_vcpu *, current_vcpu);

static inline void kvm_before_interrupt(struct kvm_vcpu *vcpu)
{
	__this_cpu_write(current_vcpu, vcpu);
}

static inline void kvm_after_interrupt(struct kvm_vcpu *vcpu)
{
	__this_cpu_write(current_vcpu, NULL);
}

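/*
 * A PAT value is valid when every byte encodes one of the defined memory
 * types 0, 1, 4, 5, 6 or 7: the high five bits of each byte must be clear,
 * and the reserved encodings 2 and 3 (bit 1 set, bit 2 clear) are rejected
 * by the OR trick below.
 */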
static inline bool kvm_pat_valid(u64 data)
{
	if (data & 0xF8F8F8F8F8F8F8F8ull)
		return false;
	/* 0, 1, 4, 5, 6, 7 are valid values.  */
	return (data | ((data & 0x0202020202020202ull) << 1)) == data;
}

static inline bool kvm_dr7_valid(u64 data)
{
	/* Bits [63:32] are reserved */
	return !(data >> 32);
}

static inline bool kvm_dr6_valid(u64 data)
{
	/* Bits [63:32] are reserved */
	return !(data >> 32);
}

/*
 * Trigger machine check on the host. We assume all the MSRs are already set up
 * by the CPU and that we still run on the same CPU as the MCE occurred on.
 * We pass a fake environment to the machine check handler because we want
 * the guest to be always treated like user space, no matter what context
 * it used internally.
 */
static inline void kvm_machine_check(void)
{
#if defined(CONFIG_X86_MCE)
	struct pt_regs regs = {
		.cs = 3, /* Fake ring 3 no matter what the guest ran on */
		.flags = X86_EFLAGS_IF,
	};

	do_machine_check(&regs);
#endif
}

void kvm_load_guest_xsave_state(struct kvm_vcpu *vcpu);
void kvm_load_host_xsave_state(struct kvm_vcpu *vcpu);
int kvm_spec_ctrl_test_value(u64 value);
bool kvm_is_valid_cr4(struct kvm_vcpu *vcpu, unsigned long cr4);
bool kvm_vcpu_exit_request(struct kvm_vcpu *vcpu);
int kvm_handle_memory_failure(struct kvm_vcpu *vcpu, int r,
			      struct x86_exception *e);
int kvm_handle_invpcid(struct kvm_vcpu *vcpu, unsigned long type, gva_t gva);
bool kvm_msr_allowed(struct kvm_vcpu *vcpu, u32 index, u32 type);

/*
 * Internal error codes that are used to indicate that MSR emulation encountered
 * an error that should result in #GP in the guest, unless userspace
 * handles it.
 */
#define KVM_MSR_RET_INVALID	2	/* in-kernel MSR emulation #GP condition */
#define KVM_MSR_RET_FILTERED	3	/* #GP due to userspace MSR filter */

#define __cr4_reserved_bits(__cpu_has, __c)		\
({							\
	u64 __reserved_bits = CR4_RESERVED_BITS;	\
							\
	if (!__cpu_has(__c, X86_FEATURE_XSAVE))		\
		__reserved_bits |= X86_CR4_OSXSAVE;	\
	if (!__cpu_has(__c, X86_FEATURE_SMEP))		\
		__reserved_bits |= X86_CR4_SMEP;	\
	if (!__cpu_has(__c, X86_FEATURE_SMAP))		\
		__reserved_bits |= X86_CR4_SMAP;	\
	if (!__cpu_has(__c, X86_FEATURE_FSGSBASE))	\
		__reserved_bits |= X86_CR4_FSGSBASE;	\
	if (!__cpu_has(__c, X86_FEATURE_PKU))		\
		__reserved_bits |= X86_CR4_PKE;		\
	if (!__cpu_has(__c, X86_FEATURE_LA57))		\
		__reserved_bits |= X86_CR4_LA57;	\
	if (!__cpu_has(__c, X86_FEATURE_UMIP))		\
		__reserved_bits |= X86_CR4_UMIP;	\
	if (!__cpu_has(__c, X86_FEATURE_VMX))		\
		__reserved_bits |= X86_CR4_VMXE;	\
	__reserved_bits;				\
})

int kvm_sev_es_mmio_write(struct kvm_vcpu *vcpu, gpa_t src, unsigned int bytes,
			  void *data);
int kvm_sev_es_mmio_read(struct kvm_vcpu *vcpu, gpa_t src, unsigned int bytes,
			 void *data);
int kvm_sev_es_string_io(struct kvm_vcpu *vcpu, unsigned int size,
			 unsigned int port, void *data, unsigned int count,
			 int in);