/* Copyright 2008 IBM Corporation
 * Copyright 2011 Intel Corporation
 * Copyright 2016 Veertu, Inc.
 * Copyright 2017 The Android Open Source Project
 *
 * QEMU Hypervisor.framework support
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this program; if not, see <http://www.gnu.org/licenses/>.
 *
 * This file contains code under public domain from the hvdos project:
 * https://github.com/mist64/hvdos
 *
 * Parts Copyright (c) 2011 NetApp, Inc.
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY NETAPP, INC ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL NETAPP, INC OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */
48 #include "qemu/osdep.h"
49 #include "qemu-common.h"
50 #include "qemu/error-report.h"
52 #include "sysemu/hvf.h"
57 #include "x86_descr.h"
59 #include "x86_decode.h"
64 #include <Hypervisor/hv.h>
65 #include <Hypervisor/hv_vmx.h>
67 #include "exec/address-spaces.h"
68 #include "hw/i386/apic_internal.h"
69 #include "hw/boards.h"
70 #include "qemu/main-loop.h"
71 #include "sysemu/accel.h"
72 #include "sysemu/sysemu.h"
73 #include "target/i386/cpu.h"
pthread_rwlock_t mem_lock = PTHREAD_RWLOCK_INITIALIZER;
static void assert_hvf_ok(hv_return_t ret)
{
    if (ret == HV_SUCCESS) {
        return;
    }

    switch (ret) {
    case HV_ERROR:
        error_report("Error: HV_ERROR");
        break;
    case HV_BUSY:
        error_report("Error: HV_BUSY");
        break;
    case HV_BAD_ARGUMENT:
        error_report("Error: HV_BAD_ARGUMENT");
        break;
    case HV_NO_RESOURCES:
        error_report("Error: HV_NO_RESOURCES");
        break;
    case HV_NO_DEVICE:
        error_report("Error: HV_NO_DEVICE");
        break;
    case HV_UNSUPPORTED:
        error_report("Error: HV_UNSUPPORTED");
        break;
    default:
        error_report("Unknown Error");
    }

    abort();
}
hvf_slot *hvf_find_overlap_slot(uint64_t start, uint64_t end)
{
    hvf_slot *slot;
    int x;

    for (x = 0; x < hvf_state->num_slots; ++x) {
        slot = &hvf_state->slots[x];
        if (slot->size && start < (slot->start + slot->size) &&
            end > slot->start) {
            return slot;
        }
    }

    return NULL;
}
struct mac_slot mac_slots[32];
#define ALIGN(x, y) (((x) + (y) - 1) & ~((y) - 1))
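/*
 * Each hvf_slot that is actually mapped into the guest has a matching
 * mac_slot recording the gpa_start/size last handed to hv_vm_map(), so a
 * resize can be expressed as hv_vm_unmap() of the old range followed by a
 * fresh hv_vm_map() in do_hvf_set_memory() below.
 */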
static int do_hvf_set_memory(hvf_slot *slot)
{
    struct mac_slot *macslot;
    hv_memory_flags_t flags;
    int ret;

    macslot = &mac_slots[slot->slot_id];

    if (macslot->present) {
        if (macslot->size != slot->size) {
            macslot->present = 0;
            ret = hv_vm_unmap(macslot->gpa_start, macslot->size);
            assert_hvf_ok(ret);
        }
    }

    if (!slot->size) {
        return 0;
    }

    flags = HV_MEMORY_READ | HV_MEMORY_WRITE | HV_MEMORY_EXEC;

    macslot->present = 1;
    macslot->gpa_start = slot->start;
    macslot->size = slot->size;
    ret = hv_vm_map((hv_uvaddr_t)slot->mem, slot->start, slot->size, flags);
    assert_hvf_ok(ret);
    return 0;
}
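/*
 * RAM slots are mapped read/write/execute here; write protection used for
 * dirty-page tracking is applied afterwards with hv_vm_protect() (see
 * hvf_set_dirty_tracking() below) rather than at map time.
 */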
void hvf_set_phys_mem(MemoryRegionSection *section, bool add)
{
    hvf_slot *mem;
    int x;
    MemoryRegion *area = section->mr;

    if (!memory_region_is_ram(area)) {
        return;
    }

    mem = hvf_find_overlap_slot(
            section->offset_within_address_space,
            section->offset_within_address_space + int128_get64(section->size));

    if (mem && add) {
        if (mem->size == int128_get64(section->size) &&
            mem->start == section->offset_within_address_space &&
            mem->mem == (memory_region_get_ram_ptr(area) +
            section->offset_within_region)) {
            return; /* Same region was attempted to register, go away. */
        }
    }

    /* Region needs to be reset. set the size to 0 and remap it. */
    if (mem) {
        mem->size = 0;
        if (do_hvf_set_memory(mem)) {
            error_report("Failed to reset overlapping slot");
            abort();
        }
    }

    if (!add) {
        return;
    }

    /* Now make a new slot. */
    for (x = 0; x < hvf_state->num_slots; ++x) {
        mem = &hvf_state->slots[x];
        if (!mem->size) {
            break;
        }
    }

    if (x == hvf_state->num_slots) {
        error_report("No free slots");
        abort();
    }

    mem->size = int128_get64(section->size);
    mem->mem = memory_region_get_ram_ptr(area) + section->offset_within_region;
    mem->start = section->offset_within_address_space;
    mem->region = area;

    if (do_hvf_set_memory(mem)) {
        error_report("Error registering new memory slot");
        abort();
    }
}
void vmx_update_tpr(CPUState *cpu)
{
    /* TODO: need to integrate APIC handling */
    X86CPU *x86_cpu = X86_CPU(cpu);
    int tpr = cpu_get_apic_tpr(x86_cpu->apic_state) << 4;
    int irr = apic_get_highest_priority_irr(x86_cpu->apic_state);

    wreg(cpu->hvf_fd, HV_X86_TPR, tpr);
    if (irr == -1) {
        wvmcs(cpu->hvf_fd, VMCS_TPR_THRESHOLD, 0);
    } else {
        wvmcs(cpu->hvf_fd, VMCS_TPR_THRESHOLD, (irr > tpr) ? tpr >> 4 :
              irr >> 4);
    }
}
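/*
 * TPR shadowing: the guest's CR8 accesses hit the HV_X86_TPR shadow
 * register instead of exiting.  vmx_update_tpr() programs
 * VMCS_TPR_THRESHOLD with the priority of the highest pending interrupt
 * before entry, so the vCPU only exits when the guest lowers its TPR far
 * enough for that interrupt to become deliverable; update_apic_tpr()
 * copies the shadow value back into the emulated APIC after an exit.
 */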
void update_apic_tpr(CPUState *cpu)
{
    X86CPU *x86_cpu = X86_CPU(cpu);
    int tpr = rreg(cpu->hvf_fd, HV_X86_TPR) >> 4;
    cpu_set_apic_tpr(x86_cpu->apic_state, tpr);
}

#define VECTORING_INFO_VECTOR_MASK 0xff
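/*
 * Bits 7:0 of the VMCS interruption/IDT-vectoring information fields hold
 * the vector number of the event being delivered.
 */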
static void hvf_handle_interrupt(CPUState *cpu, int mask)
{
    cpu->interrupt_request |= mask;
    if (!qemu_cpu_is_self(cpu)) {
        qemu_cpu_kick(cpu);
    }
}
void hvf_handle_io(CPUArchState *env, uint16_t port, void *buffer,
                   int direction, int size, int count)
{
    int i;
    uint8_t *ptr = buffer;

    for (i = 0; i < count; i++) {
        address_space_rw(&address_space_io, port, MEMTXATTRS_UNSPECIFIED,
                         ptr, size, direction);
        ptr += size;
    }
}
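/*
 * direction != 0 is a guest "out" (write towards the device model),
 * direction == 0 is an "in"; string/rep port I/O arrives with count > 1
 * and the buffer is advanced by size after every transfer.
 */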
/* TODO: synchronize vcpu state */
static void do_hvf_cpu_synchronize_state(CPUState *cpu, run_on_cpu_data arg)
{
    CPUState *cpu_state = cpu;
    if (cpu_state->vcpu_dirty == 0) {
        hvf_get_registers(cpu_state);
    }

    cpu_state->vcpu_dirty = 1;
}

void hvf_cpu_synchronize_state(CPUState *cpu_state)
{
    if (cpu_state->vcpu_dirty == 0) {
        run_on_cpu(cpu_state, do_hvf_cpu_synchronize_state, RUN_ON_CPU_NULL);
    }
}

static void do_hvf_cpu_synchronize_post_reset(CPUState *cpu, run_on_cpu_data arg)
{
    CPUState *cpu_state = cpu;
    hvf_put_registers(cpu_state);
    cpu_state->vcpu_dirty = false;
}

void hvf_cpu_synchronize_post_reset(CPUState *cpu_state)
{
    run_on_cpu(cpu_state, do_hvf_cpu_synchronize_post_reset, RUN_ON_CPU_NULL);
}

void _hvf_cpu_synchronize_post_init(CPUState *cpu, run_on_cpu_data arg)
{
    CPUState *cpu_state = cpu;
    hvf_put_registers(cpu_state);
    cpu_state->vcpu_dirty = false;
}

void hvf_cpu_synchronize_post_init(CPUState *cpu_state)
{
    run_on_cpu(cpu_state, _hvf_cpu_synchronize_post_init, RUN_ON_CPU_NULL);
}
static bool ept_emulation_fault(hvf_slot *slot, uint64_t gpa, uint64_t ept_qual)
{
    int read, write;

    /* EPT fault on an instruction fetch doesn't make sense here */
    if (ept_qual & EPT_VIOLATION_INST_FETCH) {
        return false;
    }

    /* EPT fault must be a read fault or a write fault */
    read = ept_qual & EPT_VIOLATION_DATA_READ ? 1 : 0;
    write = ept_qual & EPT_VIOLATION_DATA_WRITE ? 1 : 0;
    if ((read | write) == 0) {
        return false;
    }

    if (write && slot) {
        if (slot->flags & HVF_SLOT_LOG) {
            memory_region_set_dirty(slot->region, gpa - slot->start, 1);
            hv_vm_protect((hv_gpaddr_t)slot->start, (size_t)slot->size,
                          HV_MEMORY_READ | HV_MEMORY_WRITE);
        }
    }

    /*
     * The EPT violation must have been caused by accessing a
     * guest-physical address that is a translation of a guest-linear
     * address.
     */
    if ((ept_qual & EPT_VIOLATION_GLA_VALID) == 0 ||
        (ept_qual & EPT_VIOLATION_XLAT_VALID) == 0) {
        return false;
    }

    return !slot;
}
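/*
 * Note on the dirty-logging path above: slots with HVF_SLOT_LOG are mapped
 * without write permission (see hvf_set_dirty_tracking), so the first guest
 * write to such a slot faults here, the range is marked dirty, and write
 * access is restored with hv_vm_protect().  A fault that hits no RAM slot
 * at all is an MMIO access and is handed to the instruction emulator by
 * the caller.
 */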
static void hvf_set_dirty_tracking(MemoryRegionSection *section, bool on)
{
    hvf_slot *slot;

    slot = hvf_find_overlap_slot(
            section->offset_within_address_space,
            section->offset_within_address_space + int128_get64(section->size));

    /* protect region against writes; begin tracking it */
    if (on) {
        slot->flags |= HVF_SLOT_LOG;
        hv_vm_protect((hv_gpaddr_t)slot->start, (size_t)slot->size,
                      HV_MEMORY_READ);
    /* stop tracking region */
    } else {
        slot->flags &= ~HVF_SLOT_LOG;
        hv_vm_protect((hv_gpaddr_t)slot->start, (size_t)slot->size,
                      HV_MEMORY_READ | HV_MEMORY_WRITE);
    }
}
static void hvf_log_start(MemoryListener *listener,
                          MemoryRegionSection *section, int old, int new)
{
    hvf_set_dirty_tracking(section, 1);
}

static void hvf_log_stop(MemoryListener *listener,
                         MemoryRegionSection *section, int old, int new)
{
    hvf_set_dirty_tracking(section, 0);
}

static void hvf_log_sync(MemoryListener *listener,
                         MemoryRegionSection *section)
{
    /*
     * sync of dirty pages is handled elsewhere; just make sure we keep
     * tracking the region.
     */
    hvf_set_dirty_tracking(section, 1);
}

static void hvf_region_add(MemoryListener *listener,
                           MemoryRegionSection *section)
{
    hvf_set_phys_mem(section, true);
}

static void hvf_region_del(MemoryListener *listener,
                           MemoryRegionSection *section)
{
    hvf_set_phys_mem(section, false);
}

static MemoryListener hvf_memory_listener = {
    .region_add = hvf_region_add,
    .region_del = hvf_region_del,
    .log_start = hvf_log_start,
    .log_stop = hvf_log_stop,
    .log_sync = hvf_log_sync,
};
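/*
 * The listener is registered against address_space_memory in
 * hvf_accel_init(): whenever QEMU's flat view of guest memory changes,
 * region_add/region_del call back into hvf_set_phys_mem() so the
 * hv_vm_map() state tracks the current RAM layout, and the log_* hooks
 * toggle write protection for dirty-page tracking.
 */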
void hvf_reset_vcpu(CPUState *cpu) {

    /* TODO: this shouldn't be needed; there is already a call to
     * cpu_synchronize_all_post_reset in vl.c
     */
    wvmcs(cpu->hvf_fd, VMCS_ENTRY_CTLS, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_IA32_EFER, 0);
    macvm_set_cr0(cpu->hvf_fd, 0x60000010);

    wvmcs(cpu->hvf_fd, VMCS_CR4_MASK, CR4_VMXE_MASK);
    wvmcs(cpu->hvf_fd, VMCS_CR4_SHADOW, 0x0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CR4, CR4_VMXE_MASK);

    /* set VMCS guest state fields */
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CS_SELECTOR, 0xf000);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CS_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CS_ACCESS_RIGHTS, 0x9b);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CS_BASE, 0xffff0000);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_DS_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_DS_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_DS_ACCESS_RIGHTS, 0x93);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_DS_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_ES_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_ES_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_ES_ACCESS_RIGHTS, 0x93);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_ES_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_FS_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_FS_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_FS_ACCESS_RIGHTS, 0x93);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_FS_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_GS_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_GS_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_GS_ACCESS_RIGHTS, 0x93);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_GS_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_SS_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_SS_LIMIT, 0xffff);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_SS_ACCESS_RIGHTS, 0x93);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_SS_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_LDTR_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_LDTR_LIMIT, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_LDTR_ACCESS_RIGHTS, 0x10000);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_LDTR_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_TR_SELECTOR, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_TR_LIMIT, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_TR_ACCESS_RIGHTS, 0x83);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_TR_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_GDTR_LIMIT, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_GDTR_BASE, 0);

    wvmcs(cpu->hvf_fd, VMCS_GUEST_IDTR_LIMIT, 0);
    wvmcs(cpu->hvf_fd, VMCS_GUEST_IDTR_BASE, 0);

    /*wvmcs(cpu->hvf_fd, VMCS_GUEST_CR2, 0x0);*/
    wvmcs(cpu->hvf_fd, VMCS_GUEST_CR3, 0x0);

    wreg(cpu->hvf_fd, HV_X86_RIP, 0xfff0);
    wreg(cpu->hvf_fd, HV_X86_RDX, 0x623);
    wreg(cpu->hvf_fd, HV_X86_RFLAGS, 0x2);
    wreg(cpu->hvf_fd, HV_X86_RSP, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RAX, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RBX, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RCX, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RSI, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RDI, 0x0);
    wreg(cpu->hvf_fd, HV_X86_RBP, 0x0);

    for (int i = 0; i < 8; i++) {
        wreg(cpu->hvf_fd, HV_X86_R8 + i, 0x0);
    }

    hv_vcpu_invalidate_tlb(cpu->hvf_fd);
    hv_vcpu_flush(cpu->hvf_fd);
}
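/*
 * The values above match the architectural x86 reset state: CS base
 * 0xffff0000 with RIP 0xfff0 puts the first fetch at the reset vector
 * 0xfffffff0, CR0 0x60000010 is the reset value (CD, NW and ET set),
 * RDX 0x623 is the reset family/model signature, and RFLAGS has only the
 * always-set reserved bit 1.
 */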
void hvf_vcpu_destroy(CPUState *cpu)
{
    hv_return_t ret = hv_vcpu_destroy((hv_vcpuid_t)cpu->hvf_fd);
    assert_hvf_ok(ret);
}

static void dummy_signal(int sig)
{
}
int hvf_init_vcpu(CPUState *cpu)
{
    X86CPU *x86cpu = X86_CPU(cpu);
    CPUX86State *env = &x86cpu->env;
    int r;

    /* init cpu signals */
    sigset_t set;
    struct sigaction sigact;

    memset(&sigact, 0, sizeof(sigact));
    sigact.sa_handler = dummy_signal;
    sigaction(SIG_IPI, &sigact, NULL);

    pthread_sigmask(SIG_BLOCK, NULL, &set);
    sigdelset(&set, SIG_IPI);

    hvf_state->hvf_caps = g_new0(struct hvf_vcpu_caps, 1);
    env->hvf_emul = g_new0(HVFX86EmulatorState, 1);

    r = hv_vcpu_create((hv_vcpuid_t *)&cpu->hvf_fd, HV_VCPU_DEFAULT);
    assert_hvf_ok(r);

    if (hv_vmx_read_capability(HV_VMX_CAP_PINBASED,
        &hvf_state->hvf_caps->vmx_cap_pinbased)) {
        abort();
    }
    if (hv_vmx_read_capability(HV_VMX_CAP_PROCBASED,
        &hvf_state->hvf_caps->vmx_cap_procbased)) {
        abort();
    }
    if (hv_vmx_read_capability(HV_VMX_CAP_PROCBASED2,
        &hvf_state->hvf_caps->vmx_cap_procbased2)) {
        abort();
    }
    if (hv_vmx_read_capability(HV_VMX_CAP_ENTRY,
        &hvf_state->hvf_caps->vmx_cap_entry)) {
        abort();
    }

    /* set VMCS control fields */
    wvmcs(cpu->hvf_fd, VMCS_PIN_BASED_CTLS,
          cap2ctrl(hvf_state->hvf_caps->vmx_cap_pinbased,
                   VMCS_PIN_BASED_CTLS_EXTINT |
                   VMCS_PIN_BASED_CTLS_NMI |
                   VMCS_PIN_BASED_CTLS_VNMI));
    wvmcs(cpu->hvf_fd, VMCS_PRI_PROC_BASED_CTLS,
          cap2ctrl(hvf_state->hvf_caps->vmx_cap_procbased,
                   VMCS_PRI_PROC_BASED_CTLS_HLT |
                   VMCS_PRI_PROC_BASED_CTLS_MWAIT |
                   VMCS_PRI_PROC_BASED_CTLS_TSC_OFFSET |
                   VMCS_PRI_PROC_BASED_CTLS_TPR_SHADOW) |
          VMCS_PRI_PROC_BASED_CTLS_SEC_CONTROL);
    wvmcs(cpu->hvf_fd, VMCS_SEC_PROC_BASED_CTLS,
          cap2ctrl(hvf_state->hvf_caps->vmx_cap_procbased2,
                   VMCS_PRI_PROC_BASED2_CTLS_APIC_ACCESSES));

    wvmcs(cpu->hvf_fd, VMCS_ENTRY_CTLS,
          cap2ctrl(hvf_state->hvf_caps->vmx_cap_entry, 0));
    wvmcs(cpu->hvf_fd, VMCS_EXCEPTION_BITMAP, 0); /* Double fault */

    wvmcs(cpu->hvf_fd, VMCS_TPR_THRESHOLD, 0);

    x86cpu = X86_CPU(cpu);
    x86cpu->env.kvm_xsave_buf = qemu_memalign(4096, 4096);

    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_STAR, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_LSTAR, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_CSTAR, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_FMASK, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_FSBASE, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_GSBASE, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_KERNELGSBASE, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_TSC_AUX, 1);
    /*hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_IA32_TSC, 1);*/
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_IA32_SYSENTER_CS, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_IA32_SYSENTER_EIP, 1);
    hv_vcpu_enable_native_msr(cpu->hvf_fd, MSR_IA32_SYSENTER_ESP, 1);

    return 0;
}
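/*
 * cap2ctrl() folds the requested control bits into the allowed-0/allowed-1
 * settings reported by hv_vmx_read_capability(), so only features the host
 * VMX implementation supports end up in the VMCS controls.  The
 * hv_vcpu_enable_native_msr() calls let the guest access the listed
 * syscall/sysenter MSRs directly instead of trapping out to QEMU.
 */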
void hvf_disable(int shouldDisable)
{
    hvf_disabled = shouldDisable;
}
static void hvf_store_events(CPUState *cpu, uint32_t ins_len, uint64_t idtvec_info)
{
    X86CPU *x86_cpu = X86_CPU(cpu);
    CPUX86State *env = &x86_cpu->env;

    env->exception_injected = -1;
    env->interrupt_injected = -1;
    env->nmi_injected = false;
    if (idtvec_info & VMCS_IDT_VEC_VALID) {
        switch (idtvec_info & VMCS_IDT_VEC_TYPE) {
        case VMCS_IDT_VEC_HWINTR:
        case VMCS_IDT_VEC_SWINTR:
            env->interrupt_injected = idtvec_info & VMCS_IDT_VEC_VECNUM;
            break;
        case VMCS_IDT_VEC_NMI:
            env->nmi_injected = true;
            break;
        case VMCS_IDT_VEC_HWEXCEPTION:
        case VMCS_IDT_VEC_SWEXCEPTION:
            env->exception_injected = idtvec_info & VMCS_IDT_VEC_VECNUM;
            break;
        case VMCS_IDT_VEC_PRIV_SWEXCEPTION:
        default:
            abort();
        }
        if ((idtvec_info & VMCS_IDT_VEC_TYPE) == VMCS_IDT_VEC_SWEXCEPTION ||
            (idtvec_info & VMCS_IDT_VEC_TYPE) == VMCS_IDT_VEC_SWINTR) {
            env->ins_len = ins_len;
        }
        if (idtvec_info & VMCS_INTR_DEL_ERRCODE) {
            env->has_error_code = true;
            env->error_code = rvmcs(cpu->hvf_fd, VMCS_IDT_VECTORING_ERROR);
        }
    }
    if ((rvmcs(cpu->hvf_fd, VMCS_GUEST_INTERRUPTIBILITY) &
        VMCS_INTERRUPTIBILITY_NMI_BLOCKING)) {
        env->hflags2 |= HF2_NMI_MASK;
    } else {
        env->hflags2 &= ~HF2_NMI_MASK;
    }
    if (rvmcs(cpu->hvf_fd, VMCS_GUEST_INTERRUPTIBILITY) &
        (VMCS_INTERRUPTIBILITY_STI_BLOCKING |
         VMCS_INTERRUPTIBILITY_MOVSS_BLOCKING)) {
        env->hflags |= HF_INHIBIT_IRQ_MASK;
    } else {
        env->hflags &= ~HF_INHIBIT_IRQ_MASK;
    }
}
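/*
 * hvf_store_events() runs after every VM exit: if the exit interrupted the
 * delivery of an event (VMCS_IDT_VECTORING_INFO valid), the pending
 * interrupt/NMI/exception and any error code are saved into CPUX86State so
 * they can be re-injected on the next entry, and the guest's NMI/STI/MOV-SS
 * interruptibility state is mirrored into hflags/hflags2.
 */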
int hvf_vcpu_exec(CPUState *cpu)
{
    X86CPU *x86_cpu = X86_CPU(cpu);
    CPUX86State *env = &x86_cpu->env;
    int ret = 0;
    uint64_t rip = 0;

    if (hvf_process_events(cpu)) {
        return EXCP_HLT;
    }

    do {
        if (cpu->vcpu_dirty) {
            hvf_put_registers(cpu);
            cpu->vcpu_dirty = false;
        }

        if (hvf_inject_interrupts(cpu)) {
            return EXCP_INTERRUPT;
        }

        qemu_mutex_unlock_iothread();
        if (!cpu_is_bsp(X86_CPU(cpu)) && cpu->halted) {
            qemu_mutex_lock_iothread();
            return EXCP_HLT;
        }

        hv_return_t r = hv_vcpu_run(cpu->hvf_fd);
        assert_hvf_ok(r);

        /* handle VMEXIT */
        uint64_t exit_reason = rvmcs(cpu->hvf_fd, VMCS_EXIT_REASON);
        uint64_t exit_qual = rvmcs(cpu->hvf_fd, VMCS_EXIT_QUALIFICATION);
        uint32_t ins_len = (uint32_t)rvmcs(cpu->hvf_fd,
                                           VMCS_EXIT_INSTRUCTION_LENGTH);

        uint64_t idtvec_info = rvmcs(cpu->hvf_fd, VMCS_IDT_VECTORING_INFO);

        hvf_store_events(cpu, ins_len, idtvec_info);
        rip = rreg(cpu->hvf_fd, HV_X86_RIP);
        RFLAGS(env) = rreg(cpu->hvf_fd, HV_X86_RFLAGS);
        env->eflags = RFLAGS(env);

        qemu_mutex_lock_iothread();

        update_apic_tpr(cpu);

        switch (exit_reason) {
        case EXIT_REASON_HLT: {
            macvm_set_rip(cpu, rip + ins_len);
            if (!((cpu->interrupt_request & CPU_INTERRUPT_HARD) &&
                (EFLAGS(env) & IF_MASK))
                && !(cpu->interrupt_request & CPU_INTERRUPT_NMI) &&
                !(idtvec_info & VMCS_IDT_VEC_VALID)) {
                cpu->halted = 1;
                ret = EXCP_HLT;
            }
            ret = EXCP_INTERRUPT;
            break;
        }
        case EXIT_REASON_MWAIT: {
            ret = EXCP_INTERRUPT;
            break;
        }
        /* Need to check if MMIO or unmmaped fault */
        case EXIT_REASON_EPT_FAULT:
        {
            hvf_slot *slot;
            uint64_t gpa = rvmcs(cpu->hvf_fd, VMCS_GUEST_PHYSICAL_ADDRESS);

            if (((idtvec_info & VMCS_IDT_VEC_VALID) == 0) &&
                ((exit_qual & EXIT_QUAL_NMIUDTI) != 0)) {
                vmx_set_nmi_blocking(cpu);
            }

            slot = hvf_find_overlap_slot(gpa, gpa);
            /* mmio */
            if (ept_emulation_fault(slot, gpa, exit_qual)) {
                struct x86_decode decode;

                env->hvf_emul->fetch_rip = rip;

                decode_instruction(env, &decode);
                exec_instruction(env, &decode);
            }
            break;
        }
        case EXIT_REASON_INOUT:
        {
            uint32_t in = (exit_qual & 8) != 0;
            uint32_t size = (exit_qual & 7) + 1;
            uint32_t string = (exit_qual & 16) != 0;
            uint32_t port = exit_qual >> 16;
            /*uint32_t rep = (exit_qual & 0x20) != 0;*/

            if (!string && in) {
                uint64_t val = 0;
                hvf_handle_io(env, port, &val, 0, size, 1);
                if (size == 1) {
                    AL(env) = val;
                } else if (size == 2) {
                    AX(env) = val;
                } else if (size == 4) {
                    RAX(env) = (uint32_t)val;
                } else {
                    RAX(env) = (uint64_t)val;
                }
                RIP(env) += ins_len;
                break;
            } else if (!string && !in) {
                RAX(env) = rreg(cpu->hvf_fd, HV_X86_RAX);
                hvf_handle_io(env, port, &RAX(env), 1, size, 1);
                macvm_set_rip(cpu, rip + ins_len);
                break;
            }
            /* string I/O: fall back to the instruction emulator */
            struct x86_decode decode;

            env->hvf_emul->fetch_rip = rip;

            decode_instruction(env, &decode);
            assert(ins_len == decode.len);
            exec_instruction(env, &decode);

            break;
        }
        case EXIT_REASON_CPUID: {
            uint32_t rax = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RAX);
            uint32_t rbx = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RBX);
            uint32_t rcx = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RCX);
            uint32_t rdx = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RDX);

            cpu_x86_cpuid(env, rax, rcx, &rax, &rbx, &rcx, &rdx);

            wreg(cpu->hvf_fd, HV_X86_RAX, rax);
            wreg(cpu->hvf_fd, HV_X86_RBX, rbx);
            wreg(cpu->hvf_fd, HV_X86_RCX, rcx);
            wreg(cpu->hvf_fd, HV_X86_RDX, rdx);

            macvm_set_rip(cpu, rip + ins_len);
            break;
        }
        case EXIT_REASON_XSETBV: {
            X86CPU *x86_cpu = X86_CPU(cpu);
            CPUX86State *env = &x86_cpu->env;
            uint32_t eax = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RAX);
            uint32_t ecx = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RCX);
            uint32_t edx = (uint32_t)rreg(cpu->hvf_fd, HV_X86_RDX);

            if (ecx) {
                macvm_set_rip(cpu, rip + ins_len);
                break;
            }
            env->xcr0 = ((uint64_t)edx << 32) | eax;
            wreg(cpu->hvf_fd, HV_X86_XCR0, env->xcr0 | 1);
            macvm_set_rip(cpu, rip + ins_len);
            break;
        }
        case EXIT_REASON_INTR_WINDOW:
            vmx_clear_int_window_exiting(cpu);
            ret = EXCP_INTERRUPT;
            break;
        case EXIT_REASON_NMI_WINDOW:
            vmx_clear_nmi_window_exiting(cpu);
            ret = EXCP_INTERRUPT;
            break;
        case EXIT_REASON_EXT_INTR:
            /* force exit and allow io handling */
            ret = EXCP_INTERRUPT;
            break;
        case EXIT_REASON_RDMSR:
        case EXIT_REASON_WRMSR:
        {
            if (exit_reason == EXIT_REASON_RDMSR) {
                simulate_rdmsr(cpu);
            } else {
                simulate_wrmsr(cpu);
            }
            RIP(env) += rvmcs(cpu->hvf_fd, VMCS_EXIT_INSTRUCTION_LENGTH);
            break;
        }
        case EXIT_REASON_CR_ACCESS: {
            int cr;
            int reg;

            cr = exit_qual & 15;
            reg = (exit_qual >> 8) & 15;

            switch (cr) {
            case 0x0: {
                macvm_set_cr0(cpu->hvf_fd, RRX(env, reg));
                break;
            }
            case 4: {
                macvm_set_cr4(cpu->hvf_fd, RRX(env, reg));
                break;
            }
            case 8: {
                X86CPU *x86_cpu = X86_CPU(cpu);
                if (exit_qual & 0x10) {
                    RRX(env, reg) = cpu_get_apic_tpr(x86_cpu->apic_state);
                } else {
                    int tpr = RRX(env, reg);
                    cpu_set_apic_tpr(x86_cpu->apic_state, tpr);
                    ret = EXCP_INTERRUPT;
                }
                break;
            }
            default:
                error_report("Unrecognized CR %d", cr);
                abort();
            }
            RIP(env) += ins_len;
            break;
        }
        case EXIT_REASON_APIC_ACCESS: { /* TODO */
            struct x86_decode decode;

            env->hvf_emul->fetch_rip = rip;

            decode_instruction(env, &decode);
            exec_instruction(env, &decode);
            break;
        }
        case EXIT_REASON_TPR: {
            ret = 1;
            break;
        }
        case EXIT_REASON_TASK_SWITCH: {
            uint64_t vinfo = rvmcs(cpu->hvf_fd, VMCS_IDT_VECTORING_INFO);
            x68_segment_selector sel = {.sel = exit_qual & 0xffff};
            vmx_handle_task_switch(cpu, sel, (exit_qual >> 30) & 0x3,
                                   vinfo & VMCS_INTR_VALID,
                                   vinfo & VECTORING_INFO_VECTOR_MASK,
                                   vinfo & VMCS_INTR_T_MASK);
            break;
        }
        case EXIT_REASON_TRIPLE_FAULT: {
            qemu_system_reset_request(SHUTDOWN_CAUSE_GUEST_RESET);
            ret = EXCP_INTERRUPT;
            break;
        }
        case EXIT_REASON_RDPMC:
            wreg(cpu->hvf_fd, HV_X86_RAX, 0);
            wreg(cpu->hvf_fd, HV_X86_RDX, 0);
            macvm_set_rip(cpu, rip + ins_len);
            break;
        case VMX_REASON_VMCALL:
            env->exception_injected = EXCP0D_GPF;
            env->has_error_code = true;
            break;
        default:
            error_report("%llx: unhandled exit %llx", rip, exit_reason);
        }
    } while (ret == 0);

    return ret;
}
static bool hvf_allowed;
static int hvf_accel_init(MachineState *ms)
{
    int x;
    hv_return_t ret;
    HVFState *s;

    ret = hv_vm_create(HV_VM_DEFAULT);
    assert_hvf_ok(ret);

    s = g_new0(HVFState, 1);

    s->num_slots = 32;
    for (x = 0; x < s->num_slots; ++x) {
        s->slots[x].size = 0;
        s->slots[x].slot_id = x;
    }

    hvf_state = s;
    cpu_interrupt_handler = hvf_handle_interrupt;
    memory_listener_register(&hvf_memory_listener, &address_space_memory);
    return 0;
}
static void hvf_accel_class_init(ObjectClass *oc, void *data)
{
    AccelClass *ac = ACCEL_CLASS(oc);
    ac->init_machine = hvf_accel_init;
    ac->allowed = &hvf_allowed;
}
static const TypeInfo hvf_accel_type = {
    .name = TYPE_HVF_ACCEL,
    .parent = TYPE_ACCEL,
    .class_init = hvf_accel_class_init,
};

static void hvf_type_init(void)
{
    type_register_static(&hvf_accel_type);
}

type_init(hvf_type_init);