VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR0/HMVMXR0.cpp@ 76477

Last change on this file since 76477 was 76477, checked in by vboxsync, 6 years ago

VMM/HM: Cleanup.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 578.1 KB
Line 
1/* $Id: HMVMXR0.cpp 76477 2018-12-25 08:01:34Z vboxsync $ */
2/** @file
3 * HM VMX (Intel VT-x) - Host Context Ring-0.
4 */
5
6/*
7 * Copyright (C) 2012-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_HM
23#define VMCPU_INCL_CPUM_GST_CTX
24#include <iprt/x86.h>
25#include <iprt/asm-amd64-x86.h>
26#include <iprt/thread.h>
27
28#include <VBox/vmm/pdmapi.h>
29#include <VBox/vmm/dbgf.h>
30#include <VBox/vmm/iem.h>
31#include <VBox/vmm/iom.h>
32#include <VBox/vmm/selm.h>
33#include <VBox/vmm/tm.h>
34#include <VBox/vmm/em.h>
35#include <VBox/vmm/gim.h>
36#include <VBox/vmm/apic.h>
37#ifdef VBOX_WITH_REM
38# include <VBox/vmm/rem.h>
39#endif
40#include "HMInternal.h"
41#include <VBox/vmm/vm.h>
42#include <VBox/vmm/hmvmxinline.h>
43#include "HMVMXR0.h"
44#include "dtrace/VBoxVMM.h"
45
46#ifdef DEBUG_ramshankar
47# define HMVMX_ALWAYS_SAVE_GUEST_RFLAGS
48# define HMVMX_ALWAYS_SAVE_FULL_GUEST_STATE
49# define HMVMX_ALWAYS_SYNC_FULL_GUEST_STATE
50# define HMVMX_ALWAYS_CHECK_GUEST_STATE
51# define HMVMX_ALWAYS_TRAP_ALL_XCPTS
52# define HMVMX_ALWAYS_TRAP_PF
53# define HMVMX_ALWAYS_FLUSH_TLB
54# define HMVMX_ALWAYS_SWAP_EFER
55#endif
56
57
58/*********************************************************************************************************************************
59* Defined Constants And Macros *
60*********************************************************************************************************************************/
61/** Use the function table. */
62#define HMVMX_USE_FUNCTION_TABLE
63
64/** Determine which tagged-TLB flush handler to use. */
65#define HMVMX_FLUSH_TAGGED_TLB_EPT_VPID 0
66#define HMVMX_FLUSH_TAGGED_TLB_EPT 1
67#define HMVMX_FLUSH_TAGGED_TLB_VPID 2
68#define HMVMX_FLUSH_TAGGED_TLB_NONE 3
69
70/** @name HMVMX_READ_XXX
71 * Flags to skip redundant reads of some common VMCS fields that are not part of
72 * the guest-CPU or VCPU state but are needed while handling VM-exits.
73 */
74#define HMVMX_READ_IDT_VECTORING_INFO RT_BIT_32(0)
75#define HMVMX_READ_IDT_VECTORING_ERROR_CODE RT_BIT_32(1)
76#define HMVMX_READ_EXIT_QUALIFICATION RT_BIT_32(2)
77#define HMVMX_READ_EXIT_INSTR_LEN RT_BIT_32(3)
78#define HMVMX_READ_EXIT_INTERRUPTION_INFO RT_BIT_32(4)
79#define HMVMX_READ_EXIT_INTERRUPTION_ERROR_CODE RT_BIT_32(5)
80#define HMVMX_READ_EXIT_INSTR_INFO RT_BIT_32(6)
81#define HMVMX_READ_GUEST_LINEAR_ADDR RT_BIT_32(7)
82/** @} */
83
84/**
85 * States of the VMCS.
86 *
87 * This does not reflect all possible VMCS states but currently only those
88 * needed for maintaining the VMCS consistently even when thread-context hooks
89 * are used. Maybe later this can be extended (i.e. Nested Virtualization).
90 */
91#define HMVMX_VMCS_STATE_CLEAR RT_BIT(0)
92#define HMVMX_VMCS_STATE_ACTIVE RT_BIT(1)
93#define HMVMX_VMCS_STATE_LAUNCHED RT_BIT(2)
94
95/**
96 * Subset of the guest-CPU state that is kept by VMX R0 code while executing the
97 * guest using hardware-assisted VMX.
98 *
99 * This excludes state like GPRs (other than RSP) which are always are
100 * swapped and restored across the world-switch and also registers like EFER,
101 * MSR which cannot be modified by the guest without causing a VM-exit.
102 */
103#define HMVMX_CPUMCTX_EXTRN_ALL ( CPUMCTX_EXTRN_RIP \
104 | CPUMCTX_EXTRN_RFLAGS \
105 | CPUMCTX_EXTRN_RSP \
106 | CPUMCTX_EXTRN_SREG_MASK \
107 | CPUMCTX_EXTRN_TABLE_MASK \
108 | CPUMCTX_EXTRN_KERNEL_GS_BASE \
109 | CPUMCTX_EXTRN_SYSCALL_MSRS \
110 | CPUMCTX_EXTRN_SYSENTER_MSRS \
111 | CPUMCTX_EXTRN_TSC_AUX \
112 | CPUMCTX_EXTRN_OTHER_MSRS \
113 | CPUMCTX_EXTRN_CR0 \
114 | CPUMCTX_EXTRN_CR3 \
115 | CPUMCTX_EXTRN_CR4 \
116 | CPUMCTX_EXTRN_DR7 \
117 | CPUMCTX_EXTRN_HM_VMX_MASK)
118
119/**
120 * Exception bitmap mask for real-mode guests (real-on-v86).
121 *
122 * We need to intercept all exceptions manually except:
123 * - \#AC and \#DB are always intercepted to prevent the CPU from deadlocking
124 * due to bugs in Intel CPUs.
125 * - \#PF need not be intercepted even in real-mode if we have Nested Paging
126 * support.
127 */
128#define HMVMX_REAL_MODE_XCPT_MASK ( RT_BIT(X86_XCPT_DE) /* always: | RT_BIT(X86_XCPT_DB) */ | RT_BIT(X86_XCPT_NMI) \
129 | RT_BIT(X86_XCPT_BP) | RT_BIT(X86_XCPT_OF) | RT_BIT(X86_XCPT_BR) \
130 | RT_BIT(X86_XCPT_UD) | RT_BIT(X86_XCPT_NM) | RT_BIT(X86_XCPT_DF) \
131 | RT_BIT(X86_XCPT_CO_SEG_OVERRUN) | RT_BIT(X86_XCPT_TS) | RT_BIT(X86_XCPT_NP) \
132 | RT_BIT(X86_XCPT_SS) | RT_BIT(X86_XCPT_GP) /* RT_BIT(X86_XCPT_PF) */ \
133 | RT_BIT(X86_XCPT_MF) /* always: | RT_BIT(X86_XCPT_AC) */ | RT_BIT(X86_XCPT_MC) \
134 | RT_BIT(X86_XCPT_XF))
135
136/** Maximum VM-instruction error number. */
137#define HMVMX_INSTR_ERROR_MAX 28
138
139/** Profiling macro. */
140#ifdef HM_PROFILE_EXIT_DISPATCH
141# define HMVMX_START_EXIT_DISPATCH_PROF() STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatExitDispatch, ed)
142# define HMVMX_STOP_EXIT_DISPATCH_PROF() STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitDispatch, ed)
143#else
144# define HMVMX_START_EXIT_DISPATCH_PROF() do { } while (0)
145# define HMVMX_STOP_EXIT_DISPATCH_PROF() do { } while (0)
146#endif
147
148/** Assert that preemption is disabled or covered by thread-context hooks. */
149#define HMVMX_ASSERT_PREEMPT_SAFE(a_pVCpu) Assert( VMMR0ThreadCtxHookIsEnabled((a_pVCpu)) \
150 || !RTThreadPreemptIsEnabled(NIL_RTTHREAD))
151
152/** Assert that we haven't migrated CPUs when thread-context hooks are not
153 * used. */
154#define HMVMX_ASSERT_CPU_SAFE(a_pVCpu) AssertMsg( VMMR0ThreadCtxHookIsEnabled((a_pVCpu)) \
155 || (a_pVCpu)->hm.s.idEnteredCpu == RTMpCpuId(), \
156 ("Illegal migration! Entered on CPU %u Current %u\n", \
157 (a_pVCpu)->hm.s.idEnteredCpu, RTMpCpuId()))
158
159/** Asserts that the given CPUMCTX_EXTRN_XXX bits are present in the guest-CPU
160 * context. */
161#define HMVMX_CPUMCTX_ASSERT(a_pVCpu, a_fExtrnMbz) AssertMsg(!((a_pVCpu)->cpum.GstCtx.fExtrn & (a_fExtrnMbz)), \
162 ("fExtrn=%#RX64 fExtrnMbz=%#RX64\n", \
163 (a_pVCpu)->cpum.GstCtx.fExtrn, (a_fExtrnMbz)))
164
165/** Macro for importing guest state from the VMCS back into CPUMCTX (intended to be
166 * used only from VM-exit handlers). */
167#define HMVMX_CPUMCTX_IMPORT_STATE(a_pVCpu, a_fWhat) (hmR0VmxImportGuestState((a_pVCpu), (a_fWhat)))
168
169/** Helper macro for VM-exit handlers called unexpectedly. */
170#define HMVMX_UNEXPECTED_EXIT_RET(a_pVCpu, a_pVmxTransient) \
171 do { \
172 (a_pVCpu)->hm.s.u32HMError = (a_pVmxTransient)->uExitReason; \
173 return VERR_VMX_UNEXPECTED_EXIT; \
174 } while (0)
175
176/** Macro for importing segment registers to the VMCS from the guest-CPU context. */
177#ifdef VMX_USE_CACHED_VMCS_ACCESSES
178# define HMVMX_IMPORT_SREG(Sel, a_pCtxSelReg) \
179 hmR0VmxImportGuestSegmentReg(pVCpu, VMX_VMCS16_GUEST_##Sel##_SEL, VMX_VMCS32_GUEST_##Sel##_LIMIT, \
180 VMX_VMCS_GUEST_##Sel##_BASE_CACHE_IDX, VMX_VMCS32_GUEST_##Sel##_ACCESS_RIGHTS, (a_pCtxSelReg))
181#else
182# define HMVMX_IMPORT_SREG(Sel, a_pCtxSelReg) \
183 hmR0VmxImportGuestSegmentReg(pVCpu, VMX_VMCS16_GUEST_##Sel##_SEL, VMX_VMCS32_GUEST_##Sel##_LIMIT, \
184 VMX_VMCS_GUEST_##Sel##_BASE, VMX_VMCS32_GUEST_##Sel##_ACCESS_RIGHTS, (a_pCtxSelReg))
185#endif
186
187/** Macro for exporting segment registers to the VMCS from the guest-CPU context. */
188#define HMVMX_EXPORT_SREG(Sel, a_pCtxSelReg) \
189 hmR0VmxExportGuestSegmentReg(pVCpu, VMX_VMCS16_GUEST_##Sel##_SEL, VMX_VMCS32_GUEST_##Sel##_LIMIT, \
190 VMX_VMCS_GUEST_##Sel##_BASE, VMX_VMCS32_GUEST_##Sel##_ACCESS_RIGHTS, (a_pCtxSelReg))
191
192#ifdef VBOX_WITH_NESTED_HWVIRT_VMX
193/** Macro that does the necessary privilege checks and intercepted VM-exits for
194 * guests that attempted to execute a VMX instruction. */
195# define HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(a_pVCpu, a_uExitReason) \
196 do \
197 { \
198 VBOXSTRICTRC rcStrictTmp = hmR0VmxCheckExitDueToVmxInstr((a_pVCpu), (a_uExitReason)); \
199 if (rcStrictTmp == VINF_SUCCESS) \
200 { /* likely */ } \
201 else if (rcStrictTmp == VINF_HM_PENDING_XCPT) \
202 { \
203 Assert((a_pVCpu)->hm.s.Event.fPending); \
204 Log4Func(("Privilege checks failed -> %#x\n", VMX_ENTRY_INT_INFO_VECTOR((a_pVCpu)->hm.s.Event.u64IntInfo))); \
205 return VINF_SUCCESS; \
206 } \
207 else \
208 { \
209 int rcTmp = VBOXSTRICTRC_VAL(rcStrictTmp); \
210 AssertMsgFailedReturn(("Unexpected failure. rc=%Rrc", rcTmp), rcTmp); \
211 } \
212 } while (0)
213
214/** Macro that decodes a memory operand for an instruction VM-exit. */
215# define HMVMX_DECODE_MEM_OPERAND(a_pVCpu, a_uExitInstrInfo, a_uExitQual, a_enmMemAccess, a_pGCPtrEffAddr) \
216 do \
217 { \
218 VBOXSTRICTRC rcStrictTmp = hmR0VmxDecodeMemOperand((a_pVCpu), (a_uExitInstrInfo), (a_uExitQual), (a_enmMemAccess), \
219 (a_pGCPtrEffAddr)); \
220 if (rcStrictTmp == VINF_SUCCESS) \
221 { /* likely */ } \
222 else if (rcStrictTmp == VINF_HM_PENDING_XCPT) \
223 { \
224 uint8_t const uXcptTmp = VMX_ENTRY_INT_INFO_VECTOR((a_pVCpu)->hm.s.Event.u64IntInfo); \
225 Log4Func(("Memory operand decoding failed, raising xcpt %#x\n", uXcptTmp)); \
226 NOREF(uXcptTmp); \
227 return VINF_SUCCESS; \
228 } \
229 else \
230 { \
231 Log4Func(("hmR0VmxCheckExitDueToVmxInstr failed. rc=%Rrc\n", VBOXSTRICTRC_VAL(rcStrictTmp))); \
232 return rcStrictTmp; \
233 } \
234 } while (0)
235
236#endif /* VBOX_WITH_NESTED_HWVIRT_VMX */
237
238
239/*********************************************************************************************************************************
240* Structures and Typedefs *
241*********************************************************************************************************************************/
242/**
243 * VMX transient state.
244 *
245 * A state structure for holding miscellaneous information across
246 * VMX non-root operation and restored after the transition.
247 */
248typedef struct VMXTRANSIENT
249{
250 /** The host's rflags/eflags. */
251 RTCCUINTREG fEFlags;
252#if HC_ARCH_BITS == 32
253 uint32_t u32Alignment0;
254#endif
255 /** The guest's TPR value used for TPR shadowing. */
256 uint8_t u8GuestTpr;
257 /** Alignment. */
258 uint8_t abAlignment0[7];
259
260 /** The basic VM-exit reason. */
261 uint16_t uExitReason;
262 /** Alignment. */
263 uint16_t u16Alignment0;
264 /** The VM-exit interruption error code. */
265 uint32_t uExitIntErrorCode;
266 /** The VM-exit exit code qualification. */
267 uint64_t uExitQual;
268 /** The Guest-linear address. */
269 uint64_t uGuestLinearAddr;
270
271 /** The VM-exit interruption-information field. */
272 uint32_t uExitIntInfo;
273 /** The VM-exit instruction-length field. */
274 uint32_t cbInstr;
275 /** The VM-exit instruction-information field. */
276 VMXEXITINSTRINFO ExitInstrInfo;
277 /** Whether the VM-entry failed or not. */
278 bool fVMEntryFailed;
279 /** Alignment. */
280 uint8_t abAlignment1[3];
281
282 /** The VM-entry interruption-information field. */
283 uint32_t uEntryIntInfo;
284 /** The VM-entry exception error code field. */
285 uint32_t uEntryXcptErrorCode;
286 /** The VM-entry instruction length field. */
287 uint32_t cbEntryInstr;
288
289 /** IDT-vectoring information field. */
290 uint32_t uIdtVectoringInfo;
291 /** IDT-vectoring error code. */
292 uint32_t uIdtVectoringErrorCode;
293
294 /** Mask of currently read VMCS fields; HMVMX_READ_XXX. */
295 uint32_t fVmcsFieldsRead;
296
297 /** Whether the guest debug state was active at the time of VM-exit. */
298 bool fWasGuestDebugStateActive;
299 /** Whether the hyper debug state was active at the time of VM-exit. */
300 bool fWasHyperDebugStateActive;
301 /** Whether TSC-offsetting should be setup before VM-entry. */
302 bool fUpdateTscOffsettingAndPreemptTimer;
303 /** Whether the VM-exit was caused by a page-fault during delivery of a
304 * contributory exception or a page-fault. */
305 bool fVectoringDoublePF;
306 /** Whether the VM-exit was caused by a page-fault during delivery of an
307 * external interrupt or NMI. */
308 bool fVectoringPF;
309} VMXTRANSIENT;
310AssertCompileMemberAlignment(VMXTRANSIENT, uExitReason, sizeof(uint64_t));
311AssertCompileMemberAlignment(VMXTRANSIENT, uExitIntInfo, sizeof(uint64_t));
312AssertCompileMemberAlignment(VMXTRANSIENT, uEntryIntInfo, sizeof(uint64_t));
313AssertCompileMemberAlignment(VMXTRANSIENT, fWasGuestDebugStateActive, sizeof(uint64_t));
314AssertCompileMemberSize(VMXTRANSIENT, ExitInstrInfo, sizeof(uint32_t));
315/** Pointer to VMX transient state. */
316typedef VMXTRANSIENT *PVMXTRANSIENT;
317
318/**
319 * Memory operand read or write access.
320 */
321typedef enum VMXMEMACCESS
322{
323 VMXMEMACCESS_READ = 0,
324 VMXMEMACCESS_WRITE = 1
325} VMXMEMACCESS;
326
327/**
328 * VMX VM-exit handler.
329 *
330 * @returns Strict VBox status code (i.e. informational status codes too).
331 * @param pVCpu The cross context virtual CPU structure.
332 * @param pVmxTransient Pointer to the VMX-transient structure.
333 */
334#ifndef HMVMX_USE_FUNCTION_TABLE
335typedef VBOXSTRICTRC FNVMXEXITHANDLER(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
336#else
337typedef DECLCALLBACK(VBOXSTRICTRC) FNVMXEXITHANDLER(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
338/** Pointer to VM-exit handler. */
339typedef FNVMXEXITHANDLER *PFNVMXEXITHANDLER;
340#endif
341
342/**
343 * VMX VM-exit handler, non-strict status code.
344 *
345 * This is generally the same as FNVMXEXITHANDLER, the NSRC bit is just FYI.
346 *
347 * @returns VBox status code, no informational status code returned.
348 * @param pVCpu The cross context virtual CPU structure.
349 * @param pVmxTransient Pointer to the VMX-transient structure.
350 *
351 * @remarks This is not used on anything returning VERR_EM_INTERPRETER as the
352 * use of that status code will be replaced with VINF_EM_SOMETHING
353 * later when switching over to IEM.
354 */
355#ifndef HMVMX_USE_FUNCTION_TABLE
356typedef int FNVMXEXITHANDLERNSRC(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
357#else
358typedef FNVMXEXITHANDLER FNVMXEXITHANDLERNSRC;
359#endif
360
361
362/*********************************************************************************************************************************
363* Internal Functions *
364*********************************************************************************************************************************/
365static void hmR0VmxFlushEpt(PVMCPU pVCpu, VMXTLBFLUSHEPT enmTlbFlush);
366static void hmR0VmxFlushVpid(PVMCPU pVCpu, VMXTLBFLUSHVPID enmTlbFlush, RTGCPTR GCPtr);
367static void hmR0VmxClearIntNmiWindowsVmcs(PVMCPU pVCpu);
368static int hmR0VmxImportGuestState(PVMCPU pVCpu, uint64_t fWhat);
369static VBOXSTRICTRC hmR0VmxInjectEventVmcs(PVMCPU pVCpu, uint64_t u64IntInfo, uint32_t cbInstr, uint32_t u32ErrCode,
370 RTGCUINTREG GCPtrFaultAddress, bool fStepping, uint32_t *pfIntrState);
371#if HC_ARCH_BITS == 32
372static int hmR0VmxInitVmcsReadCache(PVMCPU pVCpu);
373#endif
374#ifndef HMVMX_USE_FUNCTION_TABLE
375DECLINLINE(VBOXSTRICTRC) hmR0VmxHandleExit(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, uint32_t rcReason);
376# define HMVMX_EXIT_DECL DECLINLINE(VBOXSTRICTRC)
377# define HMVMX_EXIT_NSRC_DECL DECLINLINE(int)
378#else
379# define HMVMX_EXIT_DECL static DECLCALLBACK(VBOXSTRICTRC)
380# define HMVMX_EXIT_NSRC_DECL HMVMX_EXIT_DECL
381#endif
382
383/** @name VM-exit handlers.
384 * @{
385 */
386static FNVMXEXITHANDLER hmR0VmxExitXcptOrNmi;
387static FNVMXEXITHANDLER hmR0VmxExitExtInt;
388static FNVMXEXITHANDLER hmR0VmxExitTripleFault;
389static FNVMXEXITHANDLERNSRC hmR0VmxExitInitSignal;
390static FNVMXEXITHANDLERNSRC hmR0VmxExitSipi;
391static FNVMXEXITHANDLERNSRC hmR0VmxExitIoSmi;
392static FNVMXEXITHANDLERNSRC hmR0VmxExitSmi;
393static FNVMXEXITHANDLERNSRC hmR0VmxExitIntWindow;
394static FNVMXEXITHANDLERNSRC hmR0VmxExitNmiWindow;
395static FNVMXEXITHANDLER hmR0VmxExitTaskSwitch;
396static FNVMXEXITHANDLER hmR0VmxExitCpuid;
397static FNVMXEXITHANDLER hmR0VmxExitGetsec;
398static FNVMXEXITHANDLER hmR0VmxExitHlt;
399static FNVMXEXITHANDLERNSRC hmR0VmxExitInvd;
400static FNVMXEXITHANDLER hmR0VmxExitInvlpg;
401static FNVMXEXITHANDLER hmR0VmxExitRdpmc;
402static FNVMXEXITHANDLER hmR0VmxExitVmcall;
403#ifdef VBOX_WITH_NESTED_HWVIRT_VMX
404static FNVMXEXITHANDLER hmR0VmxExitVmclear;
405static FNVMXEXITHANDLER hmR0VmxExitVmlaunch;
406static FNVMXEXITHANDLER hmR0VmxExitVmptrld;
407static FNVMXEXITHANDLER hmR0VmxExitVmptrst;
408static FNVMXEXITHANDLER hmR0VmxExitVmread;
409static FNVMXEXITHANDLER hmR0VmxExitVmresume;
410static FNVMXEXITHANDLER hmR0VmxExitVmwrite;
411static FNVMXEXITHANDLER hmR0VmxExitVmxoff;
412static FNVMXEXITHANDLER hmR0VmxExitVmxon;
413#endif
414static FNVMXEXITHANDLER hmR0VmxExitRdtsc;
415static FNVMXEXITHANDLERNSRC hmR0VmxExitRsm;
416static FNVMXEXITHANDLERNSRC hmR0VmxExitSetPendingXcptUD;
417static FNVMXEXITHANDLER hmR0VmxExitMovCRx;
418static FNVMXEXITHANDLER hmR0VmxExitMovDRx;
419static FNVMXEXITHANDLER hmR0VmxExitIoInstr;
420static FNVMXEXITHANDLER hmR0VmxExitRdmsr;
421static FNVMXEXITHANDLER hmR0VmxExitWrmsr;
422static FNVMXEXITHANDLERNSRC hmR0VmxExitErrInvalidGuestState;
423static FNVMXEXITHANDLERNSRC hmR0VmxExitErrMsrLoad;
424static FNVMXEXITHANDLERNSRC hmR0VmxExitErrUndefined;
425static FNVMXEXITHANDLER hmR0VmxExitMwait;
426static FNVMXEXITHANDLER hmR0VmxExitMtf;
427static FNVMXEXITHANDLER hmR0VmxExitMonitor;
428static FNVMXEXITHANDLER hmR0VmxExitPause;
429static FNVMXEXITHANDLERNSRC hmR0VmxExitErrMachineCheck;
430static FNVMXEXITHANDLERNSRC hmR0VmxExitTprBelowThreshold;
431static FNVMXEXITHANDLER hmR0VmxExitApicAccess;
432static FNVMXEXITHANDLER hmR0VmxExitXdtrAccess;
433static FNVMXEXITHANDLER hmR0VmxExitEptViolation;
434static FNVMXEXITHANDLER hmR0VmxExitEptMisconfig;
435static FNVMXEXITHANDLER hmR0VmxExitRdtscp;
436static FNVMXEXITHANDLER hmR0VmxExitPreemptTimer;
437static FNVMXEXITHANDLERNSRC hmR0VmxExitWbinvd;
438static FNVMXEXITHANDLER hmR0VmxExitXsetbv;
439static FNVMXEXITHANDLER hmR0VmxExitRdrand;
440static FNVMXEXITHANDLER hmR0VmxExitInvpcid;
441/** @} */
442
443static int hmR0VmxExitXcptPF(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
444static int hmR0VmxExitXcptMF(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
445static int hmR0VmxExitXcptDB(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
446static int hmR0VmxExitXcptBP(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
447static int hmR0VmxExitXcptGP(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
448static int hmR0VmxExitXcptAC(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
449static int hmR0VmxExitXcptGeneric(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient);
450static uint32_t hmR0VmxCheckGuestState(PVMCPU pVCpu);
451
452
453/*********************************************************************************************************************************
454* Global Variables *
455*********************************************************************************************************************************/
456#ifdef HMVMX_USE_FUNCTION_TABLE
457
458/**
459 * VMX_EXIT dispatch table.
460 */
461static const PFNVMXEXITHANDLER g_apfnVMExitHandlers[VMX_EXIT_MAX + 1] =
462{
463 /* 00 VMX_EXIT_XCPT_OR_NMI */ hmR0VmxExitXcptOrNmi,
464 /* 01 VMX_EXIT_EXT_INT */ hmR0VmxExitExtInt,
465 /* 02 VMX_EXIT_TRIPLE_FAULT */ hmR0VmxExitTripleFault,
466 /* 03 VMX_EXIT_INIT_SIGNAL */ hmR0VmxExitInitSignal,
467 /* 04 VMX_EXIT_SIPI */ hmR0VmxExitSipi,
468 /* 05 VMX_EXIT_IO_SMI */ hmR0VmxExitIoSmi,
469 /* 06 VMX_EXIT_SMI */ hmR0VmxExitSmi,
470 /* 07 VMX_EXIT_INT_WINDOW */ hmR0VmxExitIntWindow,
471 /* 08 VMX_EXIT_NMI_WINDOW */ hmR0VmxExitNmiWindow,
472 /* 09 VMX_EXIT_TASK_SWITCH */ hmR0VmxExitTaskSwitch,
473 /* 10 VMX_EXIT_CPUID */ hmR0VmxExitCpuid,
474 /* 11 VMX_EXIT_GETSEC */ hmR0VmxExitGetsec,
475 /* 12 VMX_EXIT_HLT */ hmR0VmxExitHlt,
476 /* 13 VMX_EXIT_INVD */ hmR0VmxExitInvd,
477 /* 14 VMX_EXIT_INVLPG */ hmR0VmxExitInvlpg,
478 /* 15 VMX_EXIT_RDPMC */ hmR0VmxExitRdpmc,
479 /* 16 VMX_EXIT_RDTSC */ hmR0VmxExitRdtsc,
480 /* 17 VMX_EXIT_RSM */ hmR0VmxExitRsm,
481 /* 18 VMX_EXIT_VMCALL */ hmR0VmxExitVmcall,
482#ifdef VBOX_WITH_NESTED_HWVIRT_VMX
483 /* 19 VMX_EXIT_VMCLEAR */ hmR0VmxExitVmclear,
484 /* 20 VMX_EXIT_VMLAUNCH */ hmR0VmxExitVmlaunch,
485 /* 21 VMX_EXIT_VMPTRLD */ hmR0VmxExitVmptrld,
486 /* 22 VMX_EXIT_VMPTRST */ hmR0VmxExitVmptrst,
487 /* 23 VMX_EXIT_VMREAD */ hmR0VmxExitVmread,
488 /* 24 VMX_EXIT_VMRESUME */ hmR0VmxExitVmresume,
489 /* 25 VMX_EXIT_VMWRITE */ hmR0VmxExitVmwrite,
490 /* 26 VMX_EXIT_VMXOFF */ hmR0VmxExitVmxoff,
491 /* 27 VMX_EXIT_VMXON */ hmR0VmxExitVmxon,
492#else
493 /* 19 VMX_EXIT_VMCLEAR */ hmR0VmxExitSetPendingXcptUD,
494 /* 20 VMX_EXIT_VMLAUNCH */ hmR0VmxExitSetPendingXcptUD,
495 /* 21 VMX_EXIT_VMPTRLD */ hmR0VmxExitSetPendingXcptUD,
496 /* 22 VMX_EXIT_VMPTRST */ hmR0VmxExitSetPendingXcptUD,
497 /* 23 VMX_EXIT_VMREAD */ hmR0VmxExitSetPendingXcptUD,
498 /* 24 VMX_EXIT_VMRESUME */ hmR0VmxExitSetPendingXcptUD,
499 /* 25 VMX_EXIT_VMWRITE */ hmR0VmxExitSetPendingXcptUD,
500 /* 26 VMX_EXIT_VMXOFF */ hmR0VmxExitSetPendingXcptUD,
501 /* 27 VMX_EXIT_VMXON */ hmR0VmxExitSetPendingXcptUD,
502#endif
503 /* 28 VMX_EXIT_MOV_CRX */ hmR0VmxExitMovCRx,
504 /* 29 VMX_EXIT_MOV_DRX */ hmR0VmxExitMovDRx,
505 /* 30 VMX_EXIT_IO_INSTR */ hmR0VmxExitIoInstr,
506 /* 31 VMX_EXIT_RDMSR */ hmR0VmxExitRdmsr,
507 /* 32 VMX_EXIT_WRMSR */ hmR0VmxExitWrmsr,
508 /* 33 VMX_EXIT_ERR_INVALID_GUEST_STATE */ hmR0VmxExitErrInvalidGuestState,
509 /* 34 VMX_EXIT_ERR_MSR_LOAD */ hmR0VmxExitErrMsrLoad,
510 /* 35 UNDEFINED */ hmR0VmxExitErrUndefined,
511 /* 36 VMX_EXIT_MWAIT */ hmR0VmxExitMwait,
512 /* 37 VMX_EXIT_MTF */ hmR0VmxExitMtf,
513 /* 38 UNDEFINED */ hmR0VmxExitErrUndefined,
514 /* 39 VMX_EXIT_MONITOR */ hmR0VmxExitMonitor,
515 /* 40 UNDEFINED */ hmR0VmxExitPause,
516 /* 41 VMX_EXIT_PAUSE */ hmR0VmxExitErrMachineCheck,
517 /* 42 VMX_EXIT_ERR_MACHINE_CHECK */ hmR0VmxExitErrUndefined,
518 /* 43 VMX_EXIT_TPR_BELOW_THRESHOLD */ hmR0VmxExitTprBelowThreshold,
519 /* 44 VMX_EXIT_APIC_ACCESS */ hmR0VmxExitApicAccess,
520 /* 45 UNDEFINED */ hmR0VmxExitErrUndefined,
521 /* 46 VMX_EXIT_GDTR_IDTR_ACCESS */ hmR0VmxExitXdtrAccess,
522 /* 47 VMX_EXIT_LDTR_TR_ACCESS */ hmR0VmxExitXdtrAccess,
523 /* 48 VMX_EXIT_EPT_VIOLATION */ hmR0VmxExitEptViolation,
524 /* 49 VMX_EXIT_EPT_MISCONFIG */ hmR0VmxExitEptMisconfig,
525 /* 50 VMX_EXIT_INVEPT */ hmR0VmxExitSetPendingXcptUD,
526 /* 51 VMX_EXIT_RDTSCP */ hmR0VmxExitRdtscp,
527 /* 52 VMX_EXIT_PREEMPT_TIMER */ hmR0VmxExitPreemptTimer,
528 /* 53 VMX_EXIT_INVVPID */ hmR0VmxExitSetPendingXcptUD,
529 /* 54 VMX_EXIT_WBINVD */ hmR0VmxExitWbinvd,
530 /* 55 VMX_EXIT_XSETBV */ hmR0VmxExitXsetbv,
531 /* 56 VMX_EXIT_APIC_WRITE */ hmR0VmxExitErrUndefined,
532 /* 57 VMX_EXIT_RDRAND */ hmR0VmxExitRdrand,
533 /* 58 VMX_EXIT_INVPCID */ hmR0VmxExitInvpcid,
534 /* 59 VMX_EXIT_VMFUNC */ hmR0VmxExitSetPendingXcptUD,
535 /* 60 VMX_EXIT_ENCLS */ hmR0VmxExitErrUndefined,
536 /* 61 VMX_EXIT_RDSEED */ hmR0VmxExitErrUndefined, /* only spurious exits, so undefined */
537 /* 62 VMX_EXIT_PML_FULL */ hmR0VmxExitErrUndefined,
538 /* 63 VMX_EXIT_XSAVES */ hmR0VmxExitSetPendingXcptUD,
539 /* 64 VMX_EXIT_XRSTORS */ hmR0VmxExitSetPendingXcptUD,
540};
541#endif /* HMVMX_USE_FUNCTION_TABLE */
542
543#if defined(VBOX_STRICT) && defined(LOG_ENABLED)
544static const char * const g_apszVmxInstrErrors[HMVMX_INSTR_ERROR_MAX + 1] =
545{
546 /* 0 */ "(Not Used)",
547 /* 1 */ "VMCALL executed in VMX root operation.",
548 /* 2 */ "VMCLEAR with invalid physical address.",
549 /* 3 */ "VMCLEAR with VMXON pointer.",
550 /* 4 */ "VMLAUNCH with non-clear VMCS.",
551 /* 5 */ "VMRESUME with non-launched VMCS.",
552 /* 6 */ "VMRESUME after VMXOFF",
553 /* 7 */ "VM-entry with invalid control fields.",
554 /* 8 */ "VM-entry with invalid host state fields.",
555 /* 9 */ "VMPTRLD with invalid physical address.",
556 /* 10 */ "VMPTRLD with VMXON pointer.",
557 /* 11 */ "VMPTRLD with incorrect revision identifier.",
558 /* 12 */ "VMREAD/VMWRITE from/to unsupported VMCS component.",
559 /* 13 */ "VMWRITE to read-only VMCS component.",
560 /* 14 */ "(Not Used)",
561 /* 15 */ "VMXON executed in VMX root operation.",
562 /* 16 */ "VM-entry with invalid executive-VMCS pointer.",
563 /* 17 */ "VM-entry with non-launched executing VMCS.",
564 /* 18 */ "VM-entry with executive-VMCS pointer not VMXON pointer.",
565 /* 19 */ "VMCALL with non-clear VMCS.",
566 /* 20 */ "VMCALL with invalid VM-exit control fields.",
567 /* 21 */ "(Not Used)",
568 /* 22 */ "VMCALL with incorrect MSEG revision identifier.",
569 /* 23 */ "VMXOFF under dual monitor treatment of SMIs and SMM.",
570 /* 24 */ "VMCALL with invalid SMM-monitor features.",
571 /* 25 */ "VM-entry with invalid VM-execution control fields in executive VMCS.",
572 /* 26 */ "VM-entry with events blocked by MOV SS.",
573 /* 27 */ "(Not Used)",
574 /* 28 */ "Invalid operand to INVEPT/INVVPID."
575};
576#endif /* VBOX_STRICT */
577
578
579/**
580 * Updates the VM's last error record.
581 *
582 * If there was a VMX instruction error, reads the error data from the VMCS and
583 * updates VCPU's last error record as well.
584 *
585 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
586 * Can be NULL if @a rc is not VERR_VMX_UNABLE_TO_START_VM or
587 * VERR_VMX_INVALID_VMCS_FIELD.
588 * @param rc The error code.
589 */
590static void hmR0VmxUpdateErrorRecord(PVMCPU pVCpu, int rc)
591{
592 if ( rc == VERR_VMX_INVALID_VMCS_FIELD
593 || rc == VERR_VMX_UNABLE_TO_START_VM)
594 {
595 AssertPtrReturnVoid(pVCpu);
596 VMXReadVmcs32(VMX_VMCS32_RO_VM_INSTR_ERROR, &pVCpu->hm.s.vmx.LastError.u32InstrError);
597 }
598 pVCpu->CTX_SUFF(pVM)->hm.s.rcInit = rc;
599}
600
601
602/**
603 * Reads the VM-entry interruption-information field from the VMCS into the VMX
604 * transient structure.
605 *
606 * @returns VBox status code.
607 * @param pVmxTransient Pointer to the VMX transient structure.
608 *
609 * @remarks No-long-jump zone!!!
610 */
611DECLINLINE(int) hmR0VmxReadEntryIntInfoVmcs(PVMXTRANSIENT pVmxTransient)
612{
613 int rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO, &pVmxTransient->uEntryIntInfo);
614 AssertRCReturn(rc, rc);
615 return VINF_SUCCESS;
616}
617
618#ifdef VBOX_STRICT
619/**
620 * Reads the VM-entry exception error code field from the VMCS into
621 * the VMX transient structure.
622 *
623 * @returns VBox status code.
624 * @param pVmxTransient Pointer to the VMX transient structure.
625 *
626 * @remarks No-long-jump zone!!!
627 */
628DECLINLINE(int) hmR0VmxReadEntryXcptErrorCodeVmcs(PVMXTRANSIENT pVmxTransient)
629{
630 int rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_EXCEPTION_ERRCODE, &pVmxTransient->uEntryXcptErrorCode);
631 AssertRCReturn(rc, rc);
632 return VINF_SUCCESS;
633}
634
635
636/**
637 * Reads the VM-entry exception error code field from the VMCS into
638 * the VMX transient structure.
639 *
640 * @returns VBox status code.
641 * @param pVmxTransient Pointer to the VMX transient structure.
642 *
643 * @remarks No-long-jump zone!!!
644 */
645DECLINLINE(int) hmR0VmxReadEntryInstrLenVmcs(PVMXTRANSIENT pVmxTransient)
646{
647 int rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_INSTR_LENGTH, &pVmxTransient->cbEntryInstr);
648 AssertRCReturn(rc, rc);
649 return VINF_SUCCESS;
650}
651#endif /* VBOX_STRICT */
652
653
654/**
655 * Reads the VM-exit interruption-information field from the VMCS into the VMX
656 * transient structure.
657 *
658 * @returns VBox status code.
659 * @param pVmxTransient Pointer to the VMX transient structure.
660 */
661DECLINLINE(int) hmR0VmxReadExitIntInfoVmcs(PVMXTRANSIENT pVmxTransient)
662{
663 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_EXIT_INTERRUPTION_INFO))
664 {
665 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_INTERRUPTION_INFO, &pVmxTransient->uExitIntInfo);
666 AssertRCReturn(rc,rc);
667 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_EXIT_INTERRUPTION_INFO;
668 }
669 return VINF_SUCCESS;
670}
671
672
673/**
674 * Reads the VM-exit interruption error code from the VMCS into the VMX
675 * transient structure.
676 *
677 * @returns VBox status code.
678 * @param pVmxTransient Pointer to the VMX transient structure.
679 */
680DECLINLINE(int) hmR0VmxReadExitIntErrorCodeVmcs(PVMXTRANSIENT pVmxTransient)
681{
682 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_EXIT_INTERRUPTION_ERROR_CODE))
683 {
684 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_INTERRUPTION_ERROR_CODE, &pVmxTransient->uExitIntErrorCode);
685 AssertRCReturn(rc, rc);
686 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_EXIT_INTERRUPTION_ERROR_CODE;
687 }
688 return VINF_SUCCESS;
689}
690
691
692/**
693 * Reads the VM-exit instruction length field from the VMCS into the VMX
694 * transient structure.
695 *
696 * @returns VBox status code.
697 * @param pVmxTransient Pointer to the VMX transient structure.
698 */
699DECLINLINE(int) hmR0VmxReadExitInstrLenVmcs(PVMXTRANSIENT pVmxTransient)
700{
701 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_EXIT_INSTR_LEN))
702 {
703 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_INSTR_LENGTH, &pVmxTransient->cbInstr);
704 AssertRCReturn(rc, rc);
705 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_EXIT_INSTR_LEN;
706 }
707 return VINF_SUCCESS;
708}
709
710
711/**
712 * Reads the VM-exit instruction-information field from the VMCS into
713 * the VMX transient structure.
714 *
715 * @returns VBox status code.
716 * @param pVmxTransient Pointer to the VMX transient structure.
717 */
718DECLINLINE(int) hmR0VmxReadExitInstrInfoVmcs(PVMXTRANSIENT pVmxTransient)
719{
720 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_EXIT_INSTR_INFO))
721 {
722 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_INSTR_INFO, &pVmxTransient->ExitInstrInfo.u);
723 AssertRCReturn(rc, rc);
724 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_EXIT_INSTR_INFO;
725 }
726 return VINF_SUCCESS;
727}
728
729
730/**
731 * Reads the VM-exit Qualification from the VMCS into the VMX transient structure.
732 *
733 * @returns VBox status code.
734 * @param pVCpu The cross context virtual CPU structure of the
735 * calling EMT. (Required for the VMCS cache case.)
736 * @param pVmxTransient Pointer to the VMX transient structure.
737 */
738DECLINLINE(int) hmR0VmxReadExitQualVmcs(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
739{
740 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_EXIT_QUALIFICATION))
741 {
742 int rc = VMXReadVmcsGstN(VMX_VMCS_RO_EXIT_QUALIFICATION, &pVmxTransient->uExitQual); NOREF(pVCpu);
743 AssertRCReturn(rc, rc);
744 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_EXIT_QUALIFICATION;
745 }
746 return VINF_SUCCESS;
747}
748
749
750/**
751 * Reads the Guest-linear address from the VMCS into the VMX transient structure.
752 *
753 * @returns VBox status code.
754 * @param pVCpu The cross context virtual CPU structure of the
755 * calling EMT. (Required for the VMCS cache case.)
756 * @param pVmxTransient Pointer to the VMX transient structure.
757 */
758DECLINLINE(int) hmR0VmxReadGuestLinearAddrVmcs(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
759{
760 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_GUEST_LINEAR_ADDR))
761 {
762 int rc = VMXReadVmcsGstN(VMX_VMCS_RO_GUEST_LINEAR_ADDR, &pVmxTransient->uGuestLinearAddr); NOREF(pVCpu);
763 AssertRCReturn(rc, rc);
764 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_GUEST_LINEAR_ADDR;
765 }
766 return VINF_SUCCESS;
767}
768
769
770/**
771 * Reads the IDT-vectoring information field from the VMCS into the VMX
772 * transient structure.
773 *
774 * @returns VBox status code.
775 * @param pVmxTransient Pointer to the VMX transient structure.
776 *
777 * @remarks No-long-jump zone!!!
778 */
779DECLINLINE(int) hmR0VmxReadIdtVectoringInfoVmcs(PVMXTRANSIENT pVmxTransient)
780{
781 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_IDT_VECTORING_INFO))
782 {
783 int rc = VMXReadVmcs32(VMX_VMCS32_RO_IDT_VECTORING_INFO, &pVmxTransient->uIdtVectoringInfo);
784 AssertRCReturn(rc, rc);
785 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_IDT_VECTORING_INFO;
786 }
787 return VINF_SUCCESS;
788}
789
790
791/**
792 * Reads the IDT-vectoring error code from the VMCS into the VMX
793 * transient structure.
794 *
795 * @returns VBox status code.
796 * @param pVmxTransient Pointer to the VMX transient structure.
797 */
798DECLINLINE(int) hmR0VmxReadIdtVectoringErrorCodeVmcs(PVMXTRANSIENT pVmxTransient)
799{
800 if (!(pVmxTransient->fVmcsFieldsRead & HMVMX_READ_IDT_VECTORING_ERROR_CODE))
801 {
802 int rc = VMXReadVmcs32(VMX_VMCS32_RO_IDT_VECTORING_ERROR_CODE, &pVmxTransient->uIdtVectoringErrorCode);
803 AssertRCReturn(rc, rc);
804 pVmxTransient->fVmcsFieldsRead |= HMVMX_READ_IDT_VECTORING_ERROR_CODE;
805 }
806 return VINF_SUCCESS;
807}
808
809
810/**
811 * Enters VMX root mode operation on the current CPU.
812 *
813 * @returns VBox status code.
814 * @param pVM The cross context VM structure. Can be
815 * NULL, after a resume.
816 * @param HCPhysCpuPage Physical address of the VMXON region.
817 * @param pvCpuPage Pointer to the VMXON region.
818 */
819static int hmR0VmxEnterRootMode(PVM pVM, RTHCPHYS HCPhysCpuPage, void *pvCpuPage)
820{
821 Assert(HCPhysCpuPage && HCPhysCpuPage != NIL_RTHCPHYS);
822 Assert(RT_ALIGN_T(HCPhysCpuPage, _4K, RTHCPHYS) == HCPhysCpuPage);
823 Assert(pvCpuPage);
824 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
825
826 if (pVM)
827 {
828 /* Write the VMCS revision dword to the VMXON region. */
829 *(uint32_t *)pvCpuPage = RT_BF_GET(pVM->hm.s.vmx.Msrs.u64Basic, VMX_BF_BASIC_VMCS_ID);
830 }
831
832 /* Paranoid: Disable interrupts as, in theory, interrupt handlers might mess with CR4. */
833 RTCCUINTREG fEFlags = ASMIntDisableFlags();
834
835 /* Enable the VMX bit in CR4 if necessary. */
836 RTCCUINTREG uOldCr4 = SUPR0ChangeCR4(X86_CR4_VMXE, RTCCUINTREG_MAX);
837
838 /* Enter VMX root mode. */
839 int rc = VMXEnable(HCPhysCpuPage);
840 if (RT_FAILURE(rc))
841 {
842 if (!(uOldCr4 & X86_CR4_VMXE))
843 SUPR0ChangeCR4(0, ~X86_CR4_VMXE);
844
845 if (pVM)
846 pVM->hm.s.vmx.HCPhysVmxEnableError = HCPhysCpuPage;
847 }
848
849 /* Restore interrupts. */
850 ASMSetFlags(fEFlags);
851 return rc;
852}
853
854
855/**
856 * Exits VMX root mode operation on the current CPU.
857 *
858 * @returns VBox status code.
859 */
860static int hmR0VmxLeaveRootMode(void)
861{
862 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
863
864 /* Paranoid: Disable interrupts as, in theory, interrupts handlers might mess with CR4. */
865 RTCCUINTREG fEFlags = ASMIntDisableFlags();
866
867 /* If we're for some reason not in VMX root mode, then don't leave it. */
868 RTCCUINTREG uHostCR4 = ASMGetCR4();
869
870 int rc;
871 if (uHostCR4 & X86_CR4_VMXE)
872 {
873 /* Exit VMX root mode and clear the VMX bit in CR4. */
874 VMXDisable();
875 SUPR0ChangeCR4(0, ~X86_CR4_VMXE);
876 rc = VINF_SUCCESS;
877 }
878 else
879 rc = VERR_VMX_NOT_IN_VMX_ROOT_MODE;
880
881 /* Restore interrupts. */
882 ASMSetFlags(fEFlags);
883 return rc;
884}
885
886
887/**
888 * Allocates and maps one physically contiguous page. The allocated page is
889 * zero'd out. (Used by various VT-x structures).
890 *
891 * @returns IPRT status code.
892 * @param pMemObj Pointer to the ring-0 memory object.
893 * @param ppVirt Where to store the virtual address of the
894 * allocation.
895 * @param pHCPhys Where to store the physical address of the
896 * allocation.
897 */
898static int hmR0VmxPageAllocZ(PRTR0MEMOBJ pMemObj, PRTR0PTR ppVirt, PRTHCPHYS pHCPhys)
899{
900 AssertPtrReturn(pMemObj, VERR_INVALID_PARAMETER);
901 AssertPtrReturn(ppVirt, VERR_INVALID_PARAMETER);
902 AssertPtrReturn(pHCPhys, VERR_INVALID_PARAMETER);
903
904 int rc = RTR0MemObjAllocCont(pMemObj, PAGE_SIZE, false /* fExecutable */);
905 if (RT_FAILURE(rc))
906 return rc;
907 *ppVirt = RTR0MemObjAddress(*pMemObj);
908 *pHCPhys = RTR0MemObjGetPagePhysAddr(*pMemObj, 0 /* iPage */);
909 ASMMemZero32(*ppVirt, PAGE_SIZE);
910 return VINF_SUCCESS;
911}
912
913
914/**
915 * Frees and unmaps an allocated physical page.
916 *
917 * @param pMemObj Pointer to the ring-0 memory object.
918 * @param ppVirt Where to re-initialize the virtual address of
919 * allocation as 0.
920 * @param pHCPhys Where to re-initialize the physical address of the
921 * allocation as 0.
922 */
923static void hmR0VmxPageFree(PRTR0MEMOBJ pMemObj, PRTR0PTR ppVirt, PRTHCPHYS pHCPhys)
924{
925 AssertPtr(pMemObj);
926 AssertPtr(ppVirt);
927 AssertPtr(pHCPhys);
928 if (*pMemObj != NIL_RTR0MEMOBJ)
929 {
930 int rc = RTR0MemObjFree(*pMemObj, true /* fFreeMappings */);
931 AssertRC(rc);
932 *pMemObj = NIL_RTR0MEMOBJ;
933 *ppVirt = 0;
934 *pHCPhys = 0;
935 }
936}
937
938
939/**
940 * Worker function to free VT-x related structures.
941 *
942 * @returns IPRT status code.
943 * @param pVM The cross context VM structure.
944 */
945static void hmR0VmxStructsFree(PVM pVM)
946{
947 for (VMCPUID i = 0; i < pVM->cCpus; i++)
948 {
949 PVMCPU pVCpu = &pVM->aCpus[i];
950 AssertPtr(pVCpu);
951
952 hmR0VmxPageFree(&pVCpu->hm.s.vmx.hMemObjHostMsr, &pVCpu->hm.s.vmx.pvHostMsr, &pVCpu->hm.s.vmx.HCPhysHostMsr);
953 hmR0VmxPageFree(&pVCpu->hm.s.vmx.hMemObjGuestMsr, &pVCpu->hm.s.vmx.pvGuestMsr, &pVCpu->hm.s.vmx.HCPhysGuestMsr);
954
955 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_MSR_BITMAPS)
956 hmR0VmxPageFree(&pVCpu->hm.s.vmx.hMemObjMsrBitmap, &pVCpu->hm.s.vmx.pvMsrBitmap, &pVCpu->hm.s.vmx.HCPhysMsrBitmap);
957
958 hmR0VmxPageFree(&pVCpu->hm.s.vmx.hMemObjVmcs, &pVCpu->hm.s.vmx.pvVmcs, &pVCpu->hm.s.vmx.HCPhysVmcs);
959 }
960
961 hmR0VmxPageFree(&pVM->hm.s.vmx.hMemObjApicAccess, (PRTR0PTR)&pVM->hm.s.vmx.pbApicAccess, &pVM->hm.s.vmx.HCPhysApicAccess);
962#ifdef VBOX_WITH_CRASHDUMP_MAGIC
963 hmR0VmxPageFree(&pVM->hm.s.vmx.hMemObjScratch, &pVM->hm.s.vmx.pbScratch, &pVM->hm.s.vmx.HCPhysScratch);
964#endif
965}
966
967
968/**
969 * Worker function to allocate VT-x related VM structures.
970 *
971 * @returns IPRT status code.
972 * @param pVM The cross context VM structure.
973 */
974static int hmR0VmxStructsAlloc(PVM pVM)
975{
976 /*
977 * Initialize members up-front so we can cleanup properly on allocation failure.
978 */
979#define VMXLOCAL_INIT_VM_MEMOBJ(a_Name, a_VirtPrefix) \
980 pVM->hm.s.vmx.hMemObj##a_Name = NIL_RTR0MEMOBJ; \
981 pVM->hm.s.vmx.a_VirtPrefix##a_Name = 0; \
982 pVM->hm.s.vmx.HCPhys##a_Name = 0;
983
984#define VMXLOCAL_INIT_VMCPU_MEMOBJ(a_Name, a_VirtPrefix) \
985 pVCpu->hm.s.vmx.hMemObj##a_Name = NIL_RTR0MEMOBJ; \
986 pVCpu->hm.s.vmx.a_VirtPrefix##a_Name = 0; \
987 pVCpu->hm.s.vmx.HCPhys##a_Name = 0;
988
989#ifdef VBOX_WITH_CRASHDUMP_MAGIC
990 VMXLOCAL_INIT_VM_MEMOBJ(Scratch, pv);
991#endif
992 VMXLOCAL_INIT_VM_MEMOBJ(ApicAccess, pb);
993
994 AssertCompile(sizeof(VMCPUID) == sizeof(pVM->cCpus));
995 for (VMCPUID i = 0; i < pVM->cCpus; i++)
996 {
997 PVMCPU pVCpu = &pVM->aCpus[i];
998 VMXLOCAL_INIT_VMCPU_MEMOBJ(Vmcs, pv);
999 VMXLOCAL_INIT_VMCPU_MEMOBJ(MsrBitmap, pv);
1000 VMXLOCAL_INIT_VMCPU_MEMOBJ(GuestMsr, pv);
1001 VMXLOCAL_INIT_VMCPU_MEMOBJ(HostMsr, pv);
1002 }
1003#undef VMXLOCAL_INIT_VMCPU_MEMOBJ
1004#undef VMXLOCAL_INIT_VM_MEMOBJ
1005
1006 /* The VMCS size cannot be more than 4096 bytes. See Intel spec. Appendix A.1 "Basic VMX Information". */
1007 AssertReturnStmt(RT_BF_GET(pVM->hm.s.vmx.Msrs.u64Basic, VMX_BF_BASIC_VMCS_SIZE) <= PAGE_SIZE,
1008 (&pVM->aCpus[0])->hm.s.u32HMError = VMX_UFC_INVALID_VMCS_SIZE,
1009 VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO);
1010
1011 /*
1012 * Allocate all the VT-x structures.
1013 */
1014 int rc = VINF_SUCCESS;
1015#ifdef VBOX_WITH_CRASHDUMP_MAGIC
1016 rc = hmR0VmxPageAllocZ(&pVM->hm.s.vmx.hMemObjScratch, &pVM->hm.s.vmx.pbScratch, &pVM->hm.s.vmx.HCPhysScratch);
1017 if (RT_FAILURE(rc))
1018 goto cleanup;
1019 strcpy((char *)pVM->hm.s.vmx.pbScratch, "SCRATCH Magic");
1020 *(uint64_t *)(pVM->hm.s.vmx.pbScratch + 16) = UINT64_C(0xdeadbeefdeadbeef);
1021#endif
1022
1023 /* Allocate the APIC-access page for trapping APIC accesses from the guest. */
1024 if (pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_VIRT_APIC_ACCESS)
1025 {
1026 rc = hmR0VmxPageAllocZ(&pVM->hm.s.vmx.hMemObjApicAccess, (PRTR0PTR)&pVM->hm.s.vmx.pbApicAccess,
1027 &pVM->hm.s.vmx.HCPhysApicAccess);
1028 if (RT_FAILURE(rc))
1029 goto cleanup;
1030 }
1031
1032 /*
1033 * Initialize per-VCPU VT-x structures.
1034 */
1035 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1036 {
1037 PVMCPU pVCpu = &pVM->aCpus[i];
1038 AssertPtr(pVCpu);
1039
1040 /* Allocate the VM control structure (VMCS). */
1041 rc = hmR0VmxPageAllocZ(&pVCpu->hm.s.vmx.hMemObjVmcs, &pVCpu->hm.s.vmx.pvVmcs, &pVCpu->hm.s.vmx.HCPhysVmcs);
1042 if (RT_FAILURE(rc))
1043 goto cleanup;
1044
1045 /* Get the allocated virtual-APIC page from the APIC device for transparent TPR accesses. */
1046 if ( PDMHasApic(pVM)
1047 && (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_TPR_SHADOW))
1048 {
1049 rc = APICGetApicPageForCpu(pVCpu, &pVCpu->hm.s.vmx.HCPhysVirtApic, (PRTR0PTR)&pVCpu->hm.s.vmx.pbVirtApic,
1050 NULL /* pR3Ptr */, NULL /* pRCPtr */);
1051 if (RT_FAILURE(rc))
1052 goto cleanup;
1053 }
1054
1055 /*
1056 * Allocate the MSR-bitmap if supported by the CPU. The MSR-bitmap is for
1057 * transparent accesses of specific MSRs.
1058 *
1059 * If the condition for enabling MSR bitmaps changes here, don't forget to
1060 * update HMAreMsrBitmapsAvailable().
1061 */
1062 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_MSR_BITMAPS)
1063 {
1064 rc = hmR0VmxPageAllocZ(&pVCpu->hm.s.vmx.hMemObjMsrBitmap, &pVCpu->hm.s.vmx.pvMsrBitmap,
1065 &pVCpu->hm.s.vmx.HCPhysMsrBitmap);
1066 if (RT_FAILURE(rc))
1067 goto cleanup;
1068 ASMMemFill32(pVCpu->hm.s.vmx.pvMsrBitmap, PAGE_SIZE, UINT32_C(0xffffffff));
1069 }
1070
1071 /* Allocate the VM-entry MSR-load and VM-exit MSR-store page for the guest MSRs. */
1072 rc = hmR0VmxPageAllocZ(&pVCpu->hm.s.vmx.hMemObjGuestMsr, &pVCpu->hm.s.vmx.pvGuestMsr, &pVCpu->hm.s.vmx.HCPhysGuestMsr);
1073 if (RT_FAILURE(rc))
1074 goto cleanup;
1075
1076 /* Allocate the VM-exit MSR-load page for the host MSRs. */
1077 rc = hmR0VmxPageAllocZ(&pVCpu->hm.s.vmx.hMemObjHostMsr, &pVCpu->hm.s.vmx.pvHostMsr, &pVCpu->hm.s.vmx.HCPhysHostMsr);
1078 if (RT_FAILURE(rc))
1079 goto cleanup;
1080 }
1081
1082 return VINF_SUCCESS;
1083
1084cleanup:
1085 hmR0VmxStructsFree(pVM);
1086 return rc;
1087}
1088
1089
1090/**
1091 * Does global VT-x initialization (called during module initialization).
1092 *
1093 * @returns VBox status code.
1094 */
1095VMMR0DECL(int) VMXR0GlobalInit(void)
1096{
1097#ifdef HMVMX_USE_FUNCTION_TABLE
1098 AssertCompile(VMX_EXIT_MAX + 1 == RT_ELEMENTS(g_apfnVMExitHandlers));
1099# ifdef VBOX_STRICT
1100 for (unsigned i = 0; i < RT_ELEMENTS(g_apfnVMExitHandlers); i++)
1101 Assert(g_apfnVMExitHandlers[i]);
1102# endif
1103#endif
1104 return VINF_SUCCESS;
1105}
1106
1107
1108/**
1109 * Does global VT-x termination (called during module termination).
1110 */
1111VMMR0DECL(void) VMXR0GlobalTerm()
1112{
1113 /* Nothing to do currently. */
1114}
1115
1116
1117/**
1118 * Sets up and activates VT-x on the current CPU.
1119 *
1120 * @returns VBox status code.
1121 * @param pHostCpu Pointer to the global CPU info struct.
1122 * @param pVM The cross context VM structure. Can be
1123 * NULL after a host resume operation.
1124 * @param pvCpuPage Pointer to the VMXON region (can be NULL if @a
1125 * fEnabledByHost is @c true).
1126 * @param HCPhysCpuPage Physical address of the VMXON region (can be 0 if
1127 * @a fEnabledByHost is @c true).
1128 * @param fEnabledByHost Set if SUPR0EnableVTx() or similar was used to
1129 * enable VT-x on the host.
1130 * @param pHwvirtMsrs Pointer to the hardware-virtualization MSRs.
1131 */
1132VMMR0DECL(int) VMXR0EnableCpu(PHMGLOBALCPUINFO pHostCpu, PVM pVM, void *pvCpuPage, RTHCPHYS HCPhysCpuPage, bool fEnabledByHost,
1133 PCSUPHWVIRTMSRS pHwvirtMsrs)
1134{
1135 Assert(pHostCpu);
1136 Assert(pHwvirtMsrs);
1137 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1138
1139 /* Enable VT-x if it's not already enabled by the host. */
1140 if (!fEnabledByHost)
1141 {
1142 int rc = hmR0VmxEnterRootMode(pVM, HCPhysCpuPage, pvCpuPage);
1143 if (RT_FAILURE(rc))
1144 return rc;
1145 }
1146
1147 /*
1148 * Flush all EPT tagged-TLB entries (in case VirtualBox or any other hypervisor have been
1149 * using EPTPs) so we don't retain any stale guest-physical mappings which won't get
1150 * invalidated when flushing by VPID.
1151 */
1152 if (pHwvirtMsrs->u.vmx.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVEPT_ALL_CONTEXTS)
1153 {
1154 hmR0VmxFlushEpt(NULL /* pVCpu */, VMXTLBFLUSHEPT_ALL_CONTEXTS);
1155 pHostCpu->fFlushAsidBeforeUse = false;
1156 }
1157 else
1158 pHostCpu->fFlushAsidBeforeUse = true;
1159
1160 /* Ensure each VCPU scheduled on this CPU gets a new VPID on resume. See @bugref{6255}. */
1161 ++pHostCpu->cTlbFlushes;
1162
1163 return VINF_SUCCESS;
1164}
1165
1166
1167/**
1168 * Deactivates VT-x on the current CPU.
1169 *
1170 * @returns VBox status code.
1171 * @param pHostCpu Pointer to the global CPU info struct.
1172 * @param pvCpuPage Pointer to the VMXON region.
1173 * @param HCPhysCpuPage Physical address of the VMXON region.
1174 *
1175 * @remarks This function should never be called when SUPR0EnableVTx() or
1176 * similar was used to enable VT-x on the host.
1177 */
1178VMMR0DECL(int) VMXR0DisableCpu(PHMGLOBALCPUINFO pHostCpu, void *pvCpuPage, RTHCPHYS HCPhysCpuPage)
1179{
1180 RT_NOREF3(pHostCpu, pvCpuPage, HCPhysCpuPage);
1181
1182 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1183 return hmR0VmxLeaveRootMode();
1184}
1185
1186
1187/**
1188 * Sets the permission bits for the specified MSR in the MSR bitmap.
1189 *
1190 * @param pVCpu The cross context virtual CPU structure.
1191 * @param uMsr The MSR value.
1192 * @param enmRead Whether reading this MSR causes a VM-exit.
1193 * @param enmWrite Whether writing this MSR causes a VM-exit.
1194 */
1195static void hmR0VmxSetMsrPermission(PVMCPU pVCpu, uint32_t uMsr, VMXMSREXITREAD enmRead, VMXMSREXITWRITE enmWrite)
1196{
1197 int32_t iBit;
1198 uint8_t *pbMsrBitmap = (uint8_t *)pVCpu->hm.s.vmx.pvMsrBitmap;
1199
1200 /*
1201 * MSR Layout:
1202 * Byte index MSR range Interpreted as
1203 * 0x000 - 0x3ff 0x00000000 - 0x00001fff Low MSR read bits.
1204 * 0x400 - 0x7ff 0xc0000000 - 0xc0001fff High MSR read bits.
1205 * 0x800 - 0xbff 0x00000000 - 0x00001fff Low MSR write bits.
1206 * 0xc00 - 0xfff 0xc0000000 - 0xc0001fff High MSR write bits.
1207 *
1208 * A bit corresponding to an MSR within the above range causes a VM-exit
1209 * if the bit is 1 on executions of RDMSR/WRMSR.
1210 *
1211 * If an MSR falls out of the MSR range, it always cause a VM-exit.
1212 *
1213 * See Intel spec. 24.6.9 "MSR-Bitmap Address".
1214 */
1215 if (uMsr <= 0x00001fff)
1216 iBit = uMsr;
1217 else if (uMsr - UINT32_C(0xc0000000) <= UINT32_C(0x00001fff))
1218 {
1219 iBit = uMsr - UINT32_C(0xc0000000);
1220 pbMsrBitmap += 0x400;
1221 }
1222 else
1223 AssertMsgFailedReturnVoid(("hmR0VmxSetMsrPermission: Invalid MSR %#RX32\n", uMsr));
1224
1225 Assert(iBit <= 0x1fff);
1226 if (enmRead == VMXMSREXIT_INTERCEPT_READ)
1227 ASMBitSet(pbMsrBitmap, iBit);
1228 else
1229 ASMBitClear(pbMsrBitmap, iBit);
1230
1231 if (enmWrite == VMXMSREXIT_INTERCEPT_WRITE)
1232 ASMBitSet(pbMsrBitmap + 0x800, iBit);
1233 else
1234 ASMBitClear(pbMsrBitmap + 0x800, iBit);
1235}
1236
1237
1238/**
1239 * Updates the VMCS with the number of effective MSRs in the auto-load/store MSR
1240 * area.
1241 *
1242 * @returns VBox status code.
1243 * @param pVCpu The cross context virtual CPU structure.
1244 * @param cMsrs The number of MSRs.
1245 */
1246static int hmR0VmxSetAutoLoadStoreMsrCount(PVMCPU pVCpu, uint32_t cMsrs)
1247{
1248 /* Shouldn't ever happen but there -is- a number. We're well within the recommended 512. */
1249 uint64_t const uVmxMiscMsr = pVCpu->CTX_SUFF(pVM)->hm.s.vmx.Msrs.u64Misc;
1250 uint32_t const cMaxSupportedMsrs = VMX_MISC_MAX_MSRS(uVmxMiscMsr);
1251 if (RT_UNLIKELY(cMsrs > cMaxSupportedMsrs))
1252 {
1253 LogRel(("CPU auto-load/store MSR count in VMCS exceeded cMsrs=%u Supported=%u.\n", cMsrs, cMaxSupportedMsrs));
1254 pVCpu->hm.s.u32HMError = VMX_UFC_INSUFFICIENT_GUEST_MSR_STORAGE;
1255 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
1256 }
1257
1258 /* Update number of guest MSRs to load/store across the world-switch. */
1259 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_MSR_LOAD_COUNT, cMsrs);
1260 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_STORE_COUNT, cMsrs);
1261
1262 /* Update number of host MSRs to load after the world-switch. Identical to guest-MSR count as it's always paired. */
1263 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_LOAD_COUNT, cMsrs);
1264 AssertRCReturn(rc, rc);
1265
1266 /* Update the VCPU's copy of the MSR count. */
1267 pVCpu->hm.s.vmx.cMsrs = cMsrs;
1268
1269 return VINF_SUCCESS;
1270}
1271
1272
1273/**
1274 * Adds a new (or updates the value of an existing) guest/host MSR
1275 * pair to be swapped during the world-switch as part of the
1276 * auto-load/store MSR area in the VMCS.
1277 *
1278 * @returns VBox status code.
1279 * @param pVCpu The cross context virtual CPU structure.
1280 * @param uMsr The MSR.
1281 * @param uGuestMsrValue Value of the guest MSR.
1282 * @param fUpdateHostMsr Whether to update the value of the host MSR if
1283 * necessary.
1284 * @param pfAddedAndUpdated Where to store whether the MSR was added -and-
1285 * its value was updated. Optional, can be NULL.
1286 */
1287static int hmR0VmxAddAutoLoadStoreMsr(PVMCPU pVCpu, uint32_t uMsr, uint64_t uGuestMsrValue, bool fUpdateHostMsr,
1288 bool *pfAddedAndUpdated)
1289{
1290 PVMXAUTOMSR pGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1291 uint32_t cMsrs = pVCpu->hm.s.vmx.cMsrs;
1292 uint32_t i;
1293 for (i = 0; i < cMsrs; i++)
1294 {
1295 if (pGuestMsr->u32Msr == uMsr)
1296 break;
1297 pGuestMsr++;
1298 }
1299
1300 bool fAdded = false;
1301 if (i == cMsrs)
1302 {
1303 ++cMsrs;
1304 int rc = hmR0VmxSetAutoLoadStoreMsrCount(pVCpu, cMsrs);
1305 AssertMsgRCReturn(rc, ("hmR0VmxAddAutoLoadStoreMsr: Insufficient space to add MSR %u\n", uMsr), rc);
1306
1307 /* Now that we're swapping MSRs during the world-switch, allow the guest to read/write them without causing VM-exits. */
1308 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS)
1309 hmR0VmxSetMsrPermission(pVCpu, uMsr, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
1310
1311 fAdded = true;
1312 }
1313
1314 /* Update the MSR values in the auto-load/store MSR area. */
1315 pGuestMsr->u32Msr = uMsr;
1316 pGuestMsr->u64Value = uGuestMsrValue;
1317
1318 /* Create/update the MSR slot in the host MSR area. */
1319 PVMXAUTOMSR pHostMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvHostMsr;
1320 pHostMsr += i;
1321 pHostMsr->u32Msr = uMsr;
1322
1323 /*
1324 * Update the host MSR only when requested by the caller AND when we're
1325 * adding it to the auto-load/store area. Otherwise, it would have been
1326 * updated by hmR0VmxExportHostMsrs(). We do this for performance reasons.
1327 */
1328 bool fUpdatedMsrValue = false;
1329 if ( fAdded
1330 && fUpdateHostMsr)
1331 {
1332 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
1333 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1334 pHostMsr->u64Value = ASMRdMsr(pHostMsr->u32Msr);
1335 fUpdatedMsrValue = true;
1336 }
1337
1338 if (pfAddedAndUpdated)
1339 *pfAddedAndUpdated = fUpdatedMsrValue;
1340 return VINF_SUCCESS;
1341}
1342
1343
1344/**
1345 * Removes a guest/host MSR pair to be swapped during the world-switch from the
1346 * auto-load/store MSR area in the VMCS.
1347 *
1348 * @returns VBox status code.
1349 * @param pVCpu The cross context virtual CPU structure.
1350 * @param uMsr The MSR.
1351 */
1352static int hmR0VmxRemoveAutoLoadStoreMsr(PVMCPU pVCpu, uint32_t uMsr)
1353{
1354 PVMXAUTOMSR pGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1355 uint32_t cMsrs = pVCpu->hm.s.vmx.cMsrs;
1356 for (uint32_t i = 0; i < cMsrs; i++)
1357 {
1358 /* Find the MSR. */
1359 if (pGuestMsr->u32Msr == uMsr)
1360 {
1361 /* If it's the last MSR, simply reduce the count. */
1362 if (i == cMsrs - 1)
1363 {
1364 --cMsrs;
1365 break;
1366 }
1367
1368 /* Remove it by swapping the last MSR in place of it, and reducing the count. */
1369 PVMXAUTOMSR pLastGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1370 pLastGuestMsr += cMsrs - 1;
1371 pGuestMsr->u32Msr = pLastGuestMsr->u32Msr;
1372 pGuestMsr->u64Value = pLastGuestMsr->u64Value;
1373
1374 PVMXAUTOMSR pHostMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvHostMsr;
1375 PVMXAUTOMSR pLastHostMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvHostMsr;
1376 pLastHostMsr += cMsrs - 1;
1377 pHostMsr->u32Msr = pLastHostMsr->u32Msr;
1378 pHostMsr->u64Value = pLastHostMsr->u64Value;
1379 --cMsrs;
1380 break;
1381 }
1382 pGuestMsr++;
1383 }
1384
1385 /* Update the VMCS if the count changed (meaning the MSR was found). */
1386 if (cMsrs != pVCpu->hm.s.vmx.cMsrs)
1387 {
1388 int rc = hmR0VmxSetAutoLoadStoreMsrCount(pVCpu, cMsrs);
1389 AssertRCReturn(rc, rc);
1390
1391 /* We're no longer swapping MSRs during the world-switch, intercept guest read/writes to them. */
1392 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS)
1393 hmR0VmxSetMsrPermission(pVCpu, uMsr, VMXMSREXIT_INTERCEPT_READ, VMXMSREXIT_INTERCEPT_WRITE);
1394
1395 Log4Func(("Removed MSR %#RX32 new cMsrs=%u\n", uMsr, pVCpu->hm.s.vmx.cMsrs));
1396 return VINF_SUCCESS;
1397 }
1398
1399 return VERR_NOT_FOUND;
1400}
1401
1402
1403/**
1404 * Checks if the specified guest MSR is part of the auto-load/store area in
1405 * the VMCS.
1406 *
1407 * @returns true if found, false otherwise.
1408 * @param pVCpu The cross context virtual CPU structure.
1409 * @param uMsr The MSR to find.
1410 */
1411static bool hmR0VmxIsAutoLoadStoreGuestMsr(PVMCPU pVCpu, uint32_t uMsr)
1412{
1413 PVMXAUTOMSR pGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1414 uint32_t cMsrs = pVCpu->hm.s.vmx.cMsrs;
1415
1416 for (uint32_t i = 0; i < cMsrs; i++, pGuestMsr++)
1417 {
1418 if (pGuestMsr->u32Msr == uMsr)
1419 return true;
1420 }
1421 return false;
1422}
1423
1424
1425/**
1426 * Updates the value of all host MSRs in the auto-load/store area in the VMCS.
1427 *
1428 * @param pVCpu The cross context virtual CPU structure.
1429 *
1430 * @remarks No-long-jump zone!!!
1431 */
1432static void hmR0VmxUpdateAutoLoadStoreHostMsrs(PVMCPU pVCpu)
1433{
1434 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1435 PVMXAUTOMSR pHostMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvHostMsr;
1436 PVMXAUTOMSR pGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1437 uint32_t cMsrs = pVCpu->hm.s.vmx.cMsrs;
1438
1439 for (uint32_t i = 0; i < cMsrs; i++, pHostMsr++, pGuestMsr++)
1440 {
1441 AssertReturnVoid(pHostMsr->u32Msr == pGuestMsr->u32Msr);
1442
1443 /*
1444 * Performance hack for the host EFER MSR. We use the cached value rather than re-read it.
1445 * Strict builds will catch mismatches in hmR0VmxCheckAutoLoadStoreMsrs(). See @bugref{7368}.
1446 */
1447 if (pHostMsr->u32Msr == MSR_K6_EFER)
1448 pHostMsr->u64Value = pVCpu->CTX_SUFF(pVM)->hm.s.vmx.u64HostEfer;
1449 else
1450 pHostMsr->u64Value = ASMRdMsr(pHostMsr->u32Msr);
1451 }
1452
1453 pVCpu->hm.s.vmx.fUpdatedHostMsrs = true;
1454}
1455
1456
1457/**
1458 * Saves a set of host MSRs to allow read/write passthru access to the guest and
1459 * perform lazy restoration of the host MSRs while leaving VT-x.
1460 *
1461 * @param pVCpu The cross context virtual CPU structure.
1462 *
1463 * @remarks No-long-jump zone!!!
1464 */
1465static void hmR0VmxLazySaveHostMsrs(PVMCPU pVCpu)
1466{
1467 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1468
1469 /*
1470 * Note: If you're adding MSRs here, make sure to update the MSR-bitmap permissions in hmR0VmxSetupProcCtls().
1471 */
1472 if (!(pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_SAVED_HOST))
1473 {
1474 Assert(!(pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST)); /* Guest MSRs better not be loaded now. */
1475#if HC_ARCH_BITS == 64
1476 if (pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests)
1477 {
1478 pVCpu->hm.s.vmx.u64HostLStarMsr = ASMRdMsr(MSR_K8_LSTAR);
1479 pVCpu->hm.s.vmx.u64HostStarMsr = ASMRdMsr(MSR_K6_STAR);
1480 pVCpu->hm.s.vmx.u64HostSFMaskMsr = ASMRdMsr(MSR_K8_SF_MASK);
1481 pVCpu->hm.s.vmx.u64HostKernelGSBaseMsr = ASMRdMsr(MSR_K8_KERNEL_GS_BASE);
1482 }
1483#endif
1484 pVCpu->hm.s.vmx.fLazyMsrs |= VMX_LAZY_MSRS_SAVED_HOST;
1485 }
1486}
1487
1488
1489/**
1490 * Checks whether the MSR belongs to the set of guest MSRs that we restore
1491 * lazily while leaving VT-x.
1492 *
1493 * @returns true if it does, false otherwise.
1494 * @param pVCpu The cross context virtual CPU structure.
1495 * @param uMsr The MSR to check.
1496 */
1497static bool hmR0VmxIsLazyGuestMsr(PVMCPU pVCpu, uint32_t uMsr)
1498{
1499 NOREF(pVCpu);
1500#if HC_ARCH_BITS == 64
1501 if (pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests)
1502 {
1503 switch (uMsr)
1504 {
1505 case MSR_K8_LSTAR:
1506 case MSR_K6_STAR:
1507 case MSR_K8_SF_MASK:
1508 case MSR_K8_KERNEL_GS_BASE:
1509 return true;
1510 }
1511 }
1512#else
1513 RT_NOREF(pVCpu, uMsr);
1514#endif
1515 return false;
1516}
1517
1518
1519/**
1520 * Loads a set of guests MSRs to allow read/passthru to the guest.
1521 *
1522 * The name of this function is slightly confusing. This function does NOT
1523 * postpone loading, but loads the MSR right now. "hmR0VmxLazy" is simply a
1524 * common prefix for functions dealing with "lazy restoration" of the shared
1525 * MSRs.
1526 *
1527 * @param pVCpu The cross context virtual CPU structure.
1528 *
1529 * @remarks No-long-jump zone!!!
1530 */
1531static void hmR0VmxLazyLoadGuestMsrs(PVMCPU pVCpu)
1532{
1533 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1534 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
1535
1536 Assert(pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_SAVED_HOST);
1537#if HC_ARCH_BITS == 64
1538 if (pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests)
1539 {
1540 /*
1541 * If the guest MSRs are not loaded -and- if all the guest MSRs are identical
1542 * to the MSRs on the CPU (which are the saved host MSRs, see assertion above) then
1543 * we can skip a few MSR writes.
1544 *
1545 * Otherwise, it implies either 1. they're not loaded, or 2. they're loaded but the
1546 * guest MSR values in the guest-CPU context might be different to what's currently
1547 * loaded in the CPU. In either case, we need to write the new guest MSR values to the
1548 * CPU, see @bugref{8728}.
1549 */
1550 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
1551 if ( !(pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST)
1552 && pCtx->msrKERNELGSBASE == pVCpu->hm.s.vmx.u64HostKernelGSBaseMsr
1553 && pCtx->msrLSTAR == pVCpu->hm.s.vmx.u64HostLStarMsr
1554 && pCtx->msrSTAR == pVCpu->hm.s.vmx.u64HostStarMsr
1555 && pCtx->msrSFMASK == pVCpu->hm.s.vmx.u64HostSFMaskMsr)
1556 {
1557#ifdef VBOX_STRICT
1558 Assert(ASMRdMsr(MSR_K8_KERNEL_GS_BASE) == pCtx->msrKERNELGSBASE);
1559 Assert(ASMRdMsr(MSR_K8_LSTAR) == pCtx->msrLSTAR);
1560 Assert(ASMRdMsr(MSR_K6_STAR) == pCtx->msrSTAR);
1561 Assert(ASMRdMsr(MSR_K8_SF_MASK) == pCtx->msrSFMASK);
1562#endif
1563 }
1564 else
1565 {
1566 ASMWrMsr(MSR_K8_KERNEL_GS_BASE, pCtx->msrKERNELGSBASE);
1567 ASMWrMsr(MSR_K8_LSTAR, pCtx->msrLSTAR);
1568 ASMWrMsr(MSR_K6_STAR, pCtx->msrSTAR);
1569 ASMWrMsr(MSR_K8_SF_MASK, pCtx->msrSFMASK);
1570 }
1571 }
1572#endif
1573 pVCpu->hm.s.vmx.fLazyMsrs |= VMX_LAZY_MSRS_LOADED_GUEST;
1574}
1575
1576
1577/**
1578 * Performs lazy restoration of the set of host MSRs if they were previously
1579 * loaded with guest MSR values.
1580 *
1581 * @param pVCpu The cross context virtual CPU structure.
1582 *
1583 * @remarks No-long-jump zone!!!
1584 * @remarks The guest MSRs should have been saved back into the guest-CPU
1585 * context by hmR0VmxImportGuestState()!!!
1586 */
1587static void hmR0VmxLazyRestoreHostMsrs(PVMCPU pVCpu)
1588{
1589 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1590 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
1591
1592 if (pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST)
1593 {
1594 Assert(pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_SAVED_HOST);
1595#if HC_ARCH_BITS == 64
1596 if (pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests)
1597 {
1598 ASMWrMsr(MSR_K8_LSTAR, pVCpu->hm.s.vmx.u64HostLStarMsr);
1599 ASMWrMsr(MSR_K6_STAR, pVCpu->hm.s.vmx.u64HostStarMsr);
1600 ASMWrMsr(MSR_K8_SF_MASK, pVCpu->hm.s.vmx.u64HostSFMaskMsr);
1601 ASMWrMsr(MSR_K8_KERNEL_GS_BASE, pVCpu->hm.s.vmx.u64HostKernelGSBaseMsr);
1602 }
1603#endif
1604 }
1605 pVCpu->hm.s.vmx.fLazyMsrs &= ~(VMX_LAZY_MSRS_LOADED_GUEST | VMX_LAZY_MSRS_SAVED_HOST);
1606}
1607
1608
1609/**
1610 * Verifies that our cached values of the VMCS fields are all consistent with
1611 * what's actually present in the VMCS.
1612 *
1613 * @returns VBox status code.
1614 * @retval VINF_SUCCESS if all our caches match their respective VMCS fields.
1615 * @retval VERR_VMX_VMCS_FIELD_CACHE_INVALID if a cache field doesn't match the
1616 * VMCS content. HMCPU error-field is
1617 * updated, see VMX_VCI_XXX.
1618 * @param pVCpu The cross context virtual CPU structure.
1619 */
1620static int hmR0VmxCheckVmcsCtls(PVMCPU pVCpu)
1621{
1622 uint32_t u32Val;
1623 int rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY, &u32Val);
1624 AssertRCReturn(rc, rc);
1625 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32EntryCtls == u32Val,
1626 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32EntryCtls, u32Val),
1627 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_ENTRY,
1628 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1629
1630 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT, &u32Val);
1631 AssertRCReturn(rc, rc);
1632 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32ExitCtls == u32Val,
1633 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32ExitCtls, u32Val),
1634 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_EXIT,
1635 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1636
1637 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PIN_EXEC, &u32Val);
1638 AssertRCReturn(rc, rc);
1639 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32PinCtls == u32Val,
1640 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32PinCtls, u32Val),
1641 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_PIN_EXEC,
1642 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1643
1644 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, &u32Val);
1645 AssertRCReturn(rc, rc);
1646 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32ProcCtls == u32Val,
1647 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32ProcCtls, u32Val),
1648 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_PROC_EXEC,
1649 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1650
1651 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_SECONDARY_CTLS)
1652 {
1653 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PROC_EXEC2, &u32Val);
1654 AssertRCReturn(rc, rc);
1655 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32ProcCtls2 == u32Val,
1656 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32ProcCtls2, u32Val),
1657 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_PROC_EXEC2,
1658 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1659 }
1660
1661 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, &u32Val);
1662 AssertRCReturn(rc, rc);
1663 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u32XcptBitmap == u32Val,
1664 ("Cache=%#RX32 VMCS=%#RX32\n", pVCpu->hm.s.vmx.u32XcptBitmap, u32Val),
1665 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_XCPT_BITMAP,
1666 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1667
1668 uint64_t u64Val;
1669 rc = VMXReadVmcs64(VMX_VMCS64_CTRL_TSC_OFFSET_FULL, &u64Val);
1670 AssertRCReturn(rc, rc);
1671 AssertMsgReturnStmt(pVCpu->hm.s.vmx.u64TscOffset == u64Val,
1672 ("Cache=%#RX64 VMCS=%#RX64\n", pVCpu->hm.s.vmx.u64TscOffset, u64Val),
1673 pVCpu->hm.s.u32HMError = VMX_VCI_CTRL_TSC_OFFSET,
1674 VERR_VMX_VMCS_FIELD_CACHE_INVALID);
1675
1676 return VINF_SUCCESS;
1677}
1678
1679
1680#ifdef VBOX_STRICT
1681/**
1682 * Verifies that our cached host EFER value has not changed
1683 * since we cached it.
1684 *
1685 * @param pVCpu The cross context virtual CPU structure.
1686 */
1687static void hmR0VmxCheckHostEferMsr(PVMCPU pVCpu)
1688{
1689 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1690
1691 if (pVCpu->hm.s.vmx.u32ExitCtls & VMX_EXIT_CTLS_LOAD_EFER_MSR)
1692 {
1693 uint64_t u64Val;
1694 int rc = VMXReadVmcs64(VMX_VMCS64_HOST_EFER_FULL, &u64Val);
1695 AssertRC(rc);
1696
1697 uint64_t u64HostEferMsr = ASMRdMsr(MSR_K6_EFER);
1698 AssertMsgReturnVoid(u64HostEferMsr == u64Val, ("u64HostEferMsr=%#RX64 u64Val=%#RX64\n", u64HostEferMsr, u64Val));
1699 }
1700}
1701
1702
1703/**
1704 * Verifies whether the guest/host MSR pairs in the auto-load/store area in the
1705 * VMCS are correct.
1706 *
1707 * @param pVCpu The cross context virtual CPU structure.
1708 */
1709static void hmR0VmxCheckAutoLoadStoreMsrs(PVMCPU pVCpu)
1710{
1711 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1712
1713 /* Verify MSR counts in the VMCS are what we think it should be. */
1714 uint32_t cMsrs;
1715 int rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_MSR_LOAD_COUNT, &cMsrs); AssertRC(rc);
1716 Assert(cMsrs == pVCpu->hm.s.vmx.cMsrs);
1717
1718 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_STORE_COUNT, &cMsrs); AssertRC(rc);
1719 Assert(cMsrs == pVCpu->hm.s.vmx.cMsrs);
1720
1721 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_LOAD_COUNT, &cMsrs); AssertRC(rc);
1722 Assert(cMsrs == pVCpu->hm.s.vmx.cMsrs);
1723
1724 PCVMXAUTOMSR pHostMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvHostMsr;
1725 PCVMXAUTOMSR pGuestMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
1726 for (uint32_t i = 0; i < cMsrs; i++, pHostMsr++, pGuestMsr++)
1727 {
1728 /* Verify that the MSRs are paired properly and that the host MSR has the correct value. */
1729 AssertMsgReturnVoid(pHostMsr->u32Msr == pGuestMsr->u32Msr, ("HostMsr=%#RX32 GuestMsr=%#RX32 cMsrs=%u\n", pHostMsr->u32Msr,
1730 pGuestMsr->u32Msr, cMsrs));
1731
1732 uint64_t u64Msr = ASMRdMsr(pHostMsr->u32Msr);
1733 AssertMsgReturnVoid(pHostMsr->u64Value == u64Msr, ("u32Msr=%#RX32 VMCS Value=%#RX64 ASMRdMsr=%#RX64 cMsrs=%u\n",
1734 pHostMsr->u32Msr, pHostMsr->u64Value, u64Msr, cMsrs));
1735
1736 /* Verify that the permissions are as expected in the MSR bitmap. */
1737 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS)
1738 {
1739 VMXMSREXITREAD enmRead;
1740 VMXMSREXITWRITE enmWrite;
1741 rc = HMVmxGetMsrPermission(pVCpu->hm.s.vmx.pvMsrBitmap, pGuestMsr->u32Msr, &enmRead, &enmWrite);
1742 AssertMsgReturnVoid(rc == VINF_SUCCESS, ("HMVmxGetMsrPermission! failed. rc=%Rrc\n", rc));
1743 if (pGuestMsr->u32Msr == MSR_K6_EFER)
1744 {
1745 AssertMsgReturnVoid(enmRead == VMXMSREXIT_INTERCEPT_READ, ("Passthru read for EFER!?\n"));
1746 AssertMsgReturnVoid(enmWrite == VMXMSREXIT_INTERCEPT_WRITE, ("Passthru write for EFER!?\n"));
1747 }
1748 else
1749 {
1750 AssertMsgReturnVoid(enmRead == VMXMSREXIT_PASSTHRU_READ, ("u32Msr=%#RX32 cMsrs=%u No passthru read!\n",
1751 pGuestMsr->u32Msr, cMsrs));
1752 AssertMsgReturnVoid(enmWrite == VMXMSREXIT_PASSTHRU_WRITE, ("u32Msr=%#RX32 cMsrs=%u No passthru write!\n",
1753 pGuestMsr->u32Msr, cMsrs));
1754 }
1755 }
1756 }
1757}
1758#endif /* VBOX_STRICT */
1759
1760
1761/**
1762 * Flushes the TLB using EPT.
1763 *
1764 * @returns VBox status code.
1765 * @param pVCpu The cross context virtual CPU structure of the calling
1766 * EMT. Can be NULL depending on @a enmTlbFlush.
1767 * @param enmTlbFlush Type of flush.
1768 *
1769 * @remarks Caller is responsible for making sure this function is called only
1770 * when NestedPaging is supported and providing @a enmTlbFlush that is
1771 * supported by the CPU.
1772 * @remarks Can be called with interrupts disabled.
1773 */
1774static void hmR0VmxFlushEpt(PVMCPU pVCpu, VMXTLBFLUSHEPT enmTlbFlush)
1775{
1776 uint64_t au64Descriptor[2];
1777 if (enmTlbFlush == VMXTLBFLUSHEPT_ALL_CONTEXTS)
1778 au64Descriptor[0] = 0;
1779 else
1780 {
1781 Assert(pVCpu);
1782 au64Descriptor[0] = pVCpu->hm.s.vmx.HCPhysEPTP;
1783 }
1784 au64Descriptor[1] = 0; /* MBZ. Intel spec. 33.3 "VMX Instructions" */
1785
1786 int rc = VMXR0InvEPT(enmTlbFlush, &au64Descriptor[0]);
1787 AssertMsg(rc == VINF_SUCCESS,
1788 ("VMXR0InvEPT %#x %RGv failed with %Rrc\n", enmTlbFlush, pVCpu ? pVCpu->hm.s.vmx.HCPhysEPTP : 0, rc));
1789
1790 if ( RT_SUCCESS(rc)
1791 && pVCpu)
1792 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushNestedPaging);
1793}
1794
1795
1796/**
1797 * Flushes the TLB using VPID.
1798 *
1799 * @returns VBox status code.
1800 * @param pVCpu The cross context virtual CPU structure of the calling
1801 * EMT. Can be NULL depending on @a enmTlbFlush.
1802 * @param enmTlbFlush Type of flush.
1803 * @param GCPtr Virtual address of the page to flush (can be 0 depending
1804 * on @a enmTlbFlush).
1805 *
1806 * @remarks Can be called with interrupts disabled.
1807 */
1808static void hmR0VmxFlushVpid(PVMCPU pVCpu, VMXTLBFLUSHVPID enmTlbFlush, RTGCPTR GCPtr)
1809{
1810 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fVpid);
1811
1812 uint64_t au64Descriptor[2];
1813 if (enmTlbFlush == VMXTLBFLUSHVPID_ALL_CONTEXTS)
1814 {
1815 au64Descriptor[0] = 0;
1816 au64Descriptor[1] = 0;
1817 }
1818 else
1819 {
1820 AssertPtr(pVCpu);
1821 AssertMsg(pVCpu->hm.s.uCurrentAsid != 0, ("VMXR0InvVPID: invalid ASID %lu\n", pVCpu->hm.s.uCurrentAsid));
1822 AssertMsg(pVCpu->hm.s.uCurrentAsid <= UINT16_MAX, ("VMXR0InvVPID: invalid ASID %lu\n", pVCpu->hm.s.uCurrentAsid));
1823 au64Descriptor[0] = pVCpu->hm.s.uCurrentAsid;
1824 au64Descriptor[1] = GCPtr;
1825 }
1826
1827 int rc = VMXR0InvVPID(enmTlbFlush, &au64Descriptor[0]);
1828 AssertMsg(rc == VINF_SUCCESS,
1829 ("VMXR0InvVPID %#x %u %RGv failed with %Rrc\n", enmTlbFlush, pVCpu ? pVCpu->hm.s.uCurrentAsid : 0, GCPtr, rc));
1830
1831 if ( RT_SUCCESS(rc)
1832 && pVCpu)
1833 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushAsid);
1834 NOREF(rc);
1835}
1836
1837
1838/**
1839 * Invalidates a guest page by guest virtual address. Only relevant for
1840 * EPT/VPID, otherwise there is nothing really to invalidate.
1841 *
1842 * @returns VBox status code.
1843 * @param pVCpu The cross context virtual CPU structure.
1844 * @param GCVirt Guest virtual address of the page to invalidate.
1845 */
1846VMMR0DECL(int) VMXR0InvalidatePage(PVMCPU pVCpu, RTGCPTR GCVirt)
1847{
1848 AssertPtr(pVCpu);
1849 LogFlowFunc(("pVCpu=%p GCVirt=%RGv\n", pVCpu, GCVirt));
1850
1851 bool fFlushPending = VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
1852 if (!fFlushPending)
1853 {
1854 /*
1855 * We must invalidate the guest TLB entry in either case, we cannot ignore it even for
1856 * the EPT case. See @bugref{6043} and @bugref{6177}.
1857 *
1858 * Set the VMCPU_FF_TLB_FLUSH force flag and flush before VM-entry in hmR0VmxFlushTLB*()
1859 * as this function maybe called in a loop with individual addresses.
1860 */
1861 PVM pVM = pVCpu->CTX_SUFF(pVM);
1862 if (pVM->hm.s.vmx.fVpid)
1863 {
1864 bool fVpidFlush = RT_BOOL(pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_INDIV_ADDR);
1865
1866#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
1867 /*
1868 * Workaround Erratum BV75, AAJ159 and others that affect several Intel CPUs
1869 * where executing INVVPID outside 64-bit mode does not flush translations of
1870 * 64-bit linear addresses, see @bugref{6208#c72}.
1871 */
1872 if (RT_HI_U32(GCVirt))
1873 fVpidFlush = false;
1874#endif
1875
1876 if (fVpidFlush)
1877 {
1878 hmR0VmxFlushVpid(pVCpu, VMXTLBFLUSHVPID_INDIV_ADDR, GCVirt);
1879 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbInvlpgVirt);
1880 }
1881 else
1882 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
1883 }
1884 else if (pVM->hm.s.fNestedPaging)
1885 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
1886 }
1887
1888 return VINF_SUCCESS;
1889}
1890
1891
1892/**
1893 * Dummy placeholder for tagged-TLB flush handling before VM-entry. Used in the
1894 * case where neither EPT nor VPID is supported by the CPU.
1895 *
1896 * @param pVCpu The cross context virtual CPU structure.
1897 * @param pCpu Pointer to the global HM struct.
1898 *
1899 * @remarks Called with interrupts disabled.
1900 */
1901static void hmR0VmxFlushTaggedTlbNone(PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
1902{
1903 AssertPtr(pVCpu);
1904 AssertPtr(pCpu);
1905
1906 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH);
1907
1908 Assert(pCpu->idCpu != NIL_RTCPUID);
1909 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
1910 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
1911 pVCpu->hm.s.fForceTLBFlush = false;
1912 return;
1913}
1914
1915
1916/**
1917 * Flushes the tagged-TLB entries for EPT+VPID CPUs as necessary.
1918 *
1919 * @param pVCpu The cross context virtual CPU structure.
1920 * @param pCpu Pointer to the global HM CPU struct.
1921 *
1922 * @remarks All references to "ASID" in this function pertains to "VPID" in Intel's
1923 * nomenclature. The reason is, to avoid confusion in compare statements
1924 * since the host-CPU copies are named "ASID".
1925 *
1926 * @remarks Called with interrupts disabled.
1927 */
1928static void hmR0VmxFlushTaggedTlbBoth(PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
1929{
1930#ifdef VBOX_WITH_STATISTICS
1931 bool fTlbFlushed = false;
1932# define HMVMX_SET_TAGGED_TLB_FLUSHED() do { fTlbFlushed = true; } while (0)
1933# define HMVMX_UPDATE_FLUSH_SKIPPED_STAT() do { \
1934 if (!fTlbFlushed) \
1935 STAM_COUNTER_INC(&pVCpu->hm.s.StatNoFlushTlbWorldSwitch); \
1936 } while (0)
1937#else
1938# define HMVMX_SET_TAGGED_TLB_FLUSHED() do { } while (0)
1939# define HMVMX_UPDATE_FLUSH_SKIPPED_STAT() do { } while (0)
1940#endif
1941
1942 AssertPtr(pCpu);
1943 AssertPtr(pVCpu);
1944 Assert(pCpu->idCpu != NIL_RTCPUID);
1945
1946 PVM pVM = pVCpu->CTX_SUFF(pVM);
1947 AssertMsg(pVM->hm.s.fNestedPaging && pVM->hm.s.vmx.fVpid,
1948 ("hmR0VmxFlushTaggedTlbBoth cannot be invoked unless NestedPaging & VPID are enabled."
1949 "fNestedPaging=%RTbool fVpid=%RTbool", pVM->hm.s.fNestedPaging, pVM->hm.s.vmx.fVpid));
1950
1951 /*
1952 * Force a TLB flush for the first world-switch if the current CPU differs from the one we
1953 * ran on last. If the TLB flush count changed, another VM (VCPU rather) has hit the ASID
1954 * limit while flushing the TLB or the host CPU is online after a suspend/resume, so we
1955 * cannot reuse the current ASID anymore.
1956 */
1957 if ( pVCpu->hm.s.idLastCpu != pCpu->idCpu
1958 || pVCpu->hm.s.cTlbFlushes != pCpu->cTlbFlushes)
1959 {
1960 ++pCpu->uCurrentAsid;
1961 if (pCpu->uCurrentAsid >= pVM->hm.s.uMaxAsid)
1962 {
1963 pCpu->uCurrentAsid = 1; /* Wraparound to 1; host uses 0. */
1964 pCpu->cTlbFlushes++; /* All VCPUs that run on this host CPU must use a new VPID. */
1965 pCpu->fFlushAsidBeforeUse = true; /* All VCPUs that run on this host CPU must flush their new VPID before use. */
1966 }
1967
1968 pVCpu->hm.s.uCurrentAsid = pCpu->uCurrentAsid;
1969 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
1970 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
1971
1972 /*
1973 * Flush by EPT when we get rescheduled to a new host CPU to ensure EPT-only tagged mappings are also
1974 * invalidated. We don't need to flush-by-VPID here as flushing by EPT covers it. See @bugref{6568}.
1975 */
1976 hmR0VmxFlushEpt(pVCpu, pVM->hm.s.vmx.enmTlbFlushEpt);
1977 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbWorldSwitch);
1978 HMVMX_SET_TAGGED_TLB_FLUSHED();
1979 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH);
1980 }
1981 else if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH)) /* Check for explicit TLB flushes. */
1982 {
1983 /*
1984 * Changes to the EPT paging structure by VMM requires flushing-by-EPT as the CPU
1985 * creates guest-physical (ie. only EPT-tagged) mappings while traversing the EPT
1986 * tables when EPT is in use. Flushing-by-VPID will only flush linear (only
1987 * VPID-tagged) and combined (EPT+VPID tagged) mappings but not guest-physical
1988 * mappings, see @bugref{6568}.
1989 *
1990 * See Intel spec. 28.3.2 "Creating and Using Cached Translation Information".
1991 */
1992 hmR0VmxFlushEpt(pVCpu, pVM->hm.s.vmx.enmTlbFlushEpt);
1993 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlb);
1994 HMVMX_SET_TAGGED_TLB_FLUSHED();
1995 }
1996
1997 pVCpu->hm.s.fForceTLBFlush = false;
1998 HMVMX_UPDATE_FLUSH_SKIPPED_STAT();
1999
2000 Assert(pVCpu->hm.s.idLastCpu == pCpu->idCpu);
2001 Assert(pVCpu->hm.s.cTlbFlushes == pCpu->cTlbFlushes);
2002 AssertMsg(pVCpu->hm.s.cTlbFlushes == pCpu->cTlbFlushes,
2003 ("Flush count mismatch for cpu %d (%u vs %u)\n", pCpu->idCpu, pVCpu->hm.s.cTlbFlushes, pCpu->cTlbFlushes));
2004 AssertMsg(pCpu->uCurrentAsid >= 1 && pCpu->uCurrentAsid < pVM->hm.s.uMaxAsid,
2005 ("Cpu[%u] uCurrentAsid=%u cTlbFlushes=%u pVCpu->idLastCpu=%u pVCpu->cTlbFlushes=%u\n", pCpu->idCpu,
2006 pCpu->uCurrentAsid, pCpu->cTlbFlushes, pVCpu->hm.s.idLastCpu, pVCpu->hm.s.cTlbFlushes));
2007 AssertMsg(pVCpu->hm.s.uCurrentAsid >= 1 && pVCpu->hm.s.uCurrentAsid < pVM->hm.s.uMaxAsid,
2008 ("Cpu[%u] pVCpu->uCurrentAsid=%u\n", pCpu->idCpu, pVCpu->hm.s.uCurrentAsid));
2009
2010 /* Update VMCS with the VPID. */
2011 int rc = VMXWriteVmcs32(VMX_VMCS16_VPID, pVCpu->hm.s.uCurrentAsid);
2012 AssertRC(rc);
2013
2014#undef HMVMX_SET_TAGGED_TLB_FLUSHED
2015}
2016
2017
2018/**
2019 * Flushes the tagged-TLB entries for EPT CPUs as necessary.
2020 *
2021 * @returns VBox status code.
2022 * @param pVCpu The cross context virtual CPU structure.
2023 * @param pCpu Pointer to the global HM CPU struct.
2024 *
2025 * @remarks Called with interrupts disabled.
2026 */
2027static void hmR0VmxFlushTaggedTlbEpt(PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
2028{
2029 AssertPtr(pVCpu);
2030 AssertPtr(pCpu);
2031 Assert(pCpu->idCpu != NIL_RTCPUID);
2032 AssertMsg(pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging, ("hmR0VmxFlushTaggedTlbEpt cannot be invoked without NestedPaging."));
2033 AssertMsg(!pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fVpid, ("hmR0VmxFlushTaggedTlbEpt cannot be invoked with VPID."));
2034
2035 /*
2036 * Force a TLB flush for the first world-switch if the current CPU differs from the one we ran on last.
2037 * A change in the TLB flush count implies the host CPU is online after a suspend/resume.
2038 */
2039 if ( pVCpu->hm.s.idLastCpu != pCpu->idCpu
2040 || pVCpu->hm.s.cTlbFlushes != pCpu->cTlbFlushes)
2041 {
2042 pVCpu->hm.s.fForceTLBFlush = true;
2043 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbWorldSwitch);
2044 }
2045
2046 /* Check for explicit TLB flushes. */
2047 if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH))
2048 {
2049 pVCpu->hm.s.fForceTLBFlush = true;
2050 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlb);
2051 }
2052
2053 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
2054 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
2055
2056 if (pVCpu->hm.s.fForceTLBFlush)
2057 {
2058 hmR0VmxFlushEpt(pVCpu, pVCpu->CTX_SUFF(pVM)->hm.s.vmx.enmTlbFlushEpt);
2059 pVCpu->hm.s.fForceTLBFlush = false;
2060 }
2061}
2062
2063
2064/**
2065 * Flushes the tagged-TLB entries for VPID CPUs as necessary.
2066 *
2067 * @returns VBox status code.
2068 * @param pVCpu The cross context virtual CPU structure.
2069 * @param pCpu Pointer to the global HM CPU struct.
2070 *
2071 * @remarks Called with interrupts disabled.
2072 */
2073static void hmR0VmxFlushTaggedTlbVpid(PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
2074{
2075 AssertPtr(pVCpu);
2076 AssertPtr(pCpu);
2077 Assert(pCpu->idCpu != NIL_RTCPUID);
2078 AssertMsg(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fVpid, ("hmR0VmxFlushTlbVpid cannot be invoked without VPID."));
2079 AssertMsg(!pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging, ("hmR0VmxFlushTlbVpid cannot be invoked with NestedPaging"));
2080
2081 /*
2082 * Force a TLB flush for the first world switch if the current CPU differs from the one we
2083 * ran on last. If the TLB flush count changed, another VM (VCPU rather) has hit the ASID
2084 * limit while flushing the TLB or the host CPU is online after a suspend/resume, so we
2085 * cannot reuse the current ASID anymore.
2086 */
2087 if ( pVCpu->hm.s.idLastCpu != pCpu->idCpu
2088 || pVCpu->hm.s.cTlbFlushes != pCpu->cTlbFlushes)
2089 {
2090 pVCpu->hm.s.fForceTLBFlush = true;
2091 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbWorldSwitch);
2092 }
2093
2094 /* Check for explicit TLB flushes. */
2095 if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH))
2096 {
2097 /*
2098 * If we ever support VPID flush combinations other than ALL or SINGLE-context (see
2099 * hmR0VmxSetupTaggedTlb()) we would need to explicitly flush in this case (add an
2100 * fExplicitFlush = true here and change the pCpu->fFlushAsidBeforeUse check below to
2101 * include fExplicitFlush's too) - an obscure corner case.
2102 */
2103 pVCpu->hm.s.fForceTLBFlush = true;
2104 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlb);
2105 }
2106
2107 PVM pVM = pVCpu->CTX_SUFF(pVM);
2108 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
2109 if (pVCpu->hm.s.fForceTLBFlush)
2110 {
2111 ++pCpu->uCurrentAsid;
2112 if (pCpu->uCurrentAsid >= pVM->hm.s.uMaxAsid)
2113 {
2114 pCpu->uCurrentAsid = 1; /* Wraparound to 1; host uses 0 */
2115 pCpu->cTlbFlushes++; /* All VCPUs that run on this host CPU must use a new VPID. */
2116 pCpu->fFlushAsidBeforeUse = true; /* All VCPUs that run on this host CPU must flush their new VPID before use. */
2117 }
2118
2119 pVCpu->hm.s.fForceTLBFlush = false;
2120 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
2121 pVCpu->hm.s.uCurrentAsid = pCpu->uCurrentAsid;
2122 if (pCpu->fFlushAsidBeforeUse)
2123 {
2124 if (pVM->hm.s.vmx.enmTlbFlushVpid == VMXTLBFLUSHVPID_SINGLE_CONTEXT)
2125 hmR0VmxFlushVpid(pVCpu, VMXTLBFLUSHVPID_SINGLE_CONTEXT, 0 /* GCPtr */);
2126 else if (pVM->hm.s.vmx.enmTlbFlushVpid == VMXTLBFLUSHVPID_ALL_CONTEXTS)
2127 {
2128 hmR0VmxFlushVpid(pVCpu, VMXTLBFLUSHVPID_ALL_CONTEXTS, 0 /* GCPtr */);
2129 pCpu->fFlushAsidBeforeUse = false;
2130 }
2131 else
2132 {
2133 /* hmR0VmxSetupTaggedTlb() ensures we never get here. Paranoia. */
2134 AssertMsgFailed(("Unsupported VPID-flush context type.\n"));
2135 }
2136 }
2137 }
2138
2139 AssertMsg(pVCpu->hm.s.cTlbFlushes == pCpu->cTlbFlushes,
2140 ("Flush count mismatch for cpu %d (%u vs %u)\n", pCpu->idCpu, pVCpu->hm.s.cTlbFlushes, pCpu->cTlbFlushes));
2141 AssertMsg(pCpu->uCurrentAsid >= 1 && pCpu->uCurrentAsid < pVM->hm.s.uMaxAsid,
2142 ("Cpu[%u] uCurrentAsid=%u cTlbFlushes=%u pVCpu->idLastCpu=%u pVCpu->cTlbFlushes=%u\n", pCpu->idCpu,
2143 pCpu->uCurrentAsid, pCpu->cTlbFlushes, pVCpu->hm.s.idLastCpu, pVCpu->hm.s.cTlbFlushes));
2144 AssertMsg(pVCpu->hm.s.uCurrentAsid >= 1 && pVCpu->hm.s.uCurrentAsid < pVM->hm.s.uMaxAsid,
2145 ("Cpu[%u] pVCpu->uCurrentAsid=%u\n", pCpu->idCpu, pVCpu->hm.s.uCurrentAsid));
2146
2147 int rc = VMXWriteVmcs32(VMX_VMCS16_VPID, pVCpu->hm.s.uCurrentAsid);
2148 AssertRC(rc);
2149}
2150
2151
2152/**
2153 * Flushes the guest TLB entry based on CPU capabilities.
2154 *
2155 * @param pVCpu The cross context virtual CPU structure.
2156 * @param pCpu Pointer to the global HM CPU struct.
2157 */
2158DECLINLINE(void) hmR0VmxFlushTaggedTlb(PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
2159{
2160#ifdef HMVMX_ALWAYS_FLUSH_TLB
2161 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
2162#endif
2163 PVM pVM = pVCpu->CTX_SUFF(pVM);
2164 switch (pVM->hm.s.vmx.enmTlbFlushType)
2165 {
2166 case VMXTLBFLUSHTYPE_EPT_VPID: hmR0VmxFlushTaggedTlbBoth(pVCpu, pCpu); break;
2167 case VMXTLBFLUSHTYPE_EPT: hmR0VmxFlushTaggedTlbEpt(pVCpu, pCpu); break;
2168 case VMXTLBFLUSHTYPE_VPID: hmR0VmxFlushTaggedTlbVpid(pVCpu, pCpu); break;
2169 case VMXTLBFLUSHTYPE_NONE: hmR0VmxFlushTaggedTlbNone(pVCpu, pCpu); break;
2170 default:
2171 AssertMsgFailed(("Invalid flush-tag function identifier\n"));
2172 break;
2173 }
2174 /* Don't assert that VMCPU_FF_TLB_FLUSH should no longer be pending. It can be set by other EMTs. */
2175}
2176
2177
2178/**
2179 * Sets up the appropriate tagged TLB-flush level and handler for flushing guest
2180 * TLB entries from the host TLB before VM-entry.
2181 *
2182 * @returns VBox status code.
2183 * @param pVM The cross context VM structure.
2184 */
2185static int hmR0VmxSetupTaggedTlb(PVM pVM)
2186{
2187 /*
2188 * Determine optimal flush type for Nested Paging.
2189 * We cannot ignore EPT if no suitable flush-types is supported by the CPU as we've already setup unrestricted
2190 * guest execution (see hmR3InitFinalizeR0()).
2191 */
2192 if (pVM->hm.s.fNestedPaging)
2193 {
2194 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVEPT)
2195 {
2196 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVEPT_SINGLE_CONTEXT)
2197 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_SINGLE_CONTEXT;
2198 else if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVEPT_ALL_CONTEXTS)
2199 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_ALL_CONTEXTS;
2200 else
2201 {
2202 /* Shouldn't happen. EPT is supported but no suitable flush-types supported. */
2203 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_NOT_SUPPORTED;
2204 pVM->aCpus[0].hm.s.u32HMError = VMX_UFC_EPT_FLUSH_TYPE_UNSUPPORTED;
2205 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2206 }
2207
2208 /* Make sure the write-back cacheable memory type for EPT is supported. */
2209 if (RT_UNLIKELY(!(pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_EMT_WB)))
2210 {
2211 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_NOT_SUPPORTED;
2212 pVM->aCpus[0].hm.s.u32HMError = VMX_UFC_EPT_MEM_TYPE_NOT_WB;
2213 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2214 }
2215
2216 /* EPT requires a page-walk length of 4. */
2217 if (RT_UNLIKELY(!(pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_PAGE_WALK_LENGTH_4)))
2218 {
2219 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_NOT_SUPPORTED;
2220 pVM->aCpus[0].hm.s.u32HMError = VMX_UFC_EPT_PAGE_WALK_LENGTH_UNSUPPORTED;
2221 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2222 }
2223 }
2224 else
2225 {
2226 /* Shouldn't happen. EPT is supported but INVEPT instruction is not supported. */
2227 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_NOT_SUPPORTED;
2228 pVM->aCpus[0].hm.s.u32HMError = VMX_UFC_EPT_INVEPT_UNAVAILABLE;
2229 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2230 }
2231 }
2232
2233 /*
2234 * Determine optimal flush type for VPID.
2235 */
2236 if (pVM->hm.s.vmx.fVpid)
2237 {
2238 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID)
2239 {
2240 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_SINGLE_CONTEXT)
2241 pVM->hm.s.vmx.enmTlbFlushVpid = VMXTLBFLUSHVPID_SINGLE_CONTEXT;
2242 else if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_ALL_CONTEXTS)
2243 pVM->hm.s.vmx.enmTlbFlushVpid = VMXTLBFLUSHVPID_ALL_CONTEXTS;
2244 else
2245 {
2246 /* Neither SINGLE nor ALL-context flush types for VPID is supported by the CPU. Ignore VPID capability. */
2247 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_INDIV_ADDR)
2248 LogRelFunc(("Only INDIV_ADDR supported. Ignoring VPID.\n"));
2249 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_SINGLE_CONTEXT_RETAIN_GLOBALS)
2250 LogRelFunc(("Only SINGLE_CONTEXT_RETAIN_GLOBALS supported. Ignoring VPID.\n"));
2251 pVM->hm.s.vmx.enmTlbFlushVpid = VMXTLBFLUSHVPID_NOT_SUPPORTED;
2252 pVM->hm.s.vmx.fVpid = false;
2253 }
2254 }
2255 else
2256 {
2257 /* Shouldn't happen. VPID is supported but INVVPID is not supported by the CPU. Ignore VPID capability. */
2258 Log4Func(("VPID supported without INVEPT support. Ignoring VPID.\n"));
2259 pVM->hm.s.vmx.enmTlbFlushVpid = VMXTLBFLUSHVPID_NOT_SUPPORTED;
2260 pVM->hm.s.vmx.fVpid = false;
2261 }
2262 }
2263
2264 /*
2265 * Setup the handler for flushing tagged-TLBs.
2266 */
2267 if (pVM->hm.s.fNestedPaging && pVM->hm.s.vmx.fVpid)
2268 pVM->hm.s.vmx.enmTlbFlushType = VMXTLBFLUSHTYPE_EPT_VPID;
2269 else if (pVM->hm.s.fNestedPaging)
2270 pVM->hm.s.vmx.enmTlbFlushType = VMXTLBFLUSHTYPE_EPT;
2271 else if (pVM->hm.s.vmx.fVpid)
2272 pVM->hm.s.vmx.enmTlbFlushType = VMXTLBFLUSHTYPE_VPID;
2273 else
2274 pVM->hm.s.vmx.enmTlbFlushType = VMXTLBFLUSHTYPE_NONE;
2275 return VINF_SUCCESS;
2276}
2277
2278
2279/**
2280 * Sets up pin-based VM-execution controls in the VMCS.
2281 *
2282 * @returns VBox status code.
2283 * @param pVCpu The cross context virtual CPU structure.
2284 *
2285 * @remarks We don't really care about optimizing vmwrites here as it's done only
2286 * once per VM and hence we don't care about VMCS-field cache comparisons.
2287 */
2288static int hmR0VmxSetupPinCtls(PVMCPU pVCpu)
2289{
2290 PVM pVM = pVCpu->CTX_SUFF(pVM);
2291 uint32_t fVal = pVM->hm.s.vmx.Msrs.PinCtls.n.allowed0; /* Bits set here must always be set. */
2292 uint32_t const fZap = pVM->hm.s.vmx.Msrs.PinCtls.n.allowed1; /* Bits cleared here must always be cleared. */
2293
2294 fVal |= VMX_PIN_CTLS_EXT_INT_EXIT /* External interrupts cause a VM-exit. */
2295 | VMX_PIN_CTLS_NMI_EXIT; /* Non-maskable interrupts (NMIs) cause a VM-exit. */
2296
2297 if (pVM->hm.s.vmx.Msrs.PinCtls.n.allowed1 & VMX_PIN_CTLS_VIRT_NMI)
2298 fVal |= VMX_PIN_CTLS_VIRT_NMI; /* Use virtual NMIs and virtual-NMI blocking features. */
2299
2300 /* Enable the VMX preemption timer. */
2301 if (pVM->hm.s.vmx.fUsePreemptTimer)
2302 {
2303 Assert(pVM->hm.s.vmx.Msrs.PinCtls.n.allowed1 & VMX_PIN_CTLS_PREEMPT_TIMER);
2304 fVal |= VMX_PIN_CTLS_PREEMPT_TIMER;
2305 }
2306
2307#if 0
2308 /* Enable posted-interrupt processing. */
2309 if (pVM->hm.s.fPostedIntrs)
2310 {
2311 Assert(pVM->hm.s.vmx.Msrs.PinCtls.n.allowed1 & VMX_PIN_CTLS_POSTED_INT);
2312 Assert(pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed1 & VMX_EXIT_CTLS_ACK_EXT_INT);
2313 fVal |= VMX_PIN_CTL_POSTED_INT;
2314 }
2315#endif
2316
2317 if ((fVal & fZap) != fVal)
2318 {
2319 LogRelFunc(("Invalid pin-based VM-execution controls combo! Cpu=%#RX32 fVal=%#RX32 fZap=%#RX32\n",
2320 pVM->hm.s.vmx.Msrs.PinCtls.n.allowed0, fVal, fZap));
2321 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_PIN_EXEC;
2322 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2323 }
2324
2325 /* Commit it to the VMCS and update our cache. */
2326 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PIN_EXEC, fVal);
2327 AssertRCReturn(rc, rc);
2328 pVCpu->hm.s.vmx.u32PinCtls = fVal;
2329
2330 return VINF_SUCCESS;
2331}
2332
2333
2334/**
2335 * Sets up secondary processor-based VM-execution controls in the VMCS.
2336 *
2337 * @returns VBox status code.
2338 * @param pVCpu The cross context virtual CPU structure.
2339 *
2340 * @remarks We don't really care about optimizing vmwrites here as it's done only
2341 * once per VM and hence we don't care about VMCS-field cache comparisons.
2342 */
2343static int hmR0VmxSetupProcCtls2(PVMCPU pVCpu)
2344{
2345 PVM pVM = pVCpu->CTX_SUFF(pVM);
2346 uint32_t fVal = pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed0; /* Bits set here must be set in the VMCS. */
2347 uint32_t const fZap = pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1; /* Bits cleared here must be cleared in the VMCS. */
2348
2349 /* WBINVD causes a VM-exit. */
2350 if (pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_WBINVD_EXIT)
2351 fVal |= VMX_PROC_CTLS2_WBINVD_EXIT;
2352
2353 /* Enable EPT (aka nested-paging). */
2354 if (pVM->hm.s.fNestedPaging)
2355 fVal |= VMX_PROC_CTLS2_EPT;
2356
2357 /*
2358 * Enable the INVPCID instruction if supported by the hardware and we expose
2359 * it to the guest. Without this, guest executing INVPCID would cause a #UD.
2360 */
2361 if ( (pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_INVPCID)
2362 && pVM->cpum.ro.GuestFeatures.fInvpcid)
2363 fVal |= VMX_PROC_CTLS2_INVPCID;
2364
2365 /* Enable VPID. */
2366 if (pVM->hm.s.vmx.fVpid)
2367 fVal |= VMX_PROC_CTLS2_VPID;
2368
2369 /* Enable Unrestricted guest execution. */
2370 if (pVM->hm.s.vmx.fUnrestrictedGuest)
2371 fVal |= VMX_PROC_CTLS2_UNRESTRICTED_GUEST;
2372
2373#if 0
2374 if (pVM->hm.s.fVirtApicRegs)
2375 {
2376 /* Enable APIC-register virtualization. */
2377 Assert(pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_APIC_REG_VIRT);
2378 fVal |= VMX_PROC_CTLS2_APIC_REG_VIRT;
2379
2380 /* Enable virtual-interrupt delivery. */
2381 Assert(pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_VIRT_INTR_DELIVERY);
2382 fVal |= VMX_PROC_CTLS2_VIRT_INTR_DELIVERY;
2383 }
2384#endif
2385
2386 /* Virtualize-APIC accesses if supported by the CPU. The virtual-APIC page is where the TPR shadow resides. */
2387 /** @todo VIRT_X2APIC support, it's mutually exclusive with this. So must be
2388 * done dynamically. */
2389 if (pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_VIRT_APIC_ACCESS)
2390 {
2391 Assert(pVM->hm.s.vmx.HCPhysApicAccess);
2392 Assert(!(pVM->hm.s.vmx.HCPhysApicAccess & 0xfff)); /* Bits 11:0 MBZ. */
2393 fVal |= VMX_PROC_CTLS2_VIRT_APIC_ACCESS; /* Virtualize APIC accesses. */
2394 int rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_APIC_ACCESSADDR_FULL, pVM->hm.s.vmx.HCPhysApicAccess);
2395 AssertRCReturn(rc, rc);
2396 }
2397
2398 /* Enable RDTSCP. */
2399 if (pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_RDTSCP)
2400 fVal |= VMX_PROC_CTLS2_RDTSCP;
2401
2402 /* Enable Pause-Loop exiting. */
2403 if ( pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1 & VMX_PROC_CTLS2_PAUSE_LOOP_EXIT
2404 && pVM->hm.s.vmx.cPleGapTicks
2405 && pVM->hm.s.vmx.cPleWindowTicks)
2406 {
2407 fVal |= VMX_PROC_CTLS2_PAUSE_LOOP_EXIT;
2408
2409 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PLE_GAP, pVM->hm.s.vmx.cPleGapTicks);
2410 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_PLE_WINDOW, pVM->hm.s.vmx.cPleWindowTicks);
2411 AssertRCReturn(rc, rc);
2412 }
2413
2414 if ((fVal & fZap) != fVal)
2415 {
2416 LogRelFunc(("Invalid secondary processor-based VM-execution controls combo! cpu=%#RX32 fVal=%#RX32 fZap=%#RX32\n",
2417 pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed0, fVal, fZap));
2418 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_PROC_EXEC2;
2419 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2420 }
2421
2422 /* Commit it to the VMCS and update our cache. */
2423 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC2, fVal);
2424 AssertRCReturn(rc, rc);
2425 pVCpu->hm.s.vmx.u32ProcCtls2 = fVal;
2426
2427 return VINF_SUCCESS;
2428}
2429
2430
2431/**
2432 * Sets up processor-based VM-execution controls in the VMCS.
2433 *
2434 * @returns VBox status code.
2435 * @param pVCpu The cross context virtual CPU structure.
2436 *
2437 * @remarks We don't really care about optimizing vmwrites here as it's done only
2438 * once per VM and hence we don't care about VMCS-field cache comparisons.
2439 */
2440static int hmR0VmxSetupProcCtls(PVMCPU pVCpu)
2441{
2442 PVM pVM = pVCpu->CTX_SUFF(pVM);
2443 uint32_t fVal = pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed0; /* Bits set here must be set in the VMCS. */
2444 uint32_t const fZap = pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1; /* Bits cleared here must be cleared in the VMCS. */
2445
2446 fVal |= VMX_PROC_CTLS_HLT_EXIT /* HLT causes a VM-exit. */
2447 | VMX_PROC_CTLS_USE_TSC_OFFSETTING /* Use TSC-offsetting. */
2448 | VMX_PROC_CTLS_MOV_DR_EXIT /* MOV DRx causes a VM-exit. */
2449 | VMX_PROC_CTLS_UNCOND_IO_EXIT /* All IO instructions cause a VM-exit. */
2450 | VMX_PROC_CTLS_RDPMC_EXIT /* RDPMC causes a VM-exit. */
2451 | VMX_PROC_CTLS_MONITOR_EXIT /* MONITOR causes a VM-exit. */
2452 | VMX_PROC_CTLS_MWAIT_EXIT; /* MWAIT causes a VM-exit. */
2453
2454 /* We toggle VMX_PROC_CTLS_MOV_DR_EXIT later, check if it's not -always- needed to be set or clear. */
2455 if ( !(pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_MOV_DR_EXIT)
2456 || (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed0 & VMX_PROC_CTLS_MOV_DR_EXIT))
2457 {
2458 LogRelFunc(("Unsupported VMX_PROC_CTLS_MOV_DR_EXIT combo!"));
2459 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_PROC_MOV_DRX_EXIT;
2460 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2461 }
2462
2463 /* Without Nested Paging, INVLPG (also affects INVPCID) and MOV CR3 instructions should cause VM-exits. */
2464 if (!pVM->hm.s.fNestedPaging)
2465 {
2466 Assert(!pVM->hm.s.vmx.fUnrestrictedGuest); /* Paranoia. */
2467 fVal |= VMX_PROC_CTLS_INVLPG_EXIT
2468 | VMX_PROC_CTLS_CR3_LOAD_EXIT
2469 | VMX_PROC_CTLS_CR3_STORE_EXIT;
2470 }
2471
2472 /* Use TPR shadowing if supported by the CPU. */
2473 if ( PDMHasApic(pVM)
2474 && pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_TPR_SHADOW)
2475 {
2476 Assert(pVCpu->hm.s.vmx.HCPhysVirtApic);
2477 Assert(!(pVCpu->hm.s.vmx.HCPhysVirtApic & 0xfff)); /* Bits 11:0 MBZ. */
2478 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_TPR_THRESHOLD, 0);
2479 rc |= VMXWriteVmcs64(VMX_VMCS64_CTRL_VIRT_APIC_PAGEADDR_FULL, pVCpu->hm.s.vmx.HCPhysVirtApic);
2480 AssertRCReturn(rc, rc);
2481
2482 fVal |= VMX_PROC_CTLS_USE_TPR_SHADOW; /* CR8 reads from the Virtual-APIC page. */
2483 /* CR8 writes cause a VM-exit based on TPR threshold. */
2484 Assert(!(fVal & VMX_PROC_CTLS_CR8_STORE_EXIT));
2485 Assert(!(fVal & VMX_PROC_CTLS_CR8_LOAD_EXIT));
2486 }
2487 else
2488 {
2489 /*
2490 * Some 32-bit CPUs do not support CR8 load/store exiting as MOV CR8 is invalid on 32-bit Intel CPUs.
2491 * Set this control only for 64-bit guests.
2492 */
2493 if (pVM->hm.s.fAllow64BitGuests)
2494 {
2495 fVal |= VMX_PROC_CTLS_CR8_STORE_EXIT /* CR8 reads cause a VM-exit. */
2496 | VMX_PROC_CTLS_CR8_LOAD_EXIT; /* CR8 writes cause a VM-exit. */
2497 }
2498 }
2499
2500 /* Use MSR-bitmaps if supported by the CPU. */
2501 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_MSR_BITMAPS)
2502 {
2503 fVal |= VMX_PROC_CTLS_USE_MSR_BITMAPS;
2504
2505 Assert(pVCpu->hm.s.vmx.HCPhysMsrBitmap);
2506 Assert(!(pVCpu->hm.s.vmx.HCPhysMsrBitmap & 0xfff)); /* Bits 11:0 MBZ. */
2507 int rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_MSR_BITMAP_FULL, pVCpu->hm.s.vmx.HCPhysMsrBitmap);
2508 AssertRCReturn(rc, rc);
2509
2510 /*
2511 * The guest can access the following MSRs (read, write) without causing VM-exits; they are loaded/stored
2512 * automatically using dedicated fields in the VMCS.
2513 */
2514 hmR0VmxSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_CS, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2515 hmR0VmxSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_ESP, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2516 hmR0VmxSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_EIP, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2517 hmR0VmxSetMsrPermission(pVCpu, MSR_K8_GS_BASE, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2518 hmR0VmxSetMsrPermission(pVCpu, MSR_K8_FS_BASE, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2519#if HC_ARCH_BITS == 64
2520 /*
2521 * Set passthru permissions for the following MSRs (mandatory for VT-x) required for 64-bit guests.
2522 */
2523 if (pVM->hm.s.fAllow64BitGuests)
2524 {
2525 hmR0VmxSetMsrPermission(pVCpu, MSR_K8_LSTAR, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2526 hmR0VmxSetMsrPermission(pVCpu, MSR_K6_STAR, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2527 hmR0VmxSetMsrPermission(pVCpu, MSR_K8_SF_MASK, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2528 hmR0VmxSetMsrPermission(pVCpu, MSR_K8_KERNEL_GS_BASE, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2529 }
2530#endif
2531 /*
2532 * The IA32_PRED_CMD MSR is write-only and has no state associated with it. We never need to intercept
2533 * access (writes need to be executed without exiting, reds will #GP-fault anyway).
2534 */
2535 if (pVM->cpum.ro.GuestFeatures.fIbpb)
2536 hmR0VmxSetMsrPermission(pVCpu, MSR_IA32_PRED_CMD, VMXMSREXIT_PASSTHRU_READ, VMXMSREXIT_PASSTHRU_WRITE);
2537
2538 /* Though MSR_IA32_PERF_GLOBAL_CTRL is saved/restored lazily, we want intercept reads/write to it for now. */
2539 }
2540
2541 /* Use the secondary processor-based VM-execution controls if supported by the CPU. */
2542 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_SECONDARY_CTLS)
2543 fVal |= VMX_PROC_CTLS_USE_SECONDARY_CTLS;
2544
2545 if ((fVal & fZap) != fVal)
2546 {
2547 LogRelFunc(("Invalid processor-based VM-execution controls combo! cpu=%#RX32 fVal=%#RX32 fZap=%#RX32\n",
2548 pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed0, fVal, fZap));
2549 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_PROC_EXEC;
2550 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2551 }
2552
2553 /* Commit it to the VMCS and update our cache. */
2554 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, fVal);
2555 AssertRCReturn(rc, rc);
2556 pVCpu->hm.s.vmx.u32ProcCtls = fVal;
2557
2558 /* Set up secondary processor-based VM-execution controls if the CPU supports it. */
2559 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_SECONDARY_CTLS)
2560 return hmR0VmxSetupProcCtls2(pVCpu);
2561
2562 /* Sanity check, should not really happen. */
2563 if (RT_UNLIKELY(pVM->hm.s.vmx.fUnrestrictedGuest))
2564 {
2565 LogRelFunc(("Unrestricted Guest enabled when secondary processor-based VM-execution controls not available\n"));
2566 pVCpu->hm.s.u32HMError = VMX_UFC_INVALID_UX_COMBO;
2567 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
2568 }
2569
2570 /* Old CPUs without secondary processor-based VM-execution controls would end up here. */
2571 return VINF_SUCCESS;
2572}
2573
2574
2575/**
2576 * Sets up miscellaneous (everything other than Pin & Processor-based
2577 * VM-execution) control fields in the VMCS.
2578 *
2579 * @returns VBox status code.
2580 * @param pVCpu The cross context virtual CPU structure.
2581 */
2582static int hmR0VmxSetupMiscCtls(PVMCPU pVCpu)
2583{
2584 AssertPtr(pVCpu);
2585
2586 int rc = VERR_GENERAL_FAILURE;
2587
2588 /* All fields are zero-initialized during allocation; but don't remove the commented block below. */
2589#if 0
2590 /* All CR3 accesses cause VM-exits. Later we optimize CR3 accesses (see hmR0VmxExportGuestCR3AndCR4())*/
2591 rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_CR3_TARGET_COUNT, 0);
2592 rc |= VMXWriteVmcs64(VMX_VMCS64_CTRL_TSC_OFFSET_FULL, 0);
2593
2594 /*
2595 * Set MASK & MATCH to 0. VMX checks if GuestPFErrCode & MASK == MATCH. If equal (in our case it always is)
2596 * and if the X86_XCPT_PF bit in the exception bitmap is set it causes a VM-exit, if clear doesn't cause an exit.
2597 * We thus use the exception bitmap to control it rather than use both.
2598 */
2599 rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MASK, 0);
2600 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MATCH, 0);
2601
2602 /* All IO & IOIO instructions cause VM-exits. */
2603 rc |= VMXWriteVmcs64(VMX_VMCS64_CTRL_IO_BITMAP_A_FULL, 0);
2604 rc |= VMXWriteVmcs64(VMX_VMCS64_CTRL_IO_BITMAP_B_FULL, 0);
2605
2606 /* Initialize the MSR-bitmap area. */
2607 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_MSR_LOAD_COUNT, 0);
2608 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_STORE_COUNT, 0);
2609 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_LOAD_COUNT, 0);
2610 AssertRCReturn(rc, rc);
2611#endif
2612
2613 /* Setup MSR auto-load/store area. */
2614 Assert(pVCpu->hm.s.vmx.HCPhysGuestMsr);
2615 Assert(!(pVCpu->hm.s.vmx.HCPhysGuestMsr & 0xf)); /* Lower 4 bits MBZ. */
2616 rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_ENTRY_MSR_LOAD_FULL, pVCpu->hm.s.vmx.HCPhysGuestMsr);
2617 rc |= VMXWriteVmcs64(VMX_VMCS64_CTRL_EXIT_MSR_STORE_FULL, pVCpu->hm.s.vmx.HCPhysGuestMsr);
2618 AssertRCReturn(rc, rc);
2619
2620 Assert(pVCpu->hm.s.vmx.HCPhysHostMsr);
2621 Assert(!(pVCpu->hm.s.vmx.HCPhysHostMsr & 0xf)); /* Lower 4 bits MBZ. */
2622 rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_EXIT_MSR_LOAD_FULL, pVCpu->hm.s.vmx.HCPhysHostMsr);
2623 AssertRCReturn(rc, rc);
2624
2625 /* Set VMCS link pointer. Reserved for future use, must be -1. Intel spec. 24.4 "Guest-State Area". */
2626 rc = VMXWriteVmcs64(VMX_VMCS64_GUEST_VMCS_LINK_PTR_FULL, UINT64_C(0xffffffffffffffff));
2627 AssertRCReturn(rc, rc);
2628
2629 /* All fields are zero-initialized during allocation; but don't remove the commented block below. */
2630#if 0
2631 /* Setup debug controls */
2632 rc = VMXWriteVmcs64(VMX_VMCS64_GUEST_DEBUGCTL_FULL, 0);
2633 rc |= VMXWriteVmcs32(VMX_VMCS_GUEST_PENDING_DEBUG_XCPTS, 0);
2634 AssertRCReturn(rc, rc);
2635#endif
2636
2637 return rc;
2638}
2639
2640
2641/**
2642 * Sets up the initial exception bitmap in the VMCS based on static conditions.
2643 *
2644 * We shall setup those exception intercepts that don't change during the
2645 * lifetime of the VM here. The rest are done dynamically while loading the
2646 * guest state.
2647 *
2648 * @returns VBox status code.
2649 * @param pVCpu The cross context virtual CPU structure.
2650 */
2651static int hmR0VmxInitXcptBitmap(PVMCPU pVCpu)
2652{
2653 AssertPtr(pVCpu);
2654
2655 uint32_t uXcptBitmap;
2656
2657 /* Must always intercept #AC to prevent the guest from hanging the CPU. */
2658 uXcptBitmap = RT_BIT_32(X86_XCPT_AC);
2659
2660 /* Because we need to maintain the DR6 state even when intercepting DRx reads
2661 and writes, and because recursive #DBs can cause the CPU hang, we must always
2662 intercept #DB. */
2663 uXcptBitmap |= RT_BIT_32(X86_XCPT_DB);
2664
2665 /* Without Nested Paging, #PF must cause a VM-exit so we can sync our shadow page tables. */
2666 if (!pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging)
2667 uXcptBitmap |= RT_BIT(X86_XCPT_PF);
2668
2669 /* Commit it to the VMCS. */
2670 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, uXcptBitmap);
2671 AssertRCReturn(rc, rc);
2672
2673 /* Update our cache of the exception bitmap. */
2674 pVCpu->hm.s.vmx.u32XcptBitmap = uXcptBitmap;
2675 return VINF_SUCCESS;
2676}
2677
2678
2679/**
2680 * Does per-VM VT-x initialization.
2681 *
2682 * @returns VBox status code.
2683 * @param pVM The cross context VM structure.
2684 */
2685VMMR0DECL(int) VMXR0InitVM(PVM pVM)
2686{
2687 LogFlowFunc(("pVM=%p\n", pVM));
2688
2689 int rc = hmR0VmxStructsAlloc(pVM);
2690 if (RT_FAILURE(rc))
2691 {
2692 LogRelFunc(("hmR0VmxStructsAlloc failed! rc=%Rrc\n", rc));
2693 return rc;
2694 }
2695
2696 return VINF_SUCCESS;
2697}
2698
2699
2700/**
2701 * Does per-VM VT-x termination.
2702 *
2703 * @returns VBox status code.
2704 * @param pVM The cross context VM structure.
2705 */
2706VMMR0DECL(int) VMXR0TermVM(PVM pVM)
2707{
2708 LogFlowFunc(("pVM=%p\n", pVM));
2709
2710#ifdef VBOX_WITH_CRASHDUMP_MAGIC
2711 if (pVM->hm.s.vmx.hMemObjScratch != NIL_RTR0MEMOBJ)
2712 ASMMemZero32(pVM->hm.s.vmx.pvScratch, PAGE_SIZE);
2713#endif
2714 hmR0VmxStructsFree(pVM);
2715 return VINF_SUCCESS;
2716}
2717
2718
2719/**
2720 * Sets up the VM for execution under VT-x.
2721 * This function is only called once per-VM during initialization.
2722 *
2723 * @returns VBox status code.
2724 * @param pVM The cross context VM structure.
2725 */
2726VMMR0DECL(int) VMXR0SetupVM(PVM pVM)
2727{
2728 AssertPtrReturn(pVM, VERR_INVALID_PARAMETER);
2729 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
2730
2731 LogFlowFunc(("pVM=%p\n", pVM));
2732
2733 /*
2734 * Without UnrestrictedGuest, pRealModeTSS and pNonPagingModeEPTPageTable *must* always be
2735 * allocated. We no longer support the highly unlikely case of UnrestrictedGuest without
2736 * pRealModeTSS, see hmR3InitFinalizeR0Intel().
2737 */
2738 if ( !pVM->hm.s.vmx.fUnrestrictedGuest
2739 && ( !pVM->hm.s.vmx.pNonPagingModeEPTPageTable
2740 || !pVM->hm.s.vmx.pRealModeTSS))
2741 {
2742 LogRelFunc(("Invalid real-on-v86 state.\n"));
2743 return VERR_INTERNAL_ERROR;
2744 }
2745
2746 /* Initialize these always, see hmR3InitFinalizeR0().*/
2747 pVM->hm.s.vmx.enmTlbFlushEpt = VMXTLBFLUSHEPT_NONE;
2748 pVM->hm.s.vmx.enmTlbFlushVpid = VMXTLBFLUSHVPID_NONE;
2749
2750 /* Setup the tagged-TLB flush handlers. */
2751 int rc = hmR0VmxSetupTaggedTlb(pVM);
2752 if (RT_FAILURE(rc))
2753 {
2754 LogRelFunc(("hmR0VmxSetupTaggedTlb failed! rc=%Rrc\n", rc));
2755 return rc;
2756 }
2757
2758 /* Check if we can use the VMCS controls for swapping the EFER MSR. */
2759 Assert(!pVM->hm.s.vmx.fSupportsVmcsEfer);
2760#if HC_ARCH_BITS == 64
2761 if ( (pVM->hm.s.vmx.Msrs.EntryCtls.n.allowed1 & VMX_ENTRY_CTLS_LOAD_EFER_MSR)
2762 && (pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed1 & VMX_EXIT_CTLS_LOAD_EFER_MSR)
2763 && (pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed1 & VMX_EXIT_CTLS_SAVE_EFER_MSR))
2764 {
2765 pVM->hm.s.vmx.fSupportsVmcsEfer = true;
2766 }
2767#endif
2768
2769 /* At least verify VMX is enabled, since we can't check if we're in VMX root mode without #GP'ing. */
2770 RTCCUINTREG const uHostCR4 = ASMGetCR4();
2771 if (RT_UNLIKELY(!(uHostCR4 & X86_CR4_VMXE)))
2772 return VERR_VMX_NOT_IN_VMX_ROOT_MODE;
2773
2774 for (VMCPUID i = 0; i < pVM->cCpus; i++)
2775 {
2776 PVMCPU pVCpu = &pVM->aCpus[i];
2777 AssertPtr(pVCpu);
2778 AssertPtr(pVCpu->hm.s.vmx.pvVmcs);
2779
2780 /* Log the VCPU pointers, useful for debugging SMP VMs. */
2781 Log4Func(("pVCpu=%p idCpu=%RU32\n", pVCpu, pVCpu->idCpu));
2782
2783 /* Set revision dword at the beginning of the VMCS structure. */
2784 *(uint32_t *)pVCpu->hm.s.vmx.pvVmcs = RT_BF_GET(pVM->hm.s.vmx.Msrs.u64Basic, VMX_BF_BASIC_VMCS_ID);
2785
2786 /* Set the VMCS launch state to "clear", see Intel spec. 31.6 "Preparation and launch a virtual machine". */
2787 rc = VMXClearVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
2788 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: VMXClearVmcs failed! rc=%Rrc\n", rc),
2789 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2790
2791 /* Load this VMCS as the current VMCS. */
2792 rc = VMXActivateVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
2793 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: VMXActivateVmcs failed! rc=%Rrc\n", rc),
2794 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2795
2796 rc = hmR0VmxSetupPinCtls(pVCpu);
2797 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: hmR0VmxSetupPinCtls failed! rc=%Rrc\n", rc),
2798 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2799
2800 rc = hmR0VmxSetupProcCtls(pVCpu);
2801 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: hmR0VmxSetupProcCtls failed! rc=%Rrc\n", rc),
2802 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2803
2804 rc = hmR0VmxSetupMiscCtls(pVCpu);
2805 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: hmR0VmxSetupMiscCtls failed! rc=%Rrc\n", rc),
2806 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2807
2808 rc = hmR0VmxInitXcptBitmap(pVCpu);
2809 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: hmR0VmxInitXcptBitmap failed! rc=%Rrc\n", rc),
2810 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2811
2812#if HC_ARCH_BITS == 32
2813 rc = hmR0VmxInitVmcsReadCache(pVCpu);
2814 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: hmR0VmxInitVmcsReadCache failed! rc=%Rrc\n", rc),
2815 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2816#endif
2817
2818 /* Sync any CPU internal VMCS data back into our VMCS in memory. */
2819 rc = VMXClearVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
2820 AssertLogRelMsgRCReturnStmt(rc, ("VMXR0SetupVM: VMXClearVmcs(2) failed! rc=%Rrc\n", rc),
2821 hmR0VmxUpdateErrorRecord(pVCpu, rc), rc);
2822
2823 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_CLEAR;
2824
2825 hmR0VmxUpdateErrorRecord(pVCpu, rc);
2826 }
2827
2828 return VINF_SUCCESS;
2829}
2830
2831
2832/**
2833 * Saves the host control registers (CR0, CR3, CR4) into the host-state area in
2834 * the VMCS.
2835 *
2836 * @returns VBox status code.
2837 */
2838static int hmR0VmxExportHostControlRegs(void)
2839{
2840 RTCCUINTREG uReg = ASMGetCR0();
2841 int rc = VMXWriteVmcsHstN(VMX_VMCS_HOST_CR0, uReg);
2842 AssertRCReturn(rc, rc);
2843
2844 uReg = ASMGetCR3();
2845 rc = VMXWriteVmcsHstN(VMX_VMCS_HOST_CR3, uReg);
2846 AssertRCReturn(rc, rc);
2847
2848 uReg = ASMGetCR4();
2849 rc = VMXWriteVmcsHstN(VMX_VMCS_HOST_CR4, uReg);
2850 AssertRCReturn(rc, rc);
2851 return rc;
2852}
2853
2854
2855/**
2856 * Saves the host segment registers and GDTR, IDTR, (TR, GS and FS bases) into
2857 * the host-state area in the VMCS.
2858 *
2859 * @returns VBox status code.
2860 * @param pVCpu The cross context virtual CPU structure.
2861 */
2862static int hmR0VmxExportHostSegmentRegs(PVMCPU pVCpu)
2863{
2864#if HC_ARCH_BITS == 64
2865/**
2866 * Macro for adjusting host segment selectors to satisfy VT-x's VM-entry
2867 * requirements. See hmR0VmxExportHostSegmentRegs().
2868 */
2869# define VMXLOCAL_ADJUST_HOST_SEG(seg, selValue) \
2870 if ((selValue) & (X86_SEL_RPL | X86_SEL_LDT)) \
2871 { \
2872 bool fValidSelector = true; \
2873 if ((selValue) & X86_SEL_LDT) \
2874 { \
2875 uint32_t uAttr = ASMGetSegAttr((selValue)); \
2876 fValidSelector = RT_BOOL(uAttr != UINT32_MAX && (uAttr & X86_DESC_P)); \
2877 } \
2878 if (fValidSelector) \
2879 { \
2880 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_SEL_##seg; \
2881 pVCpu->hm.s.vmx.RestoreHost.uHostSel##seg = (selValue); \
2882 } \
2883 (selValue) = 0; \
2884 }
2885
2886 /*
2887 * If we've executed guest code using VT-x, the host-state bits will be messed up. We
2888 * should -not- save the messed up state without restoring the original host-state,
2889 * see @bugref{7240}.
2890 *
2891 * This apparently can happen (most likely the FPU changes), deal with it rather than
2892 * asserting. Was observed booting Solaris 10u10 32-bit guest.
2893 */
2894 if ( (pVCpu->hm.s.vmx.fRestoreHostFlags & VMX_RESTORE_HOST_REQUIRED)
2895 && (pVCpu->hm.s.vmx.fRestoreHostFlags & ~VMX_RESTORE_HOST_REQUIRED))
2896 {
2897 Log4Func(("Restoring Host State: fRestoreHostFlags=%#RX32 HostCpuId=%u\n", pVCpu->hm.s.vmx.fRestoreHostFlags,
2898 pVCpu->idCpu));
2899 VMXRestoreHostState(pVCpu->hm.s.vmx.fRestoreHostFlags, &pVCpu->hm.s.vmx.RestoreHost);
2900 }
2901 pVCpu->hm.s.vmx.fRestoreHostFlags = 0;
2902#else
2903 RT_NOREF(pVCpu);
2904#endif
2905
2906 /*
2907 * Host DS, ES, FS and GS segment registers.
2908 */
2909#if HC_ARCH_BITS == 64
2910 RTSEL uSelDS = ASMGetDS();
2911 RTSEL uSelES = ASMGetES();
2912 RTSEL uSelFS = ASMGetFS();
2913 RTSEL uSelGS = ASMGetGS();
2914#else
2915 RTSEL uSelDS = 0;
2916 RTSEL uSelES = 0;
2917 RTSEL uSelFS = 0;
2918 RTSEL uSelGS = 0;
2919#endif
2920
2921 /*
2922 * Host CS and SS segment registers.
2923 */
2924 RTSEL uSelCS = ASMGetCS();
2925 RTSEL uSelSS = ASMGetSS();
2926
2927 /*
2928 * Host TR segment register.
2929 */
2930 RTSEL uSelTR = ASMGetTR();
2931
2932#if HC_ARCH_BITS == 64
2933 /*
2934 * Determine if the host segment registers are suitable for VT-x. Otherwise use zero to
2935 * gain VM-entry and restore them before we get preempted.
2936 *
2937 * See Intel spec. 26.2.3 "Checks on Host Segment and Descriptor-Table Registers".
2938 */
2939 VMXLOCAL_ADJUST_HOST_SEG(DS, uSelDS);
2940 VMXLOCAL_ADJUST_HOST_SEG(ES, uSelES);
2941 VMXLOCAL_ADJUST_HOST_SEG(FS, uSelFS);
2942 VMXLOCAL_ADJUST_HOST_SEG(GS, uSelGS);
2943# undef VMXLOCAL_ADJUST_HOST_SEG
2944#endif
2945
2946 /* Verification based on Intel spec. 26.2.3 "Checks on Host Segment and Descriptor-Table Registers" */
2947 Assert(!(uSelCS & X86_SEL_RPL)); Assert(!(uSelCS & X86_SEL_LDT));
2948 Assert(!(uSelSS & X86_SEL_RPL)); Assert(!(uSelSS & X86_SEL_LDT));
2949 Assert(!(uSelDS & X86_SEL_RPL)); Assert(!(uSelDS & X86_SEL_LDT));
2950 Assert(!(uSelES & X86_SEL_RPL)); Assert(!(uSelES & X86_SEL_LDT));
2951 Assert(!(uSelFS & X86_SEL_RPL)); Assert(!(uSelFS & X86_SEL_LDT));
2952 Assert(!(uSelGS & X86_SEL_RPL)); Assert(!(uSelGS & X86_SEL_LDT));
2953 Assert(!(uSelTR & X86_SEL_RPL)); Assert(!(uSelTR & X86_SEL_LDT));
2954 Assert(uSelCS);
2955 Assert(uSelTR);
2956
2957 /* Assertion is right but we would not have updated u32ExitCtls yet. */
2958#if 0
2959 if (!(pVCpu->hm.s.vmx.u32ExitCtls & VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE))
2960 Assert(uSelSS != 0);
2961#endif
2962
2963 /* Write these host selector fields into the host-state area in the VMCS. */
2964 int rc = VMXWriteVmcs32(VMX_VMCS16_HOST_CS_SEL, uSelCS);
2965 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_SS_SEL, uSelSS);
2966#if HC_ARCH_BITS == 64
2967 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_DS_SEL, uSelDS);
2968 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_ES_SEL, uSelES);
2969 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_FS_SEL, uSelFS);
2970 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_GS_SEL, uSelGS);
2971#else
2972 NOREF(uSelDS);
2973 NOREF(uSelES);
2974 NOREF(uSelFS);
2975 NOREF(uSelGS);
2976#endif
2977 rc |= VMXWriteVmcs32(VMX_VMCS16_HOST_TR_SEL, uSelTR);
2978 AssertRCReturn(rc, rc);
2979
2980 /*
2981 * Host GDTR and IDTR.
2982 */
2983 RTGDTR Gdtr;
2984 RTIDTR Idtr;
2985 RT_ZERO(Gdtr);
2986 RT_ZERO(Idtr);
2987 ASMGetGDTR(&Gdtr);
2988 ASMGetIDTR(&Idtr);
2989 rc = VMXWriteVmcsHstN(VMX_VMCS_HOST_GDTR_BASE, Gdtr.pGdt);
2990 rc |= VMXWriteVmcsHstN(VMX_VMCS_HOST_IDTR_BASE, Idtr.pIdt);
2991 AssertRCReturn(rc, rc);
2992
2993#if HC_ARCH_BITS == 64
2994 /*
2995 * Determine if we need to manually need to restore the GDTR and IDTR limits as VT-x zaps
2996 * them to the maximum limit (0xffff) on every VM-exit.
2997 */
2998 if (Gdtr.cbGdt != 0xffff)
2999 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_GDTR;
3000
3001 /*
3002 * IDT limit is effectively capped at 0xfff. (See Intel spec. 6.14.1 "64-Bit Mode IDT" and
3003 * Intel spec. 6.2 "Exception and Interrupt Vectors".) Therefore if the host has the limit
3004 * as 0xfff, VT-x bloating the limit to 0xffff shouldn't cause any different CPU behavior.
3005 * However, several hosts either insists on 0xfff being the limit (Windows Patch Guard) or
3006 * uses the limit for other purposes (darwin puts the CPU ID in there but botches sidt
3007 * alignment in at least one consumer). So, we're only allowing the IDTR.LIMIT to be left
3008 * at 0xffff on hosts where we are sure it won't cause trouble.
3009 */
3010# if defined(RT_OS_LINUX) || defined(RT_OS_SOLARIS)
3011 if (Idtr.cbIdt < 0x0fff)
3012# else
3013 if (Idtr.cbIdt != 0xffff)
3014# endif
3015 {
3016 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_IDTR;
3017 AssertCompile(sizeof(Idtr) == sizeof(X86XDTR64));
3018 memcpy(&pVCpu->hm.s.vmx.RestoreHost.HostIdtr, &Idtr, sizeof(X86XDTR64));
3019 }
3020#endif
3021
3022 /*
3023 * Host TR base. Verify that TR selector doesn't point past the GDT. Masking off the TI
3024 * and RPL bits is effectively what the CPU does for "scaling by 8". TI is always 0 and
3025 * RPL should be too in most cases.
3026 */
3027 AssertMsgReturn((uSelTR | X86_SEL_RPL_LDT) <= Gdtr.cbGdt,
3028 ("TR selector exceeds limit. TR=%RTsel cbGdt=%#x\n", uSelTR, Gdtr.cbGdt), VERR_VMX_INVALID_HOST_STATE);
3029
3030 PCX86DESCHC pDesc = (PCX86DESCHC)(Gdtr.pGdt + (uSelTR & X86_SEL_MASK));
3031#if HC_ARCH_BITS == 64
3032 uintptr_t uTRBase = X86DESC64_BASE(pDesc);
3033
3034 /*
3035 * VT-x unconditionally restores the TR limit to 0x67 and type to 11 (32-bit busy TSS) on
3036 * all VM-exits. The type is the same for 64-bit busy TSS[1]. The limit needs manual
3037 * restoration if the host has something else. Task switching is not supported in 64-bit
3038 * mode[2], but the limit still matters as IOPM is supported in 64-bit mode. Restoring the
3039 * limit lazily while returning to ring-3 is safe because IOPM is not applicable in ring-0.
3040 *
3041 * [1] See Intel spec. 3.5 "System Descriptor Types".
3042 * [2] See Intel spec. 7.2.3 "TSS Descriptor in 64-bit mode".
3043 */
3044 PVM pVM = pVCpu->CTX_SUFF(pVM);
3045 Assert(pDesc->System.u4Type == 11);
3046 if ( pDesc->System.u16LimitLow != 0x67
3047 || pDesc->System.u4LimitHigh)
3048 {
3049 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_SEL_TR;
3050 /* If the host has made GDT read-only, we would need to temporarily toggle CR0.WP before writing the GDT. */
3051 if (pVM->hm.s.fHostKernelFeatures & SUPKERNELFEATURES_GDT_READ_ONLY)
3052 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_GDT_READ_ONLY;
3053 pVCpu->hm.s.vmx.RestoreHost.uHostSelTR = uSelTR;
3054 }
3055
3056 /*
3057 * Store the GDTR as we need it when restoring the GDT and while restoring the TR.
3058 */
3059 if (pVCpu->hm.s.vmx.fRestoreHostFlags & (VMX_RESTORE_HOST_GDTR | VMX_RESTORE_HOST_SEL_TR))
3060 {
3061 AssertCompile(sizeof(Gdtr) == sizeof(X86XDTR64));
3062 memcpy(&pVCpu->hm.s.vmx.RestoreHost.HostGdtr, &Gdtr, sizeof(X86XDTR64));
3063 if (pVM->hm.s.fHostKernelFeatures & SUPKERNELFEATURES_GDT_NEED_WRITABLE)
3064 {
3065 /* The GDT is read-only but the writable GDT is available. */
3066 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_GDT_NEED_WRITABLE;
3067 pVCpu->hm.s.vmx.RestoreHost.HostGdtrRw.cb = Gdtr.cbGdt;
3068 rc = SUPR0GetCurrentGdtRw(&pVCpu->hm.s.vmx.RestoreHost.HostGdtrRw.uAddr);
3069 AssertRCReturn(rc, rc);
3070 }
3071 }
3072#else
3073 uintptr_t uTRBase = X86DESC_BASE(pDesc);
3074#endif
3075 rc = VMXWriteVmcsHstN(VMX_VMCS_HOST_TR_BASE, uTRBase);
3076 AssertRCReturn(rc, rc);
3077
3078 /*
3079 * Host FS base and GS base.
3080 */
3081#if HC_ARCH_BITS == 64
3082 uint64_t u64FSBase = ASMRdMsr(MSR_K8_FS_BASE);
3083 uint64_t u64GSBase = ASMRdMsr(MSR_K8_GS_BASE);
3084 rc = VMXWriteVmcs64(VMX_VMCS_HOST_FS_BASE, u64FSBase);
3085 rc |= VMXWriteVmcs64(VMX_VMCS_HOST_GS_BASE, u64GSBase);
3086 AssertRCReturn(rc, rc);
3087
3088 /* Store the base if we have to restore FS or GS manually as we need to restore the base as well. */
3089 if (pVCpu->hm.s.vmx.fRestoreHostFlags & VMX_RESTORE_HOST_SEL_FS)
3090 pVCpu->hm.s.vmx.RestoreHost.uHostFSBase = u64FSBase;
3091 if (pVCpu->hm.s.vmx.fRestoreHostFlags & VMX_RESTORE_HOST_SEL_GS)
3092 pVCpu->hm.s.vmx.RestoreHost.uHostGSBase = u64GSBase;
3093#endif
3094 return VINF_SUCCESS;
3095}
3096
3097
3098/**
3099 * Exports certain host MSRs in the VM-exit MSR-load area and some in the
3100 * host-state area of the VMCS.
3101 *
3102 * Theses MSRs will be automatically restored on the host after every successful
3103 * VM-exit.
3104 *
3105 * @returns VBox status code.
3106 * @param pVCpu The cross context virtual CPU structure.
3107 *
3108 * @remarks No-long-jump zone!!!
3109 */
3110static int hmR0VmxExportHostMsrs(PVMCPU pVCpu)
3111{
3112 AssertPtr(pVCpu);
3113 AssertPtr(pVCpu->hm.s.vmx.pvHostMsr);
3114
3115 /*
3116 * Save MSRs that we restore lazily (due to preemption or transition to ring-3)
3117 * rather than swapping them on every VM-entry.
3118 */
3119 hmR0VmxLazySaveHostMsrs(pVCpu);
3120
3121 /*
3122 * Host Sysenter MSRs.
3123 */
3124 int rc = VMXWriteVmcs32(VMX_VMCS32_HOST_SYSENTER_CS, ASMRdMsr_Low(MSR_IA32_SYSENTER_CS));
3125#if HC_ARCH_BITS == 32
3126 rc |= VMXWriteVmcs32(VMX_VMCS_HOST_SYSENTER_ESP, ASMRdMsr_Low(MSR_IA32_SYSENTER_ESP));
3127 rc |= VMXWriteVmcs32(VMX_VMCS_HOST_SYSENTER_EIP, ASMRdMsr_Low(MSR_IA32_SYSENTER_EIP));
3128#else
3129 rc |= VMXWriteVmcs64(VMX_VMCS_HOST_SYSENTER_ESP, ASMRdMsr(MSR_IA32_SYSENTER_ESP));
3130 rc |= VMXWriteVmcs64(VMX_VMCS_HOST_SYSENTER_EIP, ASMRdMsr(MSR_IA32_SYSENTER_EIP));
3131#endif
3132 AssertRCReturn(rc, rc);
3133
3134 /*
3135 * Host EFER MSR.
3136 *
3137 * If the CPU supports the newer VMCS controls for managing EFER, use it. Otherwise it's
3138 * done as part of auto-load/store MSR area in the VMCS, see hmR0VmxExportGuestMsrs().
3139 */
3140 PVM pVM = pVCpu->CTX_SUFF(pVM);
3141 if (pVM->hm.s.vmx.fSupportsVmcsEfer)
3142 {
3143 rc = VMXWriteVmcs64(VMX_VMCS64_HOST_EFER_FULL, pVM->hm.s.vmx.u64HostEfer);
3144 AssertRCReturn(rc, rc);
3145 }
3146
3147 /** @todo IA32_PERF_GLOBALCTRL, IA32_PAT also see hmR0VmxExportGuestExitCtls(). */
3148
3149 return VINF_SUCCESS;
3150}
3151
3152
3153/**
3154 * Figures out if we need to swap the EFER MSR which is particularly expensive.
3155 *
3156 * We check all relevant bits. For now, that's everything besides LMA/LME, as
3157 * these two bits are handled by VM-entry, see hmR0VmxExportGuestExitCtls() and
3158 * hmR0VMxExportGuestEntryCtls().
3159 *
3160 * @returns true if we need to load guest EFER, false otherwise.
3161 * @param pVCpu The cross context virtual CPU structure.
3162 *
3163 * @remarks Requires EFER, CR4.
3164 * @remarks No-long-jump zone!!!
3165 */
3166static bool hmR0VmxShouldSwapEferMsr(PVMCPU pVCpu)
3167{
3168#ifdef HMVMX_ALWAYS_SWAP_EFER
3169 RT_NOREF(pVCpu);
3170 return true;
3171#else
3172
3173 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
3174#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
3175 /* For 32-bit hosts running 64-bit guests, we always swap EFER in the world-switcher. Nothing to do here. */
3176 if (CPUMIsGuestInLongModeEx(pCtx))
3177 return false;
3178#endif
3179
3180 PVM pVM = pVCpu->CTX_SUFF(pVM);
3181 uint64_t const u64HostEfer = pVM->hm.s.vmx.u64HostEfer;
3182 uint64_t const u64GuestEfer = pCtx->msrEFER;
3183
3184 /*
3185 * For 64-bit guests, if EFER.SCE bit differs, we need to swap EFER to ensure that the
3186 * guest's SYSCALL behaviour isn't broken, see @bugref{7386}.
3187 */
3188 if ( CPUMIsGuestInLongModeEx(pCtx)
3189 && (u64GuestEfer & MSR_K6_EFER_SCE) != (u64HostEfer & MSR_K6_EFER_SCE))
3190 {
3191 return true;
3192 }
3193
3194 /*
3195 * If the guest uses PAE and EFER.NXE bit differs, we need to swap EFER as it
3196 * affects guest paging. 64-bit paging implies CR4.PAE as well.
3197 * See Intel spec. 4.5 "IA-32e Paging" and Intel spec. 4.1.1 "Three Paging Modes".
3198 */
3199 if ( (pCtx->cr4 & X86_CR4_PAE)
3200 && (pCtx->cr0 & X86_CR0_PG)
3201 && (u64GuestEfer & MSR_K6_EFER_NXE) != (u64HostEfer & MSR_K6_EFER_NXE))
3202 {
3203 /* Assert that host is NX capable. */
3204 Assert(pVCpu->CTX_SUFF(pVM)->cpum.ro.HostFeatures.fNoExecute);
3205 return true;
3206 }
3207
3208 return false;
3209#endif
3210}
3211
3212
3213/**
3214 * Exports the guest state with appropriate VM-entry controls in the VMCS.
3215 *
3216 * These controls can affect things done on VM-exit; e.g. "load debug controls",
3217 * see Intel spec. 24.8.1 "VM-entry controls".
3218 *
3219 * @returns VBox status code.
3220 * @param pVCpu The cross context virtual CPU structure.
3221 *
3222 * @remarks Requires EFER.
3223 * @remarks No-long-jump zone!!!
3224 */
3225static int hmR0VmxExportGuestEntryCtls(PVMCPU pVCpu)
3226{
3227 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_VMX_ENTRY_CTLS)
3228 {
3229 PVM pVM = pVCpu->CTX_SUFF(pVM);
3230 uint32_t fVal = pVM->hm.s.vmx.Msrs.EntryCtls.n.allowed0; /* Bits set here must be set in the VMCS. */
3231 uint32_t const fZap = pVM->hm.s.vmx.Msrs.EntryCtls.n.allowed1; /* Bits cleared here must be cleared in the VMCS. */
3232
3233 /* Load debug controls (DR7 & IA32_DEBUGCTL_MSR). The first VT-x capable CPUs only supports the 1-setting of this bit. */
3234 fVal |= VMX_ENTRY_CTLS_LOAD_DEBUG;
3235
3236 /* Set if the guest is in long mode. This will set/clear the EFER.LMA bit on VM-entry. */
3237 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx))
3238 {
3239 fVal |= VMX_ENTRY_CTLS_IA32E_MODE_GUEST;
3240 Log4Func(("VMX_ENTRY_CTLS_IA32E_MODE_GUEST\n"));
3241 }
3242 else
3243 Assert(!(fVal & VMX_ENTRY_CTLS_IA32E_MODE_GUEST));
3244
3245 /* If the CPU supports the newer VMCS controls for managing guest/host EFER, use it. */
3246 if ( pVM->hm.s.vmx.fSupportsVmcsEfer
3247 && hmR0VmxShouldSwapEferMsr(pVCpu))
3248 {
3249 fVal |= VMX_ENTRY_CTLS_LOAD_EFER_MSR;
3250 Log4Func(("VMX_ENTRY_CTLS_LOAD_EFER_MSR\n"));
3251 }
3252
3253 /*
3254 * The following should -not- be set (since we're not in SMM mode):
3255 * - VMX_ENTRY_CTLS_ENTRY_TO_SMM
3256 * - VMX_ENTRY_CTLS_DEACTIVATE_DUAL_MON
3257 */
3258
3259 /** @todo VMX_ENTRY_CTLS_LOAD_PERF_MSR,
3260 * VMX_ENTRY_CTLS_LOAD_PAT_MSR. */
3261
3262 if ((fVal & fZap) != fVal)
3263 {
3264 Log4Func(("Invalid VM-entry controls combo! Cpu=%#RX32 fVal=%#RX32 fZap=%#RX32\n",
3265 pVM->hm.s.vmx.Msrs.EntryCtls.n.allowed0, fVal, fZap));
3266 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_ENTRY;
3267 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
3268 }
3269
3270 /* Commit it to the VMCS and update our cache. */
3271 if (pVCpu->hm.s.vmx.u32EntryCtls != fVal)
3272 {
3273 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY, fVal);
3274 AssertRCReturn(rc, rc);
3275 pVCpu->hm.s.vmx.u32EntryCtls = fVal;
3276 }
3277
3278 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_VMX_ENTRY_CTLS);
3279 }
3280 return VINF_SUCCESS;
3281}
3282
3283
3284/**
3285 * Exports the guest state with appropriate VM-exit controls in the VMCS.
3286 *
3287 * @returns VBox status code.
3288 * @param pVCpu The cross context virtual CPU structure.
3289 *
3290 * @remarks Requires EFER.
3291 */
3292static int hmR0VmxExportGuestExitCtls(PVMCPU pVCpu)
3293{
3294 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_VMX_EXIT_CTLS)
3295 {
3296 PVM pVM = pVCpu->CTX_SUFF(pVM);
3297 uint32_t fVal = pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed0; /* Bits set here must be set in the VMCS. */
3298 uint32_t const fZap = pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed1; /* Bits cleared here must be cleared in the VMCS. */
3299
3300 /* Save debug controls (DR7 & IA32_DEBUGCTL_MSR). The first VT-x CPUs only supported the 1-setting of this bit. */
3301 fVal |= VMX_EXIT_CTLS_SAVE_DEBUG;
3302
3303 /*
3304 * Set the host long mode active (EFER.LMA) bit (which Intel calls "Host address-space size") if necessary.
3305 * On VM-exit, VT-x sets both the host EFER.LMA and EFER.LME bit to this value. See assertion in
3306 * hmR0VmxExportHostMsrs().
3307 */
3308#if HC_ARCH_BITS == 64
3309 fVal |= VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE;
3310 Log4Func(("VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE\n"));
3311#else
3312 Assert( pVCpu->hm.s.vmx.pfnStartVM == VMXR0SwitcherStartVM64
3313 || pVCpu->hm.s.vmx.pfnStartVM == VMXR0StartVM32);
3314 /* Set the host address-space size based on the switcher, not guest state. See @bugref{8432}. */
3315 if (pVCpu->hm.s.vmx.pfnStartVM == VMXR0SwitcherStartVM64)
3316 {
3317 /* The switcher returns to long mode, EFER is managed by the switcher. */
3318 fVal |= VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE;
3319 Log4Func(("VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE\n"));
3320 }
3321 else
3322 Assert(!(fVal & VMX_EXIT_CTLS_HOST_ADDR_SPACE_SIZE));
3323#endif
3324
3325 /* If the newer VMCS fields for managing EFER exists, use it. */
3326 if ( pVM->hm.s.vmx.fSupportsVmcsEfer
3327 && hmR0VmxShouldSwapEferMsr(pVCpu))
3328 {
3329 fVal |= VMX_EXIT_CTLS_SAVE_EFER_MSR
3330 | VMX_EXIT_CTLS_LOAD_EFER_MSR;
3331 Log4Func(("VMX_EXIT_CTLS_SAVE_EFER_MSR and VMX_EXIT_CTLS_LOAD_EFER_MSR\n"));
3332 }
3333
3334 /* Don't acknowledge external interrupts on VM-exit. We want to let the host do that. */
3335 Assert(!(fVal & VMX_EXIT_CTLS_ACK_EXT_INT));
3336
3337 /** @todo VMX_EXIT_CTLS_LOAD_PERF_MSR,
3338 * VMX_EXIT_CTLS_SAVE_PAT_MSR,
3339 * VMX_EXIT_CTLS_LOAD_PAT_MSR. */
3340
3341 /* Enable saving of the VMX preemption timer value on VM-exit. */
3342 if ( pVM->hm.s.vmx.fUsePreemptTimer
3343 && (pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed1 & VMX_EXIT_CTLS_SAVE_PREEMPT_TIMER))
3344 fVal |= VMX_EXIT_CTLS_SAVE_PREEMPT_TIMER;
3345
3346 if ((fVal & fZap) != fVal)
3347 {
3348 LogRelFunc(("Invalid VM-exit controls combo! cpu=%#RX32 fVal=%#RX32 fZap=%R#X32\n",
3349 pVM->hm.s.vmx.Msrs.ExitCtls.n.allowed0, fVal, fZap));
3350 pVCpu->hm.s.u32HMError = VMX_UFC_CTRL_EXIT;
3351 return VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO;
3352 }
3353
3354 /* Commit it to the VMCS and update our cache. */
3355 if (pVCpu->hm.s.vmx.u32ExitCtls != fVal)
3356 {
3357 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_EXIT, fVal);
3358 AssertRCReturn(rc, rc);
3359 pVCpu->hm.s.vmx.u32ExitCtls = fVal;
3360 }
3361
3362 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_VMX_EXIT_CTLS);
3363 }
3364 return VINF_SUCCESS;
3365}
3366
3367
3368/**
3369 * Sets the TPR threshold in the VMCS.
3370 *
3371 * @returns VBox status code.
3372 * @param pVCpu The cross context virtual CPU structure.
3373 * @param u32TprThreshold The TPR threshold (task-priority class only).
3374 */
3375DECLINLINE(int) hmR0VmxApicSetTprThreshold(PVMCPU pVCpu, uint32_t u32TprThreshold)
3376{
3377 Assert(!(u32TprThreshold & ~VMX_TPR_THRESHOLD_MASK)); /* Bits 31:4 MBZ. */
3378 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW); RT_NOREF_PV(pVCpu);
3379 return VMXWriteVmcs32(VMX_VMCS32_CTRL_TPR_THRESHOLD, u32TprThreshold);
3380}
3381
3382
3383/**
3384 * Exports the guest APIC TPR state into the VMCS.
3385 *
3386 * @returns VBox status code.
3387 * @param pVCpu The cross context virtual CPU structure.
3388 *
3389 * @remarks No-long-jump zone!!!
3390 */
3391static int hmR0VmxExportGuestApicTpr(PVMCPU pVCpu)
3392{
3393 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_APIC_TPR)
3394 {
3395 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_APIC_TPR);
3396
3397 if ( PDMHasApic(pVCpu->CTX_SUFF(pVM))
3398 && APICIsEnabled(pVCpu))
3399 {
3400 /*
3401 * Setup TPR shadowing.
3402 */
3403 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW)
3404 {
3405 Assert(pVCpu->hm.s.vmx.HCPhysVirtApic);
3406
3407 bool fPendingIntr = false;
3408 uint8_t u8Tpr = 0;
3409 uint8_t u8PendingIntr = 0;
3410 int rc = APICGetTpr(pVCpu, &u8Tpr, &fPendingIntr, &u8PendingIntr);
3411 AssertRCReturn(rc, rc);
3412
3413 /*
3414 * If there are interrupts pending but masked by the TPR, instruct VT-x to
3415 * cause a TPR-below-threshold VM-exit when the guest lowers its TPR below the
3416 * priority of the pending interrupt so we can deliver the interrupt. If there
3417 * are no interrupts pending, set threshold to 0 to not cause any
3418 * TPR-below-threshold VM-exits.
3419 */
3420 pVCpu->hm.s.vmx.pbVirtApic[XAPIC_OFF_TPR] = u8Tpr;
3421 uint32_t u32TprThreshold = 0;
3422 if (fPendingIntr)
3423 {
3424 /* Bits 3:0 of the TPR threshold field correspond to bits 7:4 of the TPR (which is the Task-Priority Class). */
3425 const uint8_t u8PendingPriority = u8PendingIntr >> 4;
3426 const uint8_t u8TprPriority = u8Tpr >> 4;
3427 if (u8PendingPriority <= u8TprPriority)
3428 u32TprThreshold = u8PendingPriority;
3429 }
3430
3431 rc = hmR0VmxApicSetTprThreshold(pVCpu, u32TprThreshold);
3432 AssertRCReturn(rc, rc);
3433 }
3434 }
3435 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_APIC_TPR);
3436 }
3437 return VINF_SUCCESS;
3438}
3439
3440
3441/**
3442 * Gets the guest's interruptibility-state ("interrupt shadow" as AMD calls it).
3443 *
3444 * @returns Guest's interruptibility-state.
3445 * @param pVCpu The cross context virtual CPU structure.
3446 *
3447 * @remarks No-long-jump zone!!!
3448 */
3449static uint32_t hmR0VmxGetGuestIntrState(PVMCPU pVCpu)
3450{
3451 /*
3452 * Check if we should inhibit interrupt delivery due to instructions like STI and MOV SS.
3453 */
3454 uint32_t fIntrState = 0;
3455 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
3456 {
3457 /* If inhibition is active, RIP & RFLAGS should've been accessed
3458 (i.e. read previously from the VMCS or from ring-3). */
3459 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
3460#ifdef VBOX_STRICT
3461 uint64_t const fExtrn = ASMAtomicUoReadU64(&pCtx->fExtrn);
3462 AssertMsg(!(fExtrn & (CPUMCTX_EXTRN_RIP | CPUMCTX_EXTRN_RFLAGS)), ("%#x\n", fExtrn));
3463#endif
3464 if (pCtx->rip == EMGetInhibitInterruptsPC(pVCpu))
3465 {
3466 if (pCtx->eflags.Bits.u1IF)
3467 fIntrState = VMX_VMCS_GUEST_INT_STATE_BLOCK_STI;
3468 else
3469 fIntrState = VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS;
3470 }
3471 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
3472 {
3473 /*
3474 * We can clear the inhibit force flag as even if we go back to the recompiler
3475 * without executing guest code in VT-x, the flag's condition to be cleared is
3476 * met and thus the cleared state is correct.
3477 */
3478 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
3479 }
3480 }
3481
3482 /*
3483 * NMIs to the guest are blocked after an NMI is injected until the guest executes an IRET. We only
3484 * bother with virtual-NMI blocking when we have support for virtual NMIs in the CPU, otherwise
3485 * setting this would block host-NMIs and IRET will not clear the blocking.
3486 *
3487 * See Intel spec. 26.6.1 "Interruptibility state". See @bugref{7445}.
3488 */
3489 if ( VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS)
3490 && (pVCpu->hm.s.vmx.u32PinCtls & VMX_PIN_CTLS_VIRT_NMI))
3491 {
3492 fIntrState |= VMX_VMCS_GUEST_INT_STATE_BLOCK_NMI;
3493 }
3494
3495 return fIntrState;
3496}
3497
3498
3499/**
3500 * Exports the exception intercepts required for guest execution in the VMCS.
3501 *
3502 * @returns VBox status code.
3503 * @param pVCpu The cross context virtual CPU structure.
3504 *
3505 * @remarks No-long-jump zone!!!
3506 */
3507static int hmR0VmxExportGuestXcptIntercepts(PVMCPU pVCpu)
3508{
3509 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_VMX_GUEST_XCPT_INTERCEPTS)
3510 {
3511 uint32_t uXcptBitmap = pVCpu->hm.s.vmx.u32XcptBitmap;
3512
3513 /* The remaining exception intercepts are handled elsewhere, e.g. in hmR0VmxExportSharedCR0(). */
3514 if (pVCpu->hm.s.fGIMTrapXcptUD)
3515 uXcptBitmap |= RT_BIT(X86_XCPT_UD);
3516#ifndef HMVMX_ALWAYS_TRAP_ALL_XCPTS
3517 else
3518 uXcptBitmap &= ~RT_BIT(X86_XCPT_UD);
3519#endif
3520
3521 Assert(uXcptBitmap & RT_BIT_32(X86_XCPT_AC));
3522 Assert(uXcptBitmap & RT_BIT_32(X86_XCPT_DB));
3523
3524 if (uXcptBitmap != pVCpu->hm.s.vmx.u32XcptBitmap)
3525 {
3526 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, uXcptBitmap);
3527 AssertRCReturn(rc, rc);
3528 pVCpu->hm.s.vmx.u32XcptBitmap = uXcptBitmap;
3529 }
3530
3531 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_VMX_GUEST_XCPT_INTERCEPTS);
3532 Log4Func(("VMX_VMCS32_CTRL_EXCEPTION_BITMAP=%#RX64\n", uXcptBitmap));
3533 }
3534 return VINF_SUCCESS;
3535}
3536
3537
3538/**
3539 * Exports the guest's RIP into the guest-state area in the VMCS.
3540 *
3541 * @returns VBox status code.
3542 * @param pVCpu The cross context virtual CPU structure.
3543 *
3544 * @remarks No-long-jump zone!!!
3545 */
3546static int hmR0VmxExportGuestRip(PVMCPU pVCpu)
3547{
3548 int rc = VINF_SUCCESS;
3549 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_RIP)
3550 {
3551 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_RIP);
3552
3553 rc = VMXWriteVmcsGstN(VMX_VMCS_GUEST_RIP, pVCpu->cpum.GstCtx.rip);
3554 AssertRCReturn(rc, rc);
3555
3556 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_RIP);
3557 Log4Func(("RIP=%#RX64\n", pVCpu->cpum.GstCtx.rip));
3558 }
3559 return rc;
3560}
3561
3562
3563/**
3564 * Exports the guest's RSP into the guest-state area in the VMCS.
3565 *
3566 * @returns VBox status code.
3567 * @param pVCpu The cross context virtual CPU structure.
3568 *
3569 * @remarks No-long-jump zone!!!
3570 */
3571static int hmR0VmxExportGuestRsp(PVMCPU pVCpu)
3572{
3573 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_RSP)
3574 {
3575 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_RSP);
3576
3577 int rc = VMXWriteVmcsGstN(VMX_VMCS_GUEST_RSP, pVCpu->cpum.GstCtx.rsp);
3578 AssertRCReturn(rc, rc);
3579
3580 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_RSP);
3581 }
3582 return VINF_SUCCESS;
3583}
3584
3585
3586/**
3587 * Exports the guest's RFLAGS into the guest-state area in the VMCS.
3588 *
3589 * @returns VBox status code.
3590 * @param pVCpu The cross context virtual CPU structure.
3591 *
3592 * @remarks No-long-jump zone!!!
3593 */
3594static int hmR0VmxExportGuestRflags(PVMCPU pVCpu)
3595{
3596 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_RFLAGS)
3597 {
3598 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_RFLAGS);
3599
3600 /* Intel spec. 2.3.1 "System Flags and Fields in IA-32e Mode" claims the upper 32-bits of RFLAGS are reserved (MBZ).
3601 Let us assert it as such and use 32-bit VMWRITE. */
3602 Assert(!RT_HI_U32(pVCpu->cpum.GstCtx.rflags.u64));
3603 X86EFLAGS fEFlags = pVCpu->cpum.GstCtx.eflags;
3604 Assert(fEFlags.u32 & X86_EFL_RA1_MASK);
3605 Assert(!(fEFlags.u32 & ~(X86_EFL_1 | X86_EFL_LIVE_MASK)));
3606
3607 /*
3608 * If we're emulating real-mode using Virtual 8086 mode, save the real-mode eflags so
3609 * we can restore them on VM-exit. Modify the real-mode guest's eflags so that VT-x
3610 * can run the real-mode guest code under Virtual 8086 mode.
3611 */
3612 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
3613 {
3614 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.pRealModeTSS);
3615 Assert(PDMVmmDevHeapIsEnabled(pVCpu->CTX_SUFF(pVM)));
3616 pVCpu->hm.s.vmx.RealMode.Eflags.u32 = fEFlags.u32; /* Save the original eflags of the real-mode guest. */
3617 fEFlags.Bits.u1VM = 1; /* Set the Virtual 8086 mode bit. */
3618 fEFlags.Bits.u2IOPL = 0; /* Change IOPL to 0, otherwise certain instructions won't fault. */
3619 }
3620
3621 int rc = VMXWriteVmcs32(VMX_VMCS_GUEST_RFLAGS, fEFlags.u32);
3622 AssertRCReturn(rc, rc);
3623
3624 /*
3625 * Setup pending debug exceptions if the guest is single-stepping using EFLAGS.TF.
3626 *
3627 * We must avoid setting any automatic debug exceptions delivery when single-stepping
3628 * through the hypervisor debugger using EFLAGS.TF.
3629 */
3630 if ( !pVCpu->hm.s.fSingleInstruction
3631 && fEFlags.Bits.u1TF)
3632 {
3633 /** @todo r=ramshankar: Warning! We ASSUME EFLAGS.TF will not cleared on
3634 * premature trips to ring-3 esp since IEM does not yet handle it. */
3635 rc = VMXWriteVmcs32(VMX_VMCS_GUEST_PENDING_DEBUG_XCPTS, VMX_VMCS_GUEST_PENDING_DEBUG_XCPT_BS);
3636 AssertRCReturn(rc, rc);
3637 }
3638
3639 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_RFLAGS);
3640 Log4Func(("EFlags=%#RX32\n", fEFlags.u32));
3641 }
3642 return VINF_SUCCESS;
3643}
3644
3645
3646/**
3647 * Exports the guest CR0 control register into the guest-state area in the VMCS.
3648 *
3649 * The guest FPU state is always pre-loaded hence we don't need to bother about
3650 * sharing FPU related CR0 bits between the guest and host.
3651 *
3652 * @returns VBox status code.
3653 * @param pVCpu The cross context virtual CPU structure.
3654 *
3655 * @remarks No-long-jump zone!!!
3656 */
3657static int hmR0VmxExportGuestCR0(PVMCPU pVCpu)
3658{
3659 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_CR0)
3660 {
3661 PVM pVM = pVCpu->CTX_SUFF(pVM);
3662 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_CR0);
3663 Assert(!RT_HI_U32(pVCpu->cpum.GstCtx.cr0));
3664
3665 uint32_t const u32ShadowCr0 = pVCpu->cpum.GstCtx.cr0;
3666 uint32_t u32GuestCr0 = pVCpu->cpum.GstCtx.cr0;
3667
3668 /*
3669 * Setup VT-x's view of the guest CR0.
3670 * Minimize VM-exits due to CR3 changes when we have NestedPaging.
3671 */
3672 uint32_t uProcCtls = pVCpu->hm.s.vmx.u32ProcCtls;
3673 if (pVM->hm.s.fNestedPaging)
3674 {
3675 if (CPUMIsGuestPagingEnabled(pVCpu))
3676 {
3677 /* The guest has paging enabled, let it access CR3 without causing a VM-exit if supported. */
3678 uProcCtls &= ~( VMX_PROC_CTLS_CR3_LOAD_EXIT
3679 | VMX_PROC_CTLS_CR3_STORE_EXIT);
3680 }
3681 else
3682 {
3683 /* The guest doesn't have paging enabled, make CR3 access cause a VM-exit to update our shadow. */
3684 uProcCtls |= VMX_PROC_CTLS_CR3_LOAD_EXIT
3685 | VMX_PROC_CTLS_CR3_STORE_EXIT;
3686 }
3687
3688 /* If we have unrestricted guest execution, we never have to intercept CR3 reads. */
3689 if (pVM->hm.s.vmx.fUnrestrictedGuest)
3690 uProcCtls &= ~VMX_PROC_CTLS_CR3_STORE_EXIT;
3691 }
3692 else
3693 {
3694 /* Guest CPL 0 writes to its read-only pages should cause a #PF VM-exit. */
3695 u32GuestCr0 |= X86_CR0_WP;
3696 }
3697
3698 /*
3699 * Guest FPU bits.
3700 *
3701 * Since we pre-load the guest FPU always before VM-entry there is no need to track lazy state
3702 * using CR0.TS.
3703 *
3704 * Intel spec. 23.8 "Restrictions on VMX operation" mentions that CR0.NE bit must always be
3705 * set on the first CPUs to support VT-x and no mention of with regards to UX in VM-entry checks.
3706 */
3707 u32GuestCr0 |= X86_CR0_NE;
3708
3709 /* If CR0.NE isn't set, we need to intercept #MF exceptions and report them to the guest differently. */
3710 bool const fInterceptMF = !(u32ShadowCr0 & X86_CR0_NE);
3711
3712 /*
3713 * Update exception intercepts.
3714 */
3715 uint32_t uXcptBitmap = pVCpu->hm.s.vmx.u32XcptBitmap;
3716 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
3717 {
3718 Assert(PDMVmmDevHeapIsEnabled(pVM));
3719 Assert(pVM->hm.s.vmx.pRealModeTSS);
3720 uXcptBitmap |= HMVMX_REAL_MODE_XCPT_MASK;
3721 }
3722 else
3723 {
3724 /* For now, cleared here as mode-switches can happen outside HM/VT-x. See @bugref{7626#c11}. */
3725 uXcptBitmap &= ~HMVMX_REAL_MODE_XCPT_MASK;
3726 if (fInterceptMF)
3727 uXcptBitmap |= RT_BIT(X86_XCPT_MF);
3728 }
3729
3730 /* Additional intercepts for debugging, define these yourself explicitly. */
3731#ifdef HMVMX_ALWAYS_TRAP_ALL_XCPTS
3732 uXcptBitmap |= 0
3733 | RT_BIT(X86_XCPT_BP)
3734 | RT_BIT(X86_XCPT_DE)
3735 | RT_BIT(X86_XCPT_NM)
3736 | RT_BIT(X86_XCPT_TS)
3737 | RT_BIT(X86_XCPT_UD)
3738 | RT_BIT(X86_XCPT_NP)
3739 | RT_BIT(X86_XCPT_SS)
3740 | RT_BIT(X86_XCPT_GP)
3741 | RT_BIT(X86_XCPT_PF)
3742 | RT_BIT(X86_XCPT_MF)
3743 ;
3744#elif defined(HMVMX_ALWAYS_TRAP_PF)
3745 uXcptBitmap |= RT_BIT(X86_XCPT_PF);
3746#endif
3747 if (pVCpu->hm.s.fTrapXcptGpForLovelyMesaDrv)
3748 uXcptBitmap |= RT_BIT(X86_XCPT_GP);
3749 Assert(pVM->hm.s.fNestedPaging || (uXcptBitmap & RT_BIT(X86_XCPT_PF)));
3750
3751 /*
3752 * Set/clear the CR0 specific bits along with their exceptions (PE, PG, CD, NW).
3753 */
3754 uint32_t fSetCr0 = (uint32_t)(pVM->hm.s.vmx.Msrs.u64Cr0Fixed0 & pVM->hm.s.vmx.Msrs.u64Cr0Fixed1);
3755 uint32_t fZapCr0 = (uint32_t)(pVM->hm.s.vmx.Msrs.u64Cr0Fixed0 | pVM->hm.s.vmx.Msrs.u64Cr0Fixed1);
3756 if (pVM->hm.s.vmx.fUnrestrictedGuest) /* Exceptions for unrestricted-guests for fixed CR0 bits (PE, PG). */
3757 fSetCr0 &= ~(X86_CR0_PE | X86_CR0_PG);
3758 else
3759 Assert((fSetCr0 & (X86_CR0_PE | X86_CR0_PG)) == (X86_CR0_PE | X86_CR0_PG));
3760
3761 u32GuestCr0 |= fSetCr0;
3762 u32GuestCr0 &= fZapCr0;
3763 u32GuestCr0 &= ~(X86_CR0_CD | X86_CR0_NW); /* Always enable caching. */
3764
3765 /*
3766 * CR0 is shared between host and guest along with a CR0 read shadow. Therefore, certain bits must not be changed
3767 * by the guest because VT-x ignores saving/restoring them (namely CD, ET, NW) and for certain other bits
3768 * we want to be notified immediately of guest CR0 changes (e.g. PG to update our shadow page tables).
3769 */
3770 uint32_t u32Cr0Mask = X86_CR0_PE
3771 | X86_CR0_NE
3772 | (pVM->hm.s.fNestedPaging ? 0 : X86_CR0_WP)
3773 | X86_CR0_PG
3774 | X86_CR0_ET /* Bit ignored on VM-entry and VM-exit. Don't let the guest modify the host CR0.ET */
3775 | X86_CR0_CD /* Bit ignored on VM-entry and VM-exit. Don't let the guest modify the host CR0.CD */
3776 | X86_CR0_NW; /* Bit ignored on VM-entry and VM-exit. Don't let the guest modify the host CR0.NW */
3777
3778 /** @todo Avoid intercepting CR0.PE with unrestricted guests. Fix PGM
3779 * enmGuestMode to be in-sync with the current mode. See @bugref{6398}
3780 * and @bugref{6944}. */
3781#if 0
3782 if (pVM->hm.s.vmx.fUnrestrictedGuest)
3783 u32Cr0Mask &= ~X86_CR0_PE;
3784#endif
3785 /*
3786 * Finally, update VMCS fields with the CR0 values and the exception bitmap.
3787 */
3788 int rc = VMXWriteVmcs32(VMX_VMCS_GUEST_CR0, u32GuestCr0);
3789 rc |= VMXWriteVmcs32(VMX_VMCS_CTRL_CR0_READ_SHADOW, u32ShadowCr0);
3790 if (u32Cr0Mask != pVCpu->hm.s.vmx.u32Cr0Mask)
3791 rc |= VMXWriteVmcs32(VMX_VMCS_CTRL_CR0_MASK, u32Cr0Mask);
3792 if (uProcCtls != pVCpu->hm.s.vmx.u32ProcCtls)
3793 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, uProcCtls);
3794 if (uXcptBitmap != pVCpu->hm.s.vmx.u32XcptBitmap)
3795 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, uXcptBitmap);
3796 AssertRCReturn(rc, rc);
3797
3798 /* Update our caches. */
3799 pVCpu->hm.s.vmx.u32Cr0Mask = u32Cr0Mask;
3800 pVCpu->hm.s.vmx.u32ProcCtls = uProcCtls;
3801 pVCpu->hm.s.vmx.u32XcptBitmap = uXcptBitmap;
3802
3803 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_CR0);
3804
3805 Log4Func(("u32Cr0Mask=%#RX32 u32ShadowCr0=%#RX32 u32GuestCr0=%#RX32 (fSetCr0=%#RX32 fZapCr0=%#RX32\n", u32Cr0Mask,
3806 u32ShadowCr0, u32GuestCr0, fSetCr0, fZapCr0));
3807 }
3808
3809 return VINF_SUCCESS;
3810}
3811
3812
3813/**
3814 * Exports the guest control registers (CR3, CR4) into the guest-state area
3815 * in the VMCS.
3816 *
3817 * @returns VBox strict status code.
3818 * @retval VINF_EM_RESCHEDULE_REM if we try to emulate non-paged guest code
3819 * without unrestricted guest access and the VMMDev is not presently
3820 * mapped (e.g. EFI32).
3821 *
3822 * @param pVCpu The cross context virtual CPU structure.
3823 *
3824 * @remarks No-long-jump zone!!!
3825 */
3826static VBOXSTRICTRC hmR0VmxExportGuestCR3AndCR4(PVMCPU pVCpu)
3827{
3828 int rc = VINF_SUCCESS;
3829 PVM pVM = pVCpu->CTX_SUFF(pVM);
3830
3831 /*
3832 * Guest CR2.
3833 * It's always loaded in the assembler code. Nothing to do here.
3834 */
3835
3836 /*
3837 * Guest CR3.
3838 */
3839 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_CR3)
3840 {
3841 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_CR3);
3842
3843 RTGCPHYS GCPhysGuestCR3 = NIL_RTGCPHYS;
3844 if (pVM->hm.s.fNestedPaging)
3845 {
3846 pVCpu->hm.s.vmx.HCPhysEPTP = PGMGetHyperCR3(pVCpu);
3847
3848 /* Validate. See Intel spec. 28.2.2 "EPT Translation Mechanism" and 24.6.11 "Extended-Page-Table Pointer (EPTP)" */
3849 Assert(pVCpu->hm.s.vmx.HCPhysEPTP);
3850 Assert(!(pVCpu->hm.s.vmx.HCPhysEPTP & UINT64_C(0xfff0000000000000)));
3851 Assert(!(pVCpu->hm.s.vmx.HCPhysEPTP & 0xfff));
3852
3853 /* VMX_EPT_MEMTYPE_WB support is already checked in hmR0VmxSetupTaggedTlb(). */
3854 pVCpu->hm.s.vmx.HCPhysEPTP |= VMX_EPT_MEMTYPE_WB
3855 | (VMX_EPT_PAGE_WALK_LENGTH_DEFAULT << VMX_EPT_PAGE_WALK_LENGTH_SHIFT);
3856
3857 /* Validate. See Intel spec. 26.2.1 "Checks on VMX Controls" */
3858 AssertMsg( ((pVCpu->hm.s.vmx.HCPhysEPTP >> 3) & 0x07) == 3 /* Bits 3:5 (EPT page walk length - 1) must be 3. */
3859 && ((pVCpu->hm.s.vmx.HCPhysEPTP >> 7) & 0x1f) == 0, /* Bits 7:11 MBZ. */
3860 ("EPTP %#RX64\n", pVCpu->hm.s.vmx.HCPhysEPTP));
3861 AssertMsg( !((pVCpu->hm.s.vmx.HCPhysEPTP >> 6) & 0x01) /* Bit 6 (EPT accessed & dirty bit). */
3862 || (pVM->hm.s.vmx.Msrs.u64EptVpidCaps & MSR_IA32_VMX_EPT_VPID_CAP_EPT_ACCESS_DIRTY),
3863 ("EPTP accessed/dirty bit not supported by CPU but set %#RX64\n", pVCpu->hm.s.vmx.HCPhysEPTP));
3864
3865 rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_EPTP_FULL, pVCpu->hm.s.vmx.HCPhysEPTP);
3866 AssertRCReturn(rc, rc);
3867
3868 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
3869 if ( pVM->hm.s.vmx.fUnrestrictedGuest
3870 || CPUMIsGuestPagingEnabledEx(pCtx))
3871 {
3872 /* If the guest is in PAE mode, pass the PDPEs to VT-x using the VMCS fields. */
3873 if (CPUMIsGuestInPAEModeEx(pCtx))
3874 {
3875 rc = PGMGstGetPaePdpes(pVCpu, &pVCpu->hm.s.aPdpes[0]);
3876 AssertRCReturn(rc, rc);
3877 rc = VMXWriteVmcs64(VMX_VMCS64_GUEST_PDPTE0_FULL, pVCpu->hm.s.aPdpes[0].u);
3878 rc |= VMXWriteVmcs64(VMX_VMCS64_GUEST_PDPTE1_FULL, pVCpu->hm.s.aPdpes[1].u);
3879 rc |= VMXWriteVmcs64(VMX_VMCS64_GUEST_PDPTE2_FULL, pVCpu->hm.s.aPdpes[2].u);
3880 rc |= VMXWriteVmcs64(VMX_VMCS64_GUEST_PDPTE3_FULL, pVCpu->hm.s.aPdpes[3].u);
3881 AssertRCReturn(rc, rc);
3882 }
3883
3884 /*
3885 * The guest's view of its CR3 is unblemished with Nested Paging when the
3886 * guest is using paging or we have unrestricted guest execution to handle
3887 * the guest when it's not using paging.
3888 */
3889 GCPhysGuestCR3 = pCtx->cr3;
3890 }
3891 else
3892 {
3893 /*
3894 * The guest is not using paging, but the CPU (VT-x) has to. While the guest
3895 * thinks it accesses physical memory directly, we use our identity-mapped
3896 * page table to map guest-linear to guest-physical addresses. EPT takes care
3897 * of translating it to host-physical addresses.
3898 */
3899 RTGCPHYS GCPhys;
3900 Assert(pVM->hm.s.vmx.pNonPagingModeEPTPageTable);
3901
3902 /* We obtain it here every time as the guest could have relocated this PCI region. */
3903 rc = PDMVmmDevHeapR3ToGCPhys(pVM, pVM->hm.s.vmx.pNonPagingModeEPTPageTable, &GCPhys);
3904 if (RT_SUCCESS(rc))
3905 { /* likely */ }
3906 else if (rc == VERR_PDM_DEV_HEAP_R3_TO_GCPHYS)
3907 {
3908 Log4Func(("VERR_PDM_DEV_HEAP_R3_TO_GCPHYS -> VINF_EM_RESCHEDULE_REM\n"));
3909 return VINF_EM_RESCHEDULE_REM; /* We cannot execute now, switch to REM/IEM till the guest maps in VMMDev. */
3910 }
3911 else
3912 AssertMsgFailedReturn(("%Rrc\n", rc), rc);
3913
3914 GCPhysGuestCR3 = GCPhys;
3915 }
3916
3917 Log4Func(("u32GuestCr3=%#RGp (GstN)\n", GCPhysGuestCR3));
3918 rc = VMXWriteVmcsGstN(VMX_VMCS_GUEST_CR3, GCPhysGuestCR3);
3919 AssertRCReturn(rc, rc);
3920 }
3921 else
3922 {
3923 /* Non-nested paging case, just use the hypervisor's CR3. */
3924 RTHCPHYS HCPhysGuestCR3 = PGMGetHyperCR3(pVCpu);
3925
3926 Log4Func(("u32GuestCr3=%#RHv (HstN)\n", HCPhysGuestCR3));
3927 rc = VMXWriteVmcsHstN(VMX_VMCS_GUEST_CR3, HCPhysGuestCR3);
3928 AssertRCReturn(rc, rc);
3929 }
3930
3931 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_CR3);
3932 }
3933
3934 /*
3935 * Guest CR4.
3936 * ASSUMES this is done everytime we get in from ring-3! (XCR0)
3937 */
3938 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_CR4)
3939 {
3940 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
3941 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_CR4);
3942 Assert(!RT_HI_U32(pCtx->cr4));
3943
3944 uint32_t u32GuestCr4 = pCtx->cr4;
3945 uint32_t const u32ShadowCr4 = pCtx->cr4;
3946
3947 /*
3948 * Setup VT-x's view of the guest CR4.
3949 *
3950 * If we're emulating real-mode using virtual-8086 mode, we want to redirect software
3951 * interrupts to the 8086 program interrupt handler. Clear the VME bit (the interrupt
3952 * redirection bitmap is already all 0, see hmR3InitFinalizeR0())
3953 *
3954 * See Intel spec. 20.2 "Software Interrupt Handling Methods While in Virtual-8086 Mode".
3955 */
3956 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
3957 {
3958 Assert(pVM->hm.s.vmx.pRealModeTSS);
3959 Assert(PDMVmmDevHeapIsEnabled(pVM));
3960 u32GuestCr4 &= ~X86_CR4_VME;
3961 }
3962
3963 if (pVM->hm.s.fNestedPaging)
3964 {
3965 if ( !CPUMIsGuestPagingEnabledEx(pCtx)
3966 && !pVM->hm.s.vmx.fUnrestrictedGuest)
3967 {
3968 /* We use 4 MB pages in our identity mapping page table when the guest doesn't have paging. */
3969 u32GuestCr4 |= X86_CR4_PSE;
3970 /* Our identity mapping is a 32-bit page directory. */
3971 u32GuestCr4 &= ~X86_CR4_PAE;
3972 }
3973 /* else use guest CR4.*/
3974 }
3975 else
3976 {
3977 /*
3978 * The shadow paging modes and guest paging modes are different, the shadow is in accordance with the host
3979 * paging mode and thus we need to adjust VT-x's view of CR4 depending on our shadow page tables.
3980 */
3981 switch (pVCpu->hm.s.enmShadowMode)
3982 {
3983 case PGMMODE_REAL: /* Real-mode. */
3984 case PGMMODE_PROTECTED: /* Protected mode without paging. */
3985 case PGMMODE_32_BIT: /* 32-bit paging. */
3986 {
3987 u32GuestCr4 &= ~X86_CR4_PAE;
3988 break;
3989 }
3990
3991 case PGMMODE_PAE: /* PAE paging. */
3992 case PGMMODE_PAE_NX: /* PAE paging with NX. */
3993 {
3994 u32GuestCr4 |= X86_CR4_PAE;
3995 break;
3996 }
3997
3998 case PGMMODE_AMD64: /* 64-bit AMD paging (long mode). */
3999 case PGMMODE_AMD64_NX: /* 64-bit AMD paging (long mode) with NX enabled. */
4000#ifdef VBOX_ENABLE_64_BITS_GUESTS
4001 break;
4002#endif
4003 default:
4004 AssertFailed();
4005 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
4006 }
4007 }
4008
4009 /* We need to set and clear the CR4 specific bits here (mainly the X86_CR4_VMXE bit). */
4010 uint64_t const fSetCr4 = (pVM->hm.s.vmx.Msrs.u64Cr4Fixed0 & pVM->hm.s.vmx.Msrs.u64Cr4Fixed1);
4011 uint64_t const fZapCr4 = (pVM->hm.s.vmx.Msrs.u64Cr4Fixed0 | pVM->hm.s.vmx.Msrs.u64Cr4Fixed1);
4012 u32GuestCr4 |= fSetCr4;
4013 u32GuestCr4 &= fZapCr4;
4014
4015 /* Setup CR4 mask. CR4 flags owned by the host, if the guest attempts to change them,
4016 that would cause a VM-exit. */
4017 uint32_t u32Cr4Mask = X86_CR4_VME
4018 | X86_CR4_PAE
4019 | X86_CR4_PGE
4020 | X86_CR4_PSE
4021 | X86_CR4_VMXE;
4022 if (pVM->cpum.ro.HostFeatures.fXSaveRstor)
4023 u32Cr4Mask |= X86_CR4_OSXSAVE;
4024 if (pVM->cpum.ro.GuestFeatures.fPcid)
4025 u32Cr4Mask |= X86_CR4_PCIDE;
4026
4027 /* Write VT-x's view of the guest CR4, the CR4 modify mask and the read-only CR4 shadow
4028 into the VMCS and update our cache. */
4029 rc = VMXWriteVmcs32(VMX_VMCS_GUEST_CR4, u32GuestCr4);
4030 rc |= VMXWriteVmcs32(VMX_VMCS_CTRL_CR4_READ_SHADOW, u32ShadowCr4);
4031 if (pVCpu->hm.s.vmx.u32Cr4Mask != u32Cr4Mask)
4032 rc |= VMXWriteVmcs32(VMX_VMCS_CTRL_CR4_MASK, u32Cr4Mask);
4033 AssertRCReturn(rc, rc);
4034 pVCpu->hm.s.vmx.u32Cr4Mask = u32Cr4Mask;
4035
4036 /* Whether to save/load/restore XCR0 during world switch depends on CR4.OSXSAVE and host+guest XCR0. */
4037 pVCpu->hm.s.fLoadSaveGuestXcr0 = (pCtx->cr4 & X86_CR4_OSXSAVE) && pCtx->aXcr[0] != ASMGetXcr0();
4038
4039 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_CR4);
4040
4041 Log4Func(("u32GuestCr4=%#RX32 u32ShadowCr4=%#RX32 (fSetCr4=%#RX32 fZapCr4=%#RX32)\n", u32GuestCr4, u32ShadowCr4, fSetCr4,
4042 fZapCr4));
4043 }
4044 return rc;
4045}
4046
4047
4048/**
4049 * Exports the guest debug registers into the guest-state area in the VMCS.
4050 * The guest debug bits are partially shared with the host (e.g. DR6, DR0-3).
4051 *
4052 * This also sets up whether \#DB and MOV DRx accesses cause VM-exits.
4053 *
4054 * @returns VBox status code.
4055 * @param pVCpu The cross context virtual CPU structure.
4056 *
4057 * @remarks No-long-jump zone!!!
4058 */
4059static int hmR0VmxExportSharedDebugState(PVMCPU pVCpu)
4060{
4061 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
4062
4063#ifdef VBOX_STRICT
4064 /* Validate. Intel spec. 26.3.1.1 "Checks on Guest Controls Registers, Debug Registers, MSRs" */
4065 if (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_DEBUG)
4066 {
4067 /* Validate. Intel spec. 17.2 "Debug Registers", recompiler paranoia checks. */
4068 Assert((pVCpu->cpum.GstCtx.dr[7] & (X86_DR7_MBZ_MASK | X86_DR7_RAZ_MASK)) == 0);
4069 Assert((pVCpu->cpum.GstCtx.dr[7] & X86_DR7_RA1_MASK) == X86_DR7_RA1_MASK);
4070 }
4071#endif
4072
4073 bool fSteppingDB = false;
4074 bool fInterceptMovDRx = false;
4075 uint32_t uProcCtls = pVCpu->hm.s.vmx.u32ProcCtls;
4076 if (pVCpu->hm.s.fSingleInstruction)
4077 {
4078 /* If the CPU supports the monitor trap flag, use it for single stepping in DBGF and avoid intercepting #DB. */
4079 PVM pVM = pVCpu->CTX_SUFF(pVM);
4080 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_MONITOR_TRAP_FLAG)
4081 {
4082 uProcCtls |= VMX_PROC_CTLS_MONITOR_TRAP_FLAG;
4083 Assert(fSteppingDB == false);
4084 }
4085 else
4086 {
4087 pVCpu->cpum.GstCtx.eflags.u32 |= X86_EFL_TF;
4088 pVCpu->hm.s.fCtxChanged |= HM_CHANGED_GUEST_RFLAGS;
4089 pVCpu->hm.s.fClearTrapFlag = true;
4090 fSteppingDB = true;
4091 }
4092 }
4093
4094 uint32_t u32GuestDr7;
4095 if ( fSteppingDB
4096 || (CPUMGetHyperDR7(pVCpu) & X86_DR7_ENABLED_MASK))
4097 {
4098 /*
4099 * Use the combined guest and host DRx values found in the hypervisor register set
4100 * because the debugger has breakpoints active or someone is single stepping on the
4101 * host side without a monitor trap flag.
4102 *
4103 * Note! DBGF expects a clean DR6 state before executing guest code.
4104 */
4105#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
4106 if ( CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx)
4107 && !CPUMIsHyperDebugStateActivePending(pVCpu))
4108 {
4109 CPUMR0LoadHyperDebugState(pVCpu, true /* include DR6 */);
4110 Assert(CPUMIsHyperDebugStateActivePending(pVCpu));
4111 Assert(!CPUMIsGuestDebugStateActivePending(pVCpu));
4112 }
4113 else
4114#endif
4115 if (!CPUMIsHyperDebugStateActive(pVCpu))
4116 {
4117 CPUMR0LoadHyperDebugState(pVCpu, true /* include DR6 */);
4118 Assert(CPUMIsHyperDebugStateActive(pVCpu));
4119 Assert(!CPUMIsGuestDebugStateActive(pVCpu));
4120 }
4121
4122 /* Update DR7 with the hypervisor value (other DRx registers are handled by CPUM one way or another). */
4123 u32GuestDr7 = (uint32_t)CPUMGetHyperDR7(pVCpu);
4124 pVCpu->hm.s.fUsingHyperDR7 = true;
4125 fInterceptMovDRx = true;
4126 }
4127 else
4128 {
4129 /*
4130 * If the guest has enabled debug registers, we need to load them prior to
4131 * executing guest code so they'll trigger at the right time.
4132 */
4133 if (pVCpu->cpum.GstCtx.dr[7] & (X86_DR7_ENABLED_MASK | X86_DR7_GD))
4134 {
4135#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
4136 if ( CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx)
4137 && !CPUMIsGuestDebugStateActivePending(pVCpu))
4138 {
4139 CPUMR0LoadGuestDebugState(pVCpu, true /* include DR6 */);
4140 Assert(CPUMIsGuestDebugStateActivePending(pVCpu));
4141 Assert(!CPUMIsHyperDebugStateActivePending(pVCpu));
4142 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxArmed);
4143 }
4144 else
4145#endif
4146 if (!CPUMIsGuestDebugStateActive(pVCpu))
4147 {
4148 CPUMR0LoadGuestDebugState(pVCpu, true /* include DR6 */);
4149 Assert(CPUMIsGuestDebugStateActive(pVCpu));
4150 Assert(!CPUMIsHyperDebugStateActive(pVCpu));
4151 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxArmed);
4152 }
4153 Assert(!fInterceptMovDRx);
4154 }
4155 /*
4156 * If no debugging enabled, we'll lazy load DR0-3. Unlike on AMD-V, we
4157 * must intercept #DB in order to maintain a correct DR6 guest value, and
4158 * because we need to intercept it to prevent nested #DBs from hanging the
4159 * CPU, we end up always having to intercept it. See hmR0VmxInitXcptBitmap.
4160 */
4161#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
4162 else if ( !CPUMIsGuestDebugStateActivePending(pVCpu)
4163 && !CPUMIsGuestDebugStateActive(pVCpu))
4164#else
4165 else if (!CPUMIsGuestDebugStateActive(pVCpu))
4166#endif
4167 {
4168 fInterceptMovDRx = true;
4169 }
4170
4171 /* Update DR7 with the actual guest value. */
4172 u32GuestDr7 = pVCpu->cpum.GstCtx.dr[7];
4173 pVCpu->hm.s.fUsingHyperDR7 = false;
4174 }
4175
4176 if (fInterceptMovDRx)
4177 uProcCtls |= VMX_PROC_CTLS_MOV_DR_EXIT;
4178 else
4179 uProcCtls &= ~VMX_PROC_CTLS_MOV_DR_EXIT;
4180
4181 /*
4182 * Update the processor-based VM-execution controls with the MOV-DRx intercepts and the
4183 * monitor-trap flag and update our cache.
4184 */
4185 if (uProcCtls != pVCpu->hm.s.vmx.u32ProcCtls)
4186 {
4187 int rc2 = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, uProcCtls);
4188 AssertRCReturn(rc2, rc2);
4189 pVCpu->hm.s.vmx.u32ProcCtls = uProcCtls;
4190 }
4191
4192 /*
4193 * Update guest DR7.
4194 */
4195 int rc = VMXWriteVmcs32(VMX_VMCS_GUEST_DR7, u32GuestDr7);
4196 AssertRCReturn(rc, rc);
4197
4198 /*
4199 * If we have forced EFLAGS.TF to be set because we're single-stepping in the hypervisor debugger,
4200 * we need to clear interrupt inhibition if any as otherwise it causes a VM-entry failure.
4201 *
4202 * See Intel spec. 26.3.1.5 "Checks on Guest Non-Register State".
4203 */
4204 if (fSteppingDB)
4205 {
4206 Assert(pVCpu->hm.s.fSingleInstruction);
4207 Assert(pVCpu->cpum.GstCtx.eflags.Bits.u1TF);
4208
4209 uint32_t fIntrState = 0;
4210 rc = VMXReadVmcs32(VMX_VMCS32_GUEST_INT_STATE, &fIntrState);
4211 AssertRCReturn(rc, rc);
4212
4213 if (fIntrState & (VMX_VMCS_GUEST_INT_STATE_BLOCK_STI | VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS))
4214 {
4215 fIntrState &= ~(VMX_VMCS_GUEST_INT_STATE_BLOCK_STI | VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS);
4216 rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_INT_STATE, fIntrState);
4217 AssertRCReturn(rc, rc);
4218 }
4219 }
4220
4221 return VINF_SUCCESS;
4222}
4223
4224
4225#ifdef VBOX_STRICT
4226/**
4227 * Strict function to validate segment registers.
4228 *
4229 * @param pVCpu The cross context virtual CPU structure.
4230 *
4231 * @remarks Will import guest CR0 on strict builds during validation of
4232 * segments.
4233 */
4234static void hmR0VmxValidateSegmentRegs(PVMCPU pVCpu)
4235{
4236 /*
4237 * Validate segment registers. See Intel spec. 26.3.1.2 "Checks on Guest Segment Registers".
4238 *
4239 * The reason we check for attribute value 0 in this function and not just the unusable bit is
4240 * because hmR0VmxExportGuestSegmentReg() only updates the VMCS' copy of the value with the unusable bit
4241 * and doesn't change the guest-context value.
4242 */
4243 PVM pVM = pVCpu->CTX_SUFF(pVM);
4244 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
4245 hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_CR0);
4246 if ( !pVM->hm.s.vmx.fUnrestrictedGuest
4247 && ( !CPUMIsGuestInRealModeEx(pCtx)
4248 && !CPUMIsGuestInV86ModeEx(pCtx)))
4249 {
4250 /* Protected mode checks */
4251 /* CS */
4252 Assert(pCtx->cs.Attr.n.u1Present);
4253 Assert(!(pCtx->cs.Attr.u & 0xf00));
4254 Assert(!(pCtx->cs.Attr.u & 0xfffe0000));
4255 Assert( (pCtx->cs.u32Limit & 0xfff) == 0xfff
4256 || !(pCtx->cs.Attr.n.u1Granularity));
4257 Assert( !(pCtx->cs.u32Limit & 0xfff00000)
4258 || (pCtx->cs.Attr.n.u1Granularity));
4259 /* CS cannot be loaded with NULL in protected mode. */
4260 Assert(pCtx->cs.Attr.u && !(pCtx->cs.Attr.u & X86DESCATTR_UNUSABLE)); /** @todo is this really true even for 64-bit CS? */
4261 if (pCtx->cs.Attr.n.u4Type == 9 || pCtx->cs.Attr.n.u4Type == 11)
4262 Assert(pCtx->cs.Attr.n.u2Dpl == pCtx->ss.Attr.n.u2Dpl);
4263 else if (pCtx->cs.Attr.n.u4Type == 13 || pCtx->cs.Attr.n.u4Type == 15)
4264 Assert(pCtx->cs.Attr.n.u2Dpl <= pCtx->ss.Attr.n.u2Dpl);
4265 else
4266 AssertMsgFailed(("Invalid CS Type %#x\n", pCtx->cs.Attr.n.u2Dpl));
4267 /* SS */
4268 Assert((pCtx->ss.Sel & X86_SEL_RPL) == (pCtx->cs.Sel & X86_SEL_RPL));
4269 Assert(pCtx->ss.Attr.n.u2Dpl == (pCtx->ss.Sel & X86_SEL_RPL));
4270 if ( !(pCtx->cr0 & X86_CR0_PE)
4271 || pCtx->cs.Attr.n.u4Type == 3)
4272 {
4273 Assert(!pCtx->ss.Attr.n.u2Dpl);
4274 }
4275 if (pCtx->ss.Attr.u && !(pCtx->ss.Attr.u & X86DESCATTR_UNUSABLE))
4276 {
4277 Assert((pCtx->ss.Sel & X86_SEL_RPL) == (pCtx->cs.Sel & X86_SEL_RPL));
4278 Assert(pCtx->ss.Attr.n.u4Type == 3 || pCtx->ss.Attr.n.u4Type == 7);
4279 Assert(pCtx->ss.Attr.n.u1Present);
4280 Assert(!(pCtx->ss.Attr.u & 0xf00));
4281 Assert(!(pCtx->ss.Attr.u & 0xfffe0000));
4282 Assert( (pCtx->ss.u32Limit & 0xfff) == 0xfff
4283 || !(pCtx->ss.Attr.n.u1Granularity));
4284 Assert( !(pCtx->ss.u32Limit & 0xfff00000)
4285 || (pCtx->ss.Attr.n.u1Granularity));
4286 }
4287 /* DS, ES, FS, GS - only check for usable selectors, see hmR0VmxExportGuestSegmentReg(). */
4288 if (pCtx->ds.Attr.u && !(pCtx->ds.Attr.u & X86DESCATTR_UNUSABLE))
4289 {
4290 Assert(pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED);
4291 Assert(pCtx->ds.Attr.n.u1Present);
4292 Assert(pCtx->ds.Attr.n.u4Type > 11 || pCtx->ds.Attr.n.u2Dpl >= (pCtx->ds.Sel & X86_SEL_RPL));
4293 Assert(!(pCtx->ds.Attr.u & 0xf00));
4294 Assert(!(pCtx->ds.Attr.u & 0xfffe0000));
4295 Assert( (pCtx->ds.u32Limit & 0xfff) == 0xfff
4296 || !(pCtx->ds.Attr.n.u1Granularity));
4297 Assert( !(pCtx->ds.u32Limit & 0xfff00000)
4298 || (pCtx->ds.Attr.n.u1Granularity));
4299 Assert( !(pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_CODE)
4300 || (pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_READ));
4301 }
4302 if (pCtx->es.Attr.u && !(pCtx->es.Attr.u & X86DESCATTR_UNUSABLE))
4303 {
4304 Assert(pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED);
4305 Assert(pCtx->es.Attr.n.u1Present);
4306 Assert(pCtx->es.Attr.n.u4Type > 11 || pCtx->es.Attr.n.u2Dpl >= (pCtx->es.Sel & X86_SEL_RPL));
4307 Assert(!(pCtx->es.Attr.u & 0xf00));
4308 Assert(!(pCtx->es.Attr.u & 0xfffe0000));
4309 Assert( (pCtx->es.u32Limit & 0xfff) == 0xfff
4310 || !(pCtx->es.Attr.n.u1Granularity));
4311 Assert( !(pCtx->es.u32Limit & 0xfff00000)
4312 || (pCtx->es.Attr.n.u1Granularity));
4313 Assert( !(pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_CODE)
4314 || (pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_READ));
4315 }
4316 if (pCtx->fs.Attr.u && !(pCtx->fs.Attr.u & X86DESCATTR_UNUSABLE))
4317 {
4318 Assert(pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED);
4319 Assert(pCtx->fs.Attr.n.u1Present);
4320 Assert(pCtx->fs.Attr.n.u4Type > 11 || pCtx->fs.Attr.n.u2Dpl >= (pCtx->fs.Sel & X86_SEL_RPL));
4321 Assert(!(pCtx->fs.Attr.u & 0xf00));
4322 Assert(!(pCtx->fs.Attr.u & 0xfffe0000));
4323 Assert( (pCtx->fs.u32Limit & 0xfff) == 0xfff
4324 || !(pCtx->fs.Attr.n.u1Granularity));
4325 Assert( !(pCtx->fs.u32Limit & 0xfff00000)
4326 || (pCtx->fs.Attr.n.u1Granularity));
4327 Assert( !(pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_CODE)
4328 || (pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_READ));
4329 }
4330 if (pCtx->gs.Attr.u && !(pCtx->gs.Attr.u & X86DESCATTR_UNUSABLE))
4331 {
4332 Assert(pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED);
4333 Assert(pCtx->gs.Attr.n.u1Present);
4334 Assert(pCtx->gs.Attr.n.u4Type > 11 || pCtx->gs.Attr.n.u2Dpl >= (pCtx->gs.Sel & X86_SEL_RPL));
4335 Assert(!(pCtx->gs.Attr.u & 0xf00));
4336 Assert(!(pCtx->gs.Attr.u & 0xfffe0000));
4337 Assert( (pCtx->gs.u32Limit & 0xfff) == 0xfff
4338 || !(pCtx->gs.Attr.n.u1Granularity));
4339 Assert( !(pCtx->gs.u32Limit & 0xfff00000)
4340 || (pCtx->gs.Attr.n.u1Granularity));
4341 Assert( !(pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_CODE)
4342 || (pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_READ));
4343 }
4344 /* 64-bit capable CPUs. */
4345# if HC_ARCH_BITS == 64
4346 Assert(!RT_HI_U32(pCtx->cs.u64Base));
4347 Assert(!pCtx->ss.Attr.u || !RT_HI_U32(pCtx->ss.u64Base));
4348 Assert(!pCtx->ds.Attr.u || !RT_HI_U32(pCtx->ds.u64Base));
4349 Assert(!pCtx->es.Attr.u || !RT_HI_U32(pCtx->es.u64Base));
4350# endif
4351 }
4352 else if ( CPUMIsGuestInV86ModeEx(pCtx)
4353 || ( CPUMIsGuestInRealModeEx(pCtx)
4354 && !pVM->hm.s.vmx.fUnrestrictedGuest))
4355 {
4356 /* Real and v86 mode checks. */
4357 /* hmR0VmxExportGuestSegmentReg() writes the modified in VMCS. We want what we're feeding to VT-x. */
4358 uint32_t u32CSAttr, u32SSAttr, u32DSAttr, u32ESAttr, u32FSAttr, u32GSAttr;
4359 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4360 {
4361 u32CSAttr = 0xf3; u32SSAttr = 0xf3; u32DSAttr = 0xf3; u32ESAttr = 0xf3; u32FSAttr = 0xf3; u32GSAttr = 0xf3;
4362 }
4363 else
4364 {
4365 u32CSAttr = pCtx->cs.Attr.u; u32SSAttr = pCtx->ss.Attr.u; u32DSAttr = pCtx->ds.Attr.u;
4366 u32ESAttr = pCtx->es.Attr.u; u32FSAttr = pCtx->fs.Attr.u; u32GSAttr = pCtx->gs.Attr.u;
4367 }
4368
4369 /* CS */
4370 AssertMsg((pCtx->cs.u64Base == (uint64_t)pCtx->cs.Sel << 4), ("CS base %#x %#x\n", pCtx->cs.u64Base, pCtx->cs.Sel));
4371 Assert(pCtx->cs.u32Limit == 0xffff);
4372 Assert(u32CSAttr == 0xf3);
4373 /* SS */
4374 Assert(pCtx->ss.u64Base == (uint64_t)pCtx->ss.Sel << 4);
4375 Assert(pCtx->ss.u32Limit == 0xffff);
4376 Assert(u32SSAttr == 0xf3);
4377 /* DS */
4378 Assert(pCtx->ds.u64Base == (uint64_t)pCtx->ds.Sel << 4);
4379 Assert(pCtx->ds.u32Limit == 0xffff);
4380 Assert(u32DSAttr == 0xf3);
4381 /* ES */
4382 Assert(pCtx->es.u64Base == (uint64_t)pCtx->es.Sel << 4);
4383 Assert(pCtx->es.u32Limit == 0xffff);
4384 Assert(u32ESAttr == 0xf3);
4385 /* FS */
4386 Assert(pCtx->fs.u64Base == (uint64_t)pCtx->fs.Sel << 4);
4387 Assert(pCtx->fs.u32Limit == 0xffff);
4388 Assert(u32FSAttr == 0xf3);
4389 /* GS */
4390 Assert(pCtx->gs.u64Base == (uint64_t)pCtx->gs.Sel << 4);
4391 Assert(pCtx->gs.u32Limit == 0xffff);
4392 Assert(u32GSAttr == 0xf3);
4393 /* 64-bit capable CPUs. */
4394# if HC_ARCH_BITS == 64
4395 Assert(!RT_HI_U32(pCtx->cs.u64Base));
4396 Assert(!u32SSAttr || !RT_HI_U32(pCtx->ss.u64Base));
4397 Assert(!u32DSAttr || !RT_HI_U32(pCtx->ds.u64Base));
4398 Assert(!u32ESAttr || !RT_HI_U32(pCtx->es.u64Base));
4399# endif
4400 }
4401}
4402#endif /* VBOX_STRICT */
4403
4404
4405/**
4406 * Exports a guest segment register into the guest-state area in the VMCS.
4407 *
4408 * @returns VBox status code.
4409 * @param pVCpu The cross context virtual CPU structure.
4410 * @param idxSel Index of the selector in the VMCS.
4411 * @param idxLimit Index of the segment limit in the VMCS.
4412 * @param idxBase Index of the segment base in the VMCS.
4413 * @param idxAccess Index of the access rights of the segment in the VMCS.
4414 * @param pSelReg Pointer to the segment selector.
4415 *
4416 * @remarks No-long-jump zone!!!
4417 */
4418static int hmR0VmxExportGuestSegmentReg(PVMCPU pVCpu, uint32_t idxSel, uint32_t idxLimit, uint32_t idxBase, uint32_t idxAccess,
4419 PCCPUMSELREG pSelReg)
4420{
4421 int rc = VMXWriteVmcs32(idxSel, pSelReg->Sel); /* 16-bit guest selector field. */
4422 rc |= VMXWriteVmcs32(idxLimit, pSelReg->u32Limit); /* 32-bit guest segment limit field. */
4423 rc |= VMXWriteVmcsGstN(idxBase, pSelReg->u64Base); /* Natural width guest segment base field.*/
4424 AssertRCReturn(rc, rc);
4425
4426 uint32_t u32Access = pSelReg->Attr.u;
4427 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4428 {
4429 /* VT-x requires our real-using-v86 mode hack to override the segment access-right bits. */
4430 u32Access = 0xf3;
4431 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.pRealModeTSS);
4432 Assert(PDMVmmDevHeapIsEnabled(pVCpu->CTX_SUFF(pVM)));
4433 }
4434 else
4435 {
4436 /*
4437 * The way to differentiate between whether this is really a null selector or was just
4438 * a selector loaded with 0 in real-mode is using the segment attributes. A selector
4439 * loaded in real-mode with the value 0 is valid and usable in protected-mode and we
4440 * should -not- mark it as an unusable segment. Both the recompiler & VT-x ensures
4441 * NULL selectors loaded in protected-mode have their attribute as 0.
4442 */
4443 if (!u32Access)
4444 u32Access = X86DESCATTR_UNUSABLE;
4445 }
4446
4447 /* Validate segment access rights. Refer to Intel spec. "26.3.1.2 Checks on Guest Segment Registers". */
4448 AssertMsg((u32Access & X86DESCATTR_UNUSABLE) || (u32Access & X86_SEL_TYPE_ACCESSED),
4449 ("Access bit not set for usable segment. idx=%#x sel=%#x attr %#x\n", idxBase, pSelReg, pSelReg->Attr.u));
4450
4451 rc = VMXWriteVmcs32(idxAccess, u32Access); /* 32-bit guest segment access-rights field. */
4452 AssertRCReturn(rc, rc);
4453 return rc;
4454}
4455
4456
4457/**
4458 * Exports the guest segment registers, GDTR, IDTR, LDTR, (TR, FS and GS bases)
4459 * into the guest-state area in the VMCS.
4460 *
4461 * @returns VBox status code.
4462 * @param pVCpu The cross context virtual CPU structure.
4463 *
4464 * @remarks Will import guest CR0 on strict builds during validation of
4465 * segments.
4466 * @remarks No-long-jump zone!!!
4467 */
4468static int hmR0VmxExportGuestSegmentRegs(PVMCPU pVCpu)
4469{
4470 int rc = VERR_INTERNAL_ERROR_5;
4471 PVM pVM = pVCpu->CTX_SUFF(pVM);
4472 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
4473
4474 /*
4475 * Guest Segment registers: CS, SS, DS, ES, FS, GS.
4476 */
4477 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SREG_MASK)
4478 {
4479#ifdef VBOX_WITH_REM
4480 if (!pVM->hm.s.vmx.fUnrestrictedGuest)
4481 {
4482 Assert(pVM->hm.s.vmx.pRealModeTSS);
4483 AssertCompile(PGMMODE_REAL < PGMMODE_PROTECTED);
4484 if ( pVCpu->hm.s.vmx.fWasInRealMode
4485 && PGMGetGuestMode(pVCpu) >= PGMMODE_PROTECTED)
4486 {
4487 /* Signal that the recompiler must flush its code-cache as the guest -may- rewrite code it will later execute
4488 in real-mode (e.g. OpenBSD 4.0) */
4489 REMFlushTBs(pVM);
4490 Log4Func(("Switch to protected mode detected!\n"));
4491 pVCpu->hm.s.vmx.fWasInRealMode = false;
4492 }
4493 }
4494#endif
4495 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_CS)
4496 {
4497 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_CS);
4498 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4499 pVCpu->hm.s.vmx.RealMode.AttrCS.u = pCtx->cs.Attr.u;
4500 rc = HMVMX_EXPORT_SREG(CS, &pCtx->cs);
4501 AssertRCReturn(rc, rc);
4502 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_CS);
4503 }
4504
4505 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SS)
4506 {
4507 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_SS);
4508 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4509 pVCpu->hm.s.vmx.RealMode.AttrSS.u = pCtx->ss.Attr.u;
4510 rc = HMVMX_EXPORT_SREG(SS, &pCtx->ss);
4511 AssertRCReturn(rc, rc);
4512 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_SS);
4513 }
4514
4515 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_DS)
4516 {
4517 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_DS);
4518 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4519 pVCpu->hm.s.vmx.RealMode.AttrDS.u = pCtx->ds.Attr.u;
4520 rc = HMVMX_EXPORT_SREG(DS, &pCtx->ds);
4521 AssertRCReturn(rc, rc);
4522 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_DS);
4523 }
4524
4525 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_ES)
4526 {
4527 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_ES);
4528 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4529 pVCpu->hm.s.vmx.RealMode.AttrES.u = pCtx->es.Attr.u;
4530 rc = HMVMX_EXPORT_SREG(ES, &pCtx->es);
4531 AssertRCReturn(rc, rc);
4532 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_ES);
4533 }
4534
4535 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_FS)
4536 {
4537 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_FS);
4538 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4539 pVCpu->hm.s.vmx.RealMode.AttrFS.u = pCtx->fs.Attr.u;
4540 rc = HMVMX_EXPORT_SREG(FS, &pCtx->fs);
4541 AssertRCReturn(rc, rc);
4542 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_FS);
4543 }
4544
4545 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_GS)
4546 {
4547 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_GS);
4548 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4549 pVCpu->hm.s.vmx.RealMode.AttrGS.u = pCtx->gs.Attr.u;
4550 rc = HMVMX_EXPORT_SREG(GS, &pCtx->gs);
4551 AssertRCReturn(rc, rc);
4552 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_GS);
4553 }
4554
4555#ifdef VBOX_STRICT
4556 hmR0VmxValidateSegmentRegs(pVCpu);
4557#endif
4558
4559 Log4Func(("CS=%#RX16 Base=%#RX64 Limit=%#RX32 Attr=%#RX32\n", pCtx->cs.Sel, pCtx->cs.u64Base,
4560 pCtx->cs.u32Limit, pCtx->cs.Attr.u));
4561 }
4562
4563 /*
4564 * Guest TR.
4565 */
4566 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_TR)
4567 {
4568 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_TR);
4569
4570 /*
4571 * Real-mode emulation using virtual-8086 mode with CR4.VME. Interrupt redirection is
4572 * achieved using the interrupt redirection bitmap (all bits cleared to let the guest
4573 * handle INT-n's) in the TSS. See hmR3InitFinalizeR0() to see how pRealModeTSS is setup.
4574 */
4575 uint16_t u16Sel = 0;
4576 uint32_t u32Limit = 0;
4577 uint64_t u64Base = 0;
4578 uint32_t u32AccessRights = 0;
4579
4580 if (!pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
4581 {
4582 u16Sel = pCtx->tr.Sel;
4583 u32Limit = pCtx->tr.u32Limit;
4584 u64Base = pCtx->tr.u64Base;
4585 u32AccessRights = pCtx->tr.Attr.u;
4586 }
4587 else
4588 {
4589 Assert(pVM->hm.s.vmx.pRealModeTSS);
4590 Assert(PDMVmmDevHeapIsEnabled(pVM)); /* Guaranteed by HMCanExecuteGuest() -XXX- what about inner loop changes? */
4591
4592 /* We obtain it here every time as PCI regions could be reconfigured in the guest, changing the VMMDev base. */
4593 RTGCPHYS GCPhys;
4594 rc = PDMVmmDevHeapR3ToGCPhys(pVM, pVM->hm.s.vmx.pRealModeTSS, &GCPhys);
4595 AssertRCReturn(rc, rc);
4596
4597 X86DESCATTR DescAttr;
4598 DescAttr.u = 0;
4599 DescAttr.n.u1Present = 1;
4600 DescAttr.n.u4Type = X86_SEL_TYPE_SYS_386_TSS_BUSY;
4601
4602 u16Sel = 0;
4603 u32Limit = HM_VTX_TSS_SIZE;
4604 u64Base = GCPhys; /* in real-mode phys = virt. */
4605 u32AccessRights = DescAttr.u;
4606 }
4607
4608 /* Validate. */
4609 Assert(!(u16Sel & RT_BIT(2)));
4610 AssertMsg( (u32AccessRights & 0xf) == X86_SEL_TYPE_SYS_386_TSS_BUSY
4611 || (u32AccessRights & 0xf) == X86_SEL_TYPE_SYS_286_TSS_BUSY, ("TSS is not busy!? %#x\n", u32AccessRights));
4612 AssertMsg(!(u32AccessRights & X86DESCATTR_UNUSABLE), ("TR unusable bit is not clear!? %#x\n", u32AccessRights));
4613 Assert(!(u32AccessRights & RT_BIT(4))); /* System MBZ.*/
4614 Assert(u32AccessRights & RT_BIT(7)); /* Present MB1.*/
4615 Assert(!(u32AccessRights & 0xf00)); /* 11:8 MBZ. */
4616 Assert(!(u32AccessRights & 0xfffe0000)); /* 31:17 MBZ. */
4617 Assert( (u32Limit & 0xfff) == 0xfff
4618 || !(u32AccessRights & RT_BIT(15))); /* Granularity MBZ. */
4619 Assert( !(pCtx->tr.u32Limit & 0xfff00000)
4620 || (u32AccessRights & RT_BIT(15))); /* Granularity MB1. */
4621
4622 rc = VMXWriteVmcs32(VMX_VMCS16_GUEST_TR_SEL, u16Sel);
4623 rc |= VMXWriteVmcs32(VMX_VMCS32_GUEST_TR_LIMIT, u32Limit);
4624 rc |= VMXWriteVmcs32(VMX_VMCS32_GUEST_TR_ACCESS_RIGHTS, u32AccessRights);
4625 rc |= VMXWriteVmcsGstN(VMX_VMCS_GUEST_TR_BASE, u64Base);
4626 AssertRCReturn(rc, rc);
4627
4628 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_TR);
4629 Log4Func(("TR base=%#RX64\n", pCtx->tr.u64Base));
4630 }
4631
4632 /*
4633 * Guest GDTR.
4634 */
4635 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_GDTR)
4636 {
4637 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_GDTR);
4638
4639 rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_GDTR_LIMIT, pCtx->gdtr.cbGdt);
4640 rc |= VMXWriteVmcsGstN(VMX_VMCS_GUEST_GDTR_BASE, pCtx->gdtr.pGdt);
4641 AssertRCReturn(rc, rc);
4642
4643 /* Validate. */
4644 Assert(!(pCtx->gdtr.cbGdt & 0xffff0000)); /* Bits 31:16 MBZ. */
4645
4646 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_GDTR);
4647 Log4Func(("GDTR base=%#RX64\n", pCtx->gdtr.pGdt));
4648 }
4649
4650 /*
4651 * Guest LDTR.
4652 */
4653 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_LDTR)
4654 {
4655 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_LDTR);
4656
4657 /* The unusable bit is specific to VT-x, if it's a null selector mark it as an unusable segment. */
4658 uint32_t u32Access = 0;
4659 if (!pCtx->ldtr.Attr.u)
4660 u32Access = X86DESCATTR_UNUSABLE;
4661 else
4662 u32Access = pCtx->ldtr.Attr.u;
4663
4664 rc = VMXWriteVmcs32(VMX_VMCS16_GUEST_LDTR_SEL, pCtx->ldtr.Sel);
4665 rc |= VMXWriteVmcs32(VMX_VMCS32_GUEST_LDTR_LIMIT, pCtx->ldtr.u32Limit);
4666 rc |= VMXWriteVmcs32(VMX_VMCS32_GUEST_LDTR_ACCESS_RIGHTS, u32Access);
4667 rc |= VMXWriteVmcsGstN(VMX_VMCS_GUEST_LDTR_BASE, pCtx->ldtr.u64Base);
4668 AssertRCReturn(rc, rc);
4669
4670 /* Validate. */
4671 if (!(u32Access & X86DESCATTR_UNUSABLE))
4672 {
4673 Assert(!(pCtx->ldtr.Sel & RT_BIT(2))); /* TI MBZ. */
4674 Assert(pCtx->ldtr.Attr.n.u4Type == 2); /* Type MB2 (LDT). */
4675 Assert(!pCtx->ldtr.Attr.n.u1DescType); /* System MBZ. */
4676 Assert(pCtx->ldtr.Attr.n.u1Present == 1); /* Present MB1. */
4677 Assert(!pCtx->ldtr.Attr.n.u4LimitHigh); /* 11:8 MBZ. */
4678 Assert(!(pCtx->ldtr.Attr.u & 0xfffe0000)); /* 31:17 MBZ. */
4679 Assert( (pCtx->ldtr.u32Limit & 0xfff) == 0xfff
4680 || !pCtx->ldtr.Attr.n.u1Granularity); /* Granularity MBZ. */
4681 Assert( !(pCtx->ldtr.u32Limit & 0xfff00000)
4682 || pCtx->ldtr.Attr.n.u1Granularity); /* Granularity MB1. */
4683 }
4684
4685 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_LDTR);
4686 Log4Func(("LDTR base=%#RX64\n", pCtx->ldtr.u64Base));
4687 }
4688
4689 /*
4690 * Guest IDTR.
4691 */
4692 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_IDTR)
4693 {
4694 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_IDTR);
4695
4696 rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_IDTR_LIMIT, pCtx->idtr.cbIdt);
4697 rc |= VMXWriteVmcsGstN(VMX_VMCS_GUEST_IDTR_BASE, pCtx->idtr.pIdt);
4698 AssertRCReturn(rc, rc);
4699
4700 /* Validate. */
4701 Assert(!(pCtx->idtr.cbIdt & 0xffff0000)); /* Bits 31:16 MBZ. */
4702
4703 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_IDTR);
4704 Log4Func(("IDTR base=%#RX64\n", pCtx->idtr.pIdt));
4705 }
4706
4707 return VINF_SUCCESS;
4708}
4709
4710
4711/**
4712 * Exports certain guest MSRs into the VM-entry MSR-load and VM-exit MSR-store
4713 * areas.
4714 *
4715 * These MSRs will automatically be loaded to the host CPU on every successful
4716 * VM-entry and stored from the host CPU on every successful VM-exit. This also
4717 * creates/updates MSR slots for the host MSRs. The actual host MSR values are
4718 * -not- updated here for performance reasons. See hmR0VmxExportHostMsrs().
4719 *
4720 * Also exports the guest sysenter MSRs into the guest-state area in the VMCS.
4721 *
4722 * @returns VBox status code.
4723 * @param pVCpu The cross context virtual CPU structure.
4724 *
4725 * @remarks No-long-jump zone!!!
4726 */
4727static int hmR0VmxExportGuestMsrs(PVMCPU pVCpu)
4728{
4729 AssertPtr(pVCpu);
4730 AssertPtr(pVCpu->hm.s.vmx.pvGuestMsr);
4731
4732 /*
4733 * MSRs that we use the auto-load/store MSR area in the VMCS.
4734 * For 64-bit hosts, we load/restore them lazily, see hmR0VmxLazyLoadGuestMsrs().
4735 */
4736 PVM pVM = pVCpu->CTX_SUFF(pVM);
4737 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
4738 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_VMX_GUEST_AUTO_MSRS)
4739 {
4740 if (pVM->hm.s.fAllow64BitGuests)
4741 {
4742#if HC_ARCH_BITS == 32
4743 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_SYSCALL_MSRS | CPUMCTX_EXTRN_KERNEL_GS_BASE);
4744
4745 int rc = hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K8_LSTAR, pCtx->msrLSTAR, false, NULL);
4746 rc |= hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K6_STAR, pCtx->msrSTAR, false, NULL);
4747 rc |= hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K8_SF_MASK, pCtx->msrSFMASK, false, NULL);
4748 rc |= hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K8_KERNEL_GS_BASE, pCtx->msrKERNELGSBASE, false, NULL);
4749 AssertRCReturn(rc, rc);
4750# ifdef LOG_ENABLED
4751 PCVMXAUTOMSR pMsr = (PCVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
4752 for (uint32_t i = 0; i < pVCpu->hm.s.vmx.cMsrs; i++, pMsr++)
4753 Log4Func(("MSR[%RU32]: u32Msr=%#RX32 u64Value=%#RX64\n", i, pMsr->u32Msr, pMsr->u64Value));
4754# endif
4755#endif
4756 }
4757 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_VMX_GUEST_AUTO_MSRS);
4758 }
4759
4760 /*
4761 * Guest Sysenter MSRs.
4762 * These flags are only set when MSR-bitmaps are not supported by the CPU and we cause
4763 * VM-exits on WRMSRs for these MSRs.
4764 */
4765 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SYSENTER_MSR_MASK)
4766 {
4767 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_SYSENTER_MSRS);
4768
4769 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SYSENTER_CS_MSR)
4770 {
4771 int rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_SYSENTER_CS, pCtx->SysEnter.cs);
4772 AssertRCReturn(rc, rc);
4773 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_SYSENTER_CS_MSR);
4774 }
4775
4776 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SYSENTER_EIP_MSR)
4777 {
4778 int rc = VMXWriteVmcsGstN(VMX_VMCS_GUEST_SYSENTER_EIP, pCtx->SysEnter.eip);
4779 AssertRCReturn(rc, rc);
4780 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_SYSENTER_EIP_MSR);
4781 }
4782
4783 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_SYSENTER_ESP_MSR)
4784 {
4785 int rc = VMXWriteVmcsGstN(VMX_VMCS_GUEST_SYSENTER_ESP, pCtx->SysEnter.esp);
4786 AssertRCReturn(rc, rc);
4787 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_SYSENTER_ESP_MSR);
4788 }
4789 }
4790
4791 if (ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged) & HM_CHANGED_GUEST_EFER_MSR)
4792 {
4793 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_EFER);
4794
4795 if (hmR0VmxShouldSwapEferMsr(pVCpu))
4796 {
4797 /*
4798 * If the CPU supports VMCS controls for swapping EFER, use it. Otherwise, we have no option
4799 * but to use the auto-load store MSR area in the VMCS for swapping EFER. See @bugref{7368}.
4800 */
4801 if (pVM->hm.s.vmx.fSupportsVmcsEfer)
4802 {
4803 int rc = VMXWriteVmcs64(VMX_VMCS64_GUEST_EFER_FULL, pCtx->msrEFER);
4804 AssertRCReturn(rc,rc);
4805 Log4Func(("EFER=%#RX64\n", pCtx->msrEFER));
4806 }
4807 else
4808 {
4809 int rc = hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K6_EFER, pCtx->msrEFER, false /* fUpdateHostMsr */,
4810 NULL /* pfAddedAndUpdated */);
4811 AssertRCReturn(rc, rc);
4812
4813 /* We need to intercept reads too, see @bugref{7386#c16}. */
4814 if (pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_USE_MSR_BITMAPS)
4815 hmR0VmxSetMsrPermission(pVCpu, MSR_K6_EFER, VMXMSREXIT_INTERCEPT_READ, VMXMSREXIT_INTERCEPT_WRITE);
4816 Log4Func(("MSR[--]: u32Msr=%#RX32 u64Value=%#RX64 cMsrs=%u\n", MSR_K6_EFER, pCtx->msrEFER,
4817 pVCpu->hm.s.vmx.cMsrs));
4818 }
4819 }
4820 else if (!pVM->hm.s.vmx.fSupportsVmcsEfer)
4821 hmR0VmxRemoveAutoLoadStoreMsr(pVCpu, MSR_K6_EFER);
4822 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~HM_CHANGED_GUEST_EFER_MSR);
4823 }
4824
4825 return VINF_SUCCESS;
4826}
4827
4828
4829#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
4830/**
4831 * Check if guest state allows safe use of 32-bit switcher again.
4832 *
4833 * Segment bases and protected mode structures must be 32-bit addressable
4834 * because the 32-bit switcher will ignore high dword when writing these VMCS
4835 * fields. See @bugref{8432} for details.
4836 *
4837 * @returns true if safe, false if must continue to use the 64-bit switcher.
4838 * @param pCtx Pointer to the guest-CPU context.
4839 *
4840 * @remarks No-long-jump zone!!!
4841 */
4842static bool hmR0VmxIs32BitSwitcherSafe(PCCPUMCTX pCtx)
4843{
4844 if (pCtx->gdtr.pGdt & UINT64_C(0xffffffff00000000)) return false;
4845 if (pCtx->idtr.pIdt & UINT64_C(0xffffffff00000000)) return false;
4846 if (pCtx->ldtr.u64Base & UINT64_C(0xffffffff00000000)) return false;
4847 if (pCtx->tr.u64Base & UINT64_C(0xffffffff00000000)) return false;
4848 if (pCtx->es.u64Base & UINT64_C(0xffffffff00000000)) return false;
4849 if (pCtx->cs.u64Base & UINT64_C(0xffffffff00000000)) return false;
4850 if (pCtx->ss.u64Base & UINT64_C(0xffffffff00000000)) return false;
4851 if (pCtx->ds.u64Base & UINT64_C(0xffffffff00000000)) return false;
4852 if (pCtx->fs.u64Base & UINT64_C(0xffffffff00000000)) return false;
4853 if (pCtx->gs.u64Base & UINT64_C(0xffffffff00000000)) return false;
4854
4855 /* All good, bases are 32-bit. */
4856 return true;
4857}
4858#endif
4859
4860
4861/**
4862 * Selects up the appropriate function to run guest code.
4863 *
4864 * @returns VBox status code.
4865 * @param pVCpu The cross context virtual CPU structure.
4866 *
4867 * @remarks No-long-jump zone!!!
4868 */
4869static int hmR0VmxSelectVMRunHandler(PVMCPU pVCpu)
4870{
4871 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
4872 if (CPUMIsGuestInLongModeEx(pCtx))
4873 {
4874#ifndef VBOX_ENABLE_64_BITS_GUESTS
4875 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
4876#endif
4877 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests); /* Guaranteed by hmR3InitFinalizeR0(). */
4878#if HC_ARCH_BITS == 32
4879 /* 32-bit host. We need to switch to 64-bit before running the 64-bit guest. */
4880 if (pVCpu->hm.s.vmx.pfnStartVM != VMXR0SwitcherStartVM64)
4881 {
4882#ifdef VBOX_STRICT
4883 if (pVCpu->hm.s.vmx.pfnStartVM != NULL) /* Very first entry would have saved host-state already, ignore it. */
4884 {
4885 /* Currently, all mode changes sends us back to ring-3, so these should be set. See @bugref{6944}. */
4886 uint64_t const fCtxChanged = ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged);
4887 RT_UNTRUSTED_NONVOLATILE_COPY_FENCE();
4888 AssertMsg(fCtxChanged & ( HM_CHANGED_VMX_EXIT_CTLS
4889 | HM_CHANGED_VMX_ENTRY_CTLS
4890 | HM_CHANGED_GUEST_EFER_MSR), ("fCtxChanged=%#RX64\n", fCtxChanged));
4891 }
4892#endif
4893 pVCpu->hm.s.vmx.pfnStartVM = VMXR0SwitcherStartVM64;
4894
4895 /* Mark that we've switched to 64-bit handler, we can't safely switch back to 32-bit for
4896 the rest of the VM run (until VM reset). See @bugref{8432#c7}. */
4897 pVCpu->hm.s.vmx.fSwitchedTo64on32 = true;
4898 Log4Func(("Selected 64-bit switcher\n"));
4899 }
4900#else
4901 /* 64-bit host. */
4902 pVCpu->hm.s.vmx.pfnStartVM = VMXR0StartVM64;
4903#endif
4904 }
4905 else
4906 {
4907 /* Guest is not in long mode, use the 32-bit handler. */
4908#if HC_ARCH_BITS == 32
4909 if ( pVCpu->hm.s.vmx.pfnStartVM != VMXR0StartVM32
4910 && !pVCpu->hm.s.vmx.fSwitchedTo64on32 /* If set, guest mode change does not imply switcher change. */
4911 && pVCpu->hm.s.vmx.pfnStartVM != NULL) /* Very first entry would have saved host-state already, ignore it. */
4912 {
4913# ifdef VBOX_STRICT
4914 /* Currently, all mode changes sends us back to ring-3, so these should be set. See @bugref{6944}. */
4915 uint64_t const fCtxChanged = ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged);
4916 RT_UNTRUSTED_NONVOLATILE_COPY_FENCE();
4917 AssertMsg(fCtxChanged & ( HM_CHANGED_VMX_EXIT_CTLS
4918 | HM_CHANGED_VMX_ENTRY_CTLS
4919 | HM_CHANGED_GUEST_EFER_MSR), ("fCtxChanged=%#RX64\n", fCtxChanged));
4920# endif
4921 }
4922# ifdef VBOX_ENABLE_64_BITS_GUESTS
4923 /*
4924 * Keep using the 64-bit switcher even though we're in 32-bit because of bad Intel
4925 * design, see @bugref{8432#c7}. If real-on-v86 mode is active, clear the 64-bit
4926 * switcher flag because now we know the guest is in a sane state where it's safe
4927 * to use the 32-bit switcher. Otherwise check the guest state if it's safe to use
4928 * the much faster 32-bit switcher again.
4929 */
4930 if (!pVCpu->hm.s.vmx.fSwitchedTo64on32)
4931 {
4932 if (pVCpu->hm.s.vmx.pfnStartVM != VMXR0StartVM32)
4933 Log4Func(("Selected 32-bit switcher\n"));
4934 pVCpu->hm.s.vmx.pfnStartVM = VMXR0StartVM32;
4935 }
4936 else
4937 {
4938 Assert(pVCpu->hm.s.vmx.pfnStartVM == VMXR0SwitcherStartVM64);
4939 if ( pVCpu->hm.s.vmx.RealMode.fRealOnV86Active
4940 || hmR0VmxIs32BitSwitcherSafe(pCtx))
4941 {
4942 pVCpu->hm.s.vmx.fSwitchedTo64on32 = false;
4943 pVCpu->hm.s.vmx.pfnStartVM = VMXR0StartVM32;
4944 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_EFER_MSR
4945 | HM_CHANGED_VMX_ENTRY_CTLS
4946 | HM_CHANGED_VMX_EXIT_CTLS
4947 | HM_CHANGED_HOST_CONTEXT);
4948 Log4Func(("Selected 32-bit switcher (safe)\n"));
4949 }
4950 }
4951# else
4952 pVCpu->hm.s.vmx.pfnStartVM = VMXR0StartVM32;
4953# endif
4954#else
4955 pVCpu->hm.s.vmx.pfnStartVM = VMXR0StartVM32;
4956#endif
4957 }
4958 Assert(pVCpu->hm.s.vmx.pfnStartVM);
4959 return VINF_SUCCESS;
4960}
4961
4962
4963/**
4964 * Wrapper for running the guest code in VT-x.
4965 *
4966 * @returns VBox status code, no informational status codes.
4967 * @param pVCpu The cross context virtual CPU structure.
4968 *
4969 * @remarks No-long-jump zone!!!
4970 */
4971DECLINLINE(int) hmR0VmxRunGuest(PVMCPU pVCpu)
4972{
4973 /* Mark that HM is the keeper of all guest-CPU registers now that we're going to execute guest code. */
4974 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
4975 pCtx->fExtrn |= HMVMX_CPUMCTX_EXTRN_ALL | CPUMCTX_EXTRN_KEEPER_HM;
4976
4977 /*
4978 * 64-bit Windows uses XMM registers in the kernel as the Microsoft compiler expresses
4979 * floating-point operations using SSE instructions. Some XMM registers (XMM6-XMM15) are
4980 * callee-saved and thus the need for this XMM wrapper.
4981 *
4982 * See MSDN "Configuring Programs for 64-bit/x64 Software Conventions / Register Usage".
4983 */
4984 bool const fResumeVM = RT_BOOL(pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_LAUNCHED);
4985 /** @todo Add stats for resume vs launch. */
4986 PVM pVM = pVCpu->CTX_SUFF(pVM);
4987#ifdef VBOX_WITH_KERNEL_USING_XMM
4988 int rc = hmR0VMXStartVMWrapXMM(fResumeVM, pCtx, &pVCpu->hm.s.vmx.VMCSCache, pVM, pVCpu, pVCpu->hm.s.vmx.pfnStartVM);
4989#else
4990 int rc = pVCpu->hm.s.vmx.pfnStartVM(fResumeVM, pCtx, &pVCpu->hm.s.vmx.VMCSCache, pVM, pVCpu);
4991#endif
4992 AssertMsg(rc <= VINF_SUCCESS, ("%Rrc\n", rc));
4993 return rc;
4994}
4995
4996
4997/**
4998 * Reports world-switch error and dumps some useful debug info.
4999 *
5000 * @param pVCpu The cross context virtual CPU structure.
5001 * @param rcVMRun The return code from VMLAUNCH/VMRESUME.
5002 * @param pVmxTransient Pointer to the VMX transient structure (only
5003 * exitReason updated).
5004 */
5005static void hmR0VmxReportWorldSwitchError(PVMCPU pVCpu, int rcVMRun, PVMXTRANSIENT pVmxTransient)
5006{
5007 Assert(pVCpu);
5008 Assert(pVmxTransient);
5009 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
5010
5011 Log4Func(("VM-entry failure: %Rrc\n", rcVMRun));
5012 switch (rcVMRun)
5013 {
5014 case VERR_VMX_INVALID_VMXON_PTR:
5015 AssertFailed();
5016 break;
5017 case VINF_SUCCESS: /* VMLAUNCH/VMRESUME succeeded but VM-entry failed... yeah, true story. */
5018 case VERR_VMX_UNABLE_TO_START_VM: /* VMLAUNCH/VMRESUME itself failed. */
5019 {
5020 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_REASON, &pVCpu->hm.s.vmx.LastError.u32ExitReason);
5021 rc |= VMXReadVmcs32(VMX_VMCS32_RO_VM_INSTR_ERROR, &pVCpu->hm.s.vmx.LastError.u32InstrError);
5022 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
5023 AssertRC(rc);
5024
5025 pVCpu->hm.s.vmx.LastError.idEnteredCpu = pVCpu->hm.s.idEnteredCpu;
5026 /* LastError.idCurrentCpu was already updated in hmR0VmxPreRunGuestCommitted().
5027 Cannot do it here as we may have been long preempted. */
5028
5029#ifdef VBOX_STRICT
5030 Log4(("uExitReason %#RX32 (VmxTransient %#RX16)\n", pVCpu->hm.s.vmx.LastError.u32ExitReason,
5031 pVmxTransient->uExitReason));
5032 Log4(("Exit Qualification %#RX64\n", pVmxTransient->uExitQual));
5033 Log4(("InstrError %#RX32\n", pVCpu->hm.s.vmx.LastError.u32InstrError));
5034 if (pVCpu->hm.s.vmx.LastError.u32InstrError <= HMVMX_INSTR_ERROR_MAX)
5035 Log4(("InstrError Desc. \"%s\"\n", g_apszVmxInstrErrors[pVCpu->hm.s.vmx.LastError.u32InstrError]));
5036 else
5037 Log4(("InstrError Desc. Range exceeded %u\n", HMVMX_INSTR_ERROR_MAX));
5038 Log4(("Entered host CPU %u\n", pVCpu->hm.s.vmx.LastError.idEnteredCpu));
5039 Log4(("Current host CPU %u\n", pVCpu->hm.s.vmx.LastError.idCurrentCpu));
5040
5041 /* VMX control bits. */
5042 uint32_t u32Val;
5043 uint64_t u64Val;
5044 RTHCUINTREG uHCReg;
5045 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PIN_EXEC, &u32Val); AssertRC(rc);
5046 Log4(("VMX_VMCS32_CTRL_PIN_EXEC %#RX32\n", u32Val));
5047 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, &u32Val); AssertRC(rc);
5048 Log4(("VMX_VMCS32_CTRL_PROC_EXEC %#RX32\n", u32Val));
5049 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_SECONDARY_CTLS)
5050 {
5051 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PROC_EXEC2, &u32Val); AssertRC(rc);
5052 Log4(("VMX_VMCS32_CTRL_PROC_EXEC2 %#RX32\n", u32Val));
5053 }
5054 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY, &u32Val); AssertRC(rc);
5055 Log4(("VMX_VMCS32_CTRL_ENTRY %#RX32\n", u32Val));
5056 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT, &u32Val); AssertRC(rc);
5057 Log4(("VMX_VMCS32_CTRL_EXIT %#RX32\n", u32Val));
5058 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_CR3_TARGET_COUNT, &u32Val); AssertRC(rc);
5059 Log4(("VMX_VMCS32_CTRL_CR3_TARGET_COUNT %#RX32\n", u32Val));
5060 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO, &u32Val); AssertRC(rc);
5061 Log4(("VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO %#RX32\n", u32Val));
5062 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_EXCEPTION_ERRCODE, &u32Val); AssertRC(rc);
5063 Log4(("VMX_VMCS32_CTRL_ENTRY_EXCEPTION_ERRCODE %#RX32\n", u32Val));
5064 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_INSTR_LENGTH, &u32Val); AssertRC(rc);
5065 Log4(("VMX_VMCS32_CTRL_ENTRY_INSTR_LENGTH %u\n", u32Val));
5066 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_TPR_THRESHOLD, &u32Val); AssertRC(rc);
5067 Log4(("VMX_VMCS32_CTRL_TPR_THRESHOLD %u\n", u32Val));
5068 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_STORE_COUNT, &u32Val); AssertRC(rc);
5069 Log4(("VMX_VMCS32_CTRL_EXIT_MSR_STORE_COUNT %u (guest MSRs)\n", u32Val));
5070 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXIT_MSR_LOAD_COUNT, &u32Val); AssertRC(rc);
5071 Log4(("VMX_VMCS32_CTRL_EXIT_MSR_LOAD_COUNT %u (host MSRs)\n", u32Val));
5072 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_MSR_LOAD_COUNT, &u32Val); AssertRC(rc);
5073 Log4(("VMX_VMCS32_CTRL_ENTRY_MSR_LOAD_COUNT %u (guest MSRs)\n", u32Val));
5074 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, &u32Val); AssertRC(rc);
5075 Log4(("VMX_VMCS32_CTRL_EXCEPTION_BITMAP %#RX32\n", u32Val));
5076 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MASK, &u32Val); AssertRC(rc);
5077 Log4(("VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MASK %#RX32\n", u32Val));
5078 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MATCH, &u32Val); AssertRC(rc);
5079 Log4(("VMX_VMCS32_CTRL_PAGEFAULT_ERROR_MATCH %#RX32\n", u32Val));
5080 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR0_MASK, &uHCReg); AssertRC(rc);
5081 Log4(("VMX_VMCS_CTRL_CR0_MASK %#RHr\n", uHCReg));
5082 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR0_READ_SHADOW, &uHCReg); AssertRC(rc);
5083 Log4(("VMX_VMCS_CTRL_CR4_READ_SHADOW %#RHr\n", uHCReg));
5084 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR4_MASK, &uHCReg); AssertRC(rc);
5085 Log4(("VMX_VMCS_CTRL_CR4_MASK %#RHr\n", uHCReg));
5086 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR4_READ_SHADOW, &uHCReg); AssertRC(rc);
5087 Log4(("VMX_VMCS_CTRL_CR4_READ_SHADOW %#RHr\n", uHCReg));
5088 if (pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging)
5089 {
5090 rc = VMXReadVmcs64(VMX_VMCS64_CTRL_EPTP_FULL, &u64Val); AssertRC(rc);
5091 Log4(("VMX_VMCS64_CTRL_EPTP_FULL %#RX64\n", u64Val));
5092 }
5093
5094 /* Guest bits. */
5095 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_RIP, &u64Val); AssertRC(rc);
5096 Log4(("Old Guest Rip %#RX64 New %#RX64\n", pVCpu->cpum.GstCtx.rip, u64Val));
5097 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_RSP, &u64Val); AssertRC(rc);
5098 Log4(("Old Guest Rsp %#RX64 New %#RX64\n", pVCpu->cpum.GstCtx.rsp, u64Val));
5099 rc = VMXReadVmcs32(VMX_VMCS_GUEST_RFLAGS, &u32Val); AssertRC(rc);
5100 Log4(("Old Guest Rflags %#RX32 New %#RX32\n", pVCpu->cpum.GstCtx.eflags.u32, u32Val));
5101 if (pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fVpid)
5102 {
5103 rc = VMXReadVmcs32(VMX_VMCS16_VPID, &u32Val); AssertRC(rc);
5104 Log4(("VMX_VMCS16_VPID %u\n", u32Val));
5105 }
5106
5107 /* Host bits. */
5108 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_CR0, &uHCReg); AssertRC(rc);
5109 Log4(("Host CR0 %#RHr\n", uHCReg));
5110 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_CR3, &uHCReg); AssertRC(rc);
5111 Log4(("Host CR3 %#RHr\n", uHCReg));
5112 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_CR4, &uHCReg); AssertRC(rc);
5113 Log4(("Host CR4 %#RHr\n", uHCReg));
5114
5115 RTGDTR HostGdtr;
5116 PCX86DESCHC pDesc;
5117 ASMGetGDTR(&HostGdtr);
5118 rc = VMXReadVmcs32(VMX_VMCS16_HOST_CS_SEL, &u32Val); AssertRC(rc);
5119 Log4(("Host CS %#08x\n", u32Val));
5120 if (u32Val < HostGdtr.cbGdt)
5121 {
5122 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5123 hmR0DumpDescriptor(pDesc, u32Val, "CS: ");
5124 }
5125
5126 rc = VMXReadVmcs32(VMX_VMCS16_HOST_DS_SEL, &u32Val); AssertRC(rc);
5127 Log4(("Host DS %#08x\n", u32Val));
5128 if (u32Val < HostGdtr.cbGdt)
5129 {
5130 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5131 hmR0DumpDescriptor(pDesc, u32Val, "DS: ");
5132 }
5133
5134 rc = VMXReadVmcs32(VMX_VMCS16_HOST_ES_SEL, &u32Val); AssertRC(rc);
5135 Log4(("Host ES %#08x\n", u32Val));
5136 if (u32Val < HostGdtr.cbGdt)
5137 {
5138 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5139 hmR0DumpDescriptor(pDesc, u32Val, "ES: ");
5140 }
5141
5142 rc = VMXReadVmcs32(VMX_VMCS16_HOST_FS_SEL, &u32Val); AssertRC(rc);
5143 Log4(("Host FS %#08x\n", u32Val));
5144 if (u32Val < HostGdtr.cbGdt)
5145 {
5146 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5147 hmR0DumpDescriptor(pDesc, u32Val, "FS: ");
5148 }
5149
5150 rc = VMXReadVmcs32(VMX_VMCS16_HOST_GS_SEL, &u32Val); AssertRC(rc);
5151 Log4(("Host GS %#08x\n", u32Val));
5152 if (u32Val < HostGdtr.cbGdt)
5153 {
5154 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5155 hmR0DumpDescriptor(pDesc, u32Val, "GS: ");
5156 }
5157
5158 rc = VMXReadVmcs32(VMX_VMCS16_HOST_SS_SEL, &u32Val); AssertRC(rc);
5159 Log4(("Host SS %#08x\n", u32Val));
5160 if (u32Val < HostGdtr.cbGdt)
5161 {
5162 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5163 hmR0DumpDescriptor(pDesc, u32Val, "SS: ");
5164 }
5165
5166 rc = VMXReadVmcs32(VMX_VMCS16_HOST_TR_SEL, &u32Val); AssertRC(rc);
5167 Log4(("Host TR %#08x\n", u32Val));
5168 if (u32Val < HostGdtr.cbGdt)
5169 {
5170 pDesc = (PCX86DESCHC)(HostGdtr.pGdt + (u32Val & X86_SEL_MASK));
5171 hmR0DumpDescriptor(pDesc, u32Val, "TR: ");
5172 }
5173
5174 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_TR_BASE, &uHCReg); AssertRC(rc);
5175 Log4(("Host TR Base %#RHv\n", uHCReg));
5176 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_GDTR_BASE, &uHCReg); AssertRC(rc);
5177 Log4(("Host GDTR Base %#RHv\n", uHCReg));
5178 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_IDTR_BASE, &uHCReg); AssertRC(rc);
5179 Log4(("Host IDTR Base %#RHv\n", uHCReg));
5180 rc = VMXReadVmcs32(VMX_VMCS32_HOST_SYSENTER_CS, &u32Val); AssertRC(rc);
5181 Log4(("Host SYSENTER CS %#08x\n", u32Val));
5182 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_SYSENTER_EIP, &uHCReg); AssertRC(rc);
5183 Log4(("Host SYSENTER EIP %#RHv\n", uHCReg));
5184 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_SYSENTER_ESP, &uHCReg); AssertRC(rc);
5185 Log4(("Host SYSENTER ESP %#RHv\n", uHCReg));
5186 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_RSP, &uHCReg); AssertRC(rc);
5187 Log4(("Host RSP %#RHv\n", uHCReg));
5188 rc = VMXReadVmcsHstN(VMX_VMCS_HOST_RIP, &uHCReg); AssertRC(rc);
5189 Log4(("Host RIP %#RHv\n", uHCReg));
5190# if HC_ARCH_BITS == 64
5191 Log4(("MSR_K6_EFER = %#RX64\n", ASMRdMsr(MSR_K6_EFER)));
5192 Log4(("MSR_K8_CSTAR = %#RX64\n", ASMRdMsr(MSR_K8_CSTAR)));
5193 Log4(("MSR_K8_LSTAR = %#RX64\n", ASMRdMsr(MSR_K8_LSTAR)));
5194 Log4(("MSR_K6_STAR = %#RX64\n", ASMRdMsr(MSR_K6_STAR)));
5195 Log4(("MSR_K8_SF_MASK = %#RX64\n", ASMRdMsr(MSR_K8_SF_MASK)));
5196 Log4(("MSR_K8_KERNEL_GS_BASE = %#RX64\n", ASMRdMsr(MSR_K8_KERNEL_GS_BASE)));
5197# endif
5198#endif /* VBOX_STRICT */
5199 break;
5200 }
5201
5202 default:
5203 /* Impossible */
5204 AssertMsgFailed(("hmR0VmxReportWorldSwitchError %Rrc (%#x)\n", rcVMRun, rcVMRun));
5205 break;
5206 }
5207}
5208
5209
5210#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
5211#ifndef VMX_USE_CACHED_VMCS_ACCESSES
5212# error "VMX_USE_CACHED_VMCS_ACCESSES not defined when it should be!"
5213#endif
5214#ifdef VBOX_STRICT
5215static bool hmR0VmxIsValidWriteField(uint32_t idxField)
5216{
5217 switch (idxField)
5218 {
5219 case VMX_VMCS_GUEST_RIP:
5220 case VMX_VMCS_GUEST_RSP:
5221 case VMX_VMCS_GUEST_SYSENTER_EIP:
5222 case VMX_VMCS_GUEST_SYSENTER_ESP:
5223 case VMX_VMCS_GUEST_GDTR_BASE:
5224 case VMX_VMCS_GUEST_IDTR_BASE:
5225 case VMX_VMCS_GUEST_CS_BASE:
5226 case VMX_VMCS_GUEST_DS_BASE:
5227 case VMX_VMCS_GUEST_ES_BASE:
5228 case VMX_VMCS_GUEST_FS_BASE:
5229 case VMX_VMCS_GUEST_GS_BASE:
5230 case VMX_VMCS_GUEST_SS_BASE:
5231 case VMX_VMCS_GUEST_LDTR_BASE:
5232 case VMX_VMCS_GUEST_TR_BASE:
5233 case VMX_VMCS_GUEST_CR3:
5234 return true;
5235 }
5236 return false;
5237}
5238
5239static bool hmR0VmxIsValidReadField(uint32_t idxField)
5240{
5241 switch (idxField)
5242 {
5243 /* Read-only fields. */
5244 case VMX_VMCS_RO_EXIT_QUALIFICATION:
5245 return true;
5246 }
5247 /* Remaining readable fields should also be writable. */
5248 return hmR0VmxIsValidWriteField(idxField);
5249}
5250#endif /* VBOX_STRICT */
5251
5252
5253/**
5254 * Executes the specified handler in 64-bit mode.
5255 *
5256 * @returns VBox status code (no informational status codes).
5257 * @param pVCpu The cross context virtual CPU structure.
5258 * @param enmOp The operation to perform.
5259 * @param cParams Number of parameters.
5260 * @param paParam Array of 32-bit parameters.
5261 */
5262VMMR0DECL(int) VMXR0Execute64BitsHandler(PVMCPU pVCpu, HM64ON32OP enmOp, uint32_t cParams, uint32_t *paParam)
5263{
5264 PVM pVM = pVCpu->CTX_SUFF(pVM);
5265 AssertReturn(pVM->hm.s.pfnHost32ToGuest64R0, VERR_HM_NO_32_TO_64_SWITCHER);
5266 Assert(enmOp > HM64ON32OP_INVALID && enmOp < HM64ON32OP_END);
5267 Assert(pVCpu->hm.s.vmx.VMCSCache.Write.cValidEntries <= RT_ELEMENTS(pVCpu->hm.s.vmx.VMCSCache.Write.aField));
5268 Assert(pVCpu->hm.s.vmx.VMCSCache.Read.cValidEntries <= RT_ELEMENTS(pVCpu->hm.s.vmx.VMCSCache.Read.aField));
5269
5270#ifdef VBOX_STRICT
5271 for (uint32_t i = 0; i < pVCpu->hm.s.vmx.VMCSCache.Write.cValidEntries; i++)
5272 Assert(hmR0VmxIsValidWriteField(pVCpu->hm.s.vmx.VMCSCache.Write.aField[i]));
5273
5274 for (uint32_t i = 0; i <pVCpu->hm.s.vmx.VMCSCache.Read.cValidEntries; i++)
5275 Assert(hmR0VmxIsValidReadField(pVCpu->hm.s.vmx.VMCSCache.Read.aField[i]));
5276#endif
5277
5278 /* Disable interrupts. */
5279 RTCCUINTREG fOldEFlags = ASMIntDisableFlags();
5280
5281#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
5282 RTCPUID idHostCpu = RTMpCpuId();
5283 CPUMR0SetLApic(pVCpu, idHostCpu);
5284#endif
5285
5286 PHMGLOBALCPUINFO pCpu = hmR0GetCurrentCpu();
5287 RTHCPHYS HCPhysCpuPage = pCpu->HCPhysMemObj;
5288
5289 /* Clear VMCS. Marking it inactive, clearing implementation-specific data and writing VMCS data back to memory. */
5290 VMXClearVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
5291 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_CLEAR;
5292
5293 /* Leave VMX Root Mode. */
5294 VMXDisable();
5295
5296 SUPR0ChangeCR4(0, ~X86_CR4_VMXE);
5297
5298 CPUMSetHyperESP(pVCpu, VMMGetStackRC(pVCpu));
5299 CPUMSetHyperEIP(pVCpu, enmOp);
5300 for (int i = (int)cParams - 1; i >= 0; i--)
5301 CPUMPushHyper(pVCpu, paParam[i]);
5302
5303 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatWorldSwitch3264, z);
5304
5305 /* Call the switcher. */
5306 int rc = pVM->hm.s.pfnHost32ToGuest64R0(pVM, RT_UOFFSETOF_DYN(VM, aCpus[pVCpu->idCpu].cpum) - RT_UOFFSETOF(VM, cpum));
5307 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatWorldSwitch3264, z);
5308
5309 /** @todo replace with hmR0VmxEnterRootMode() and hmR0VmxLeaveRootMode(). */
5310 /* Make sure the VMX instructions don't cause #UD faults. */
5311 SUPR0ChangeCR4(X86_CR4_VMXE, RTCCUINTREG_MAX);
5312
5313 /* Re-enter VMX Root Mode */
5314 int rc2 = VMXEnable(HCPhysCpuPage);
5315 if (RT_FAILURE(rc2))
5316 {
5317 SUPR0ChangeCR4(0, ~X86_CR4_VMXE);
5318 ASMSetFlags(fOldEFlags);
5319 pVM->hm.s.vmx.HCPhysVmxEnableError = HCPhysCpuPage;
5320 return rc2;
5321 }
5322
5323 rc2 = VMXActivateVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
5324 AssertRC(rc2);
5325 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_ACTIVE;
5326 Assert(!(ASMGetFlags() & X86_EFL_IF));
5327 ASMSetFlags(fOldEFlags);
5328 return rc;
5329}
5330
5331
5332/**
5333 * Prepares for and executes VMLAUNCH (64-bit guests) for 32-bit hosts
5334 * supporting 64-bit guests.
5335 *
5336 * @returns VBox status code.
5337 * @param fResume Whether to VMLAUNCH or VMRESUME.
5338 * @param pCtx Pointer to the guest-CPU context.
5339 * @param pCache Pointer to the VMCS cache.
5340 * @param pVM The cross context VM structure.
5341 * @param pVCpu The cross context virtual CPU structure.
5342 */
5343DECLASM(int) VMXR0SwitcherStartVM64(RTHCUINT fResume, PCPUMCTX pCtx, PVMCSCACHE pCache, PVM pVM, PVMCPU pVCpu)
5344{
5345 NOREF(fResume);
5346
5347 PHMGLOBALCPUINFO pCpu = hmR0GetCurrentCpu();
5348 RTHCPHYS HCPhysCpuPage = pCpu->HCPhysMemObj;
5349
5350#ifdef VBOX_WITH_CRASHDUMP_MAGIC
5351 pCache->uPos = 1;
5352 pCache->interPD = PGMGetInterPaeCR3(pVM);
5353 pCache->pSwitcher = (uint64_t)pVM->hm.s.pfnHost32ToGuest64R0;
5354#endif
5355
5356#if defined(DEBUG) && defined(VMX_USE_CACHED_VMCS_ACCESSES)
5357 pCache->TestIn.HCPhysCpuPage = 0;
5358 pCache->TestIn.HCPhysVmcs = 0;
5359 pCache->TestIn.pCache = 0;
5360 pCache->TestOut.HCPhysVmcs = 0;
5361 pCache->TestOut.pCache = 0;
5362 pCache->TestOut.pCtx = 0;
5363 pCache->TestOut.eflags = 0;
5364#else
5365 NOREF(pCache);
5366#endif
5367
5368 uint32_t aParam[10];
5369 aParam[0] = RT_LO_U32(HCPhysCpuPage); /* Param 1: VMXON physical address - Lo. */
5370 aParam[1] = RT_HI_U32(HCPhysCpuPage); /* Param 1: VMXON physical address - Hi. */
5371 aParam[2] = RT_LO_U32(pVCpu->hm.s.vmx.HCPhysVmcs); /* Param 2: VMCS physical address - Lo. */
5372 aParam[3] = RT_HI_U32(pVCpu->hm.s.vmx.HCPhysVmcs); /* Param 2: VMCS physical address - Hi. */
5373 aParam[4] = VM_RC_ADDR(pVM, &pVM->aCpus[pVCpu->idCpu].hm.s.vmx.VMCSCache);
5374 aParam[5] = 0;
5375 aParam[6] = VM_RC_ADDR(pVM, pVM);
5376 aParam[7] = 0;
5377 aParam[8] = VM_RC_ADDR(pVM, pVCpu);
5378 aParam[9] = 0;
5379
5380#ifdef VBOX_WITH_CRASHDUMP_MAGIC
5381 pCtx->dr[4] = pVM->hm.s.vmx.pScratchPhys + 16 + 8;
5382 *(uint32_t *)(pVM->hm.s.vmx.pScratch + 16 + 8) = 1;
5383#endif
5384 int rc = VMXR0Execute64BitsHandler(pVCpu, HM64ON32OP_VMXRCStartVM64, RT_ELEMENTS(aParam), &aParam[0]);
5385
5386#ifdef VBOX_WITH_CRASHDUMP_MAGIC
5387 Assert(*(uint32_t *)(pVM->hm.s.vmx.pScratch + 16 + 8) == 5);
5388 Assert(pCtx->dr[4] == 10);
5389 *(uint32_t *)(pVM->hm.s.vmx.pScratch + 16 + 8) = 0xff;
5390#endif
5391
5392#if defined(DEBUG) && defined(VMX_USE_CACHED_VMCS_ACCESSES)
5393 AssertMsg(pCache->TestIn.HCPhysCpuPage == HCPhysCpuPage, ("%RHp vs %RHp\n", pCache->TestIn.HCPhysCpuPage, HCPhysCpuPage));
5394 AssertMsg(pCache->TestIn.HCPhysVmcs == pVCpu->hm.s.vmx.HCPhysVmcs, ("%RHp vs %RHp\n", pCache->TestIn.HCPhysVmcs,
5395 pVCpu->hm.s.vmx.HCPhysVmcs));
5396 AssertMsg(pCache->TestIn.HCPhysVmcs == pCache->TestOut.HCPhysVmcs, ("%RHp vs %RHp\n", pCache->TestIn.HCPhysVmcs,
5397 pCache->TestOut.HCPhysVmcs));
5398 AssertMsg(pCache->TestIn.pCache == pCache->TestOut.pCache, ("%RGv vs %RGv\n", pCache->TestIn.pCache,
5399 pCache->TestOut.pCache));
5400 AssertMsg(pCache->TestIn.pCache == VM_RC_ADDR(pVM, &pVM->aCpus[pVCpu->idCpu].hm.s.vmx.VMCSCache),
5401 ("%RGv vs %RGv\n", pCache->TestIn.pCache, VM_RC_ADDR(pVM, &pVM->aCpus[pVCpu->idCpu].hm.s.vmx.VMCSCache)));
5402 AssertMsg(pCache->TestIn.pCtx == pCache->TestOut.pCtx, ("%RGv vs %RGv\n", pCache->TestIn.pCtx,
5403 pCache->TestOut.pCtx));
5404 Assert(!(pCache->TestOut.eflags & X86_EFL_IF));
5405#endif
5406 NOREF(pCtx);
5407 return rc;
5408}
5409
5410
5411/**
5412 * Initialize the VMCS-Read cache.
5413 *
5414 * The VMCS cache is used for 32-bit hosts running 64-bit guests (except 32-bit
5415 * Darwin which runs with 64-bit paging in 32-bit mode) for 64-bit fields that
5416 * cannot be accessed in 32-bit mode. Some 64-bit fields -can- be accessed
5417 * (those that have a 32-bit FULL & HIGH part).
5418 *
5419 * @returns VBox status code.
5420 * @param pVCpu The cross context virtual CPU structure.
5421 */
5422static int hmR0VmxInitVmcsReadCache(PVMCPU pVCpu)
5423{
5424#define VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, idxField) \
5425 do { \
5426 Assert(pCache->Read.aField[idxField##_CACHE_IDX] == 0); \
5427 pCache->Read.aField[idxField##_CACHE_IDX] = idxField; \
5428 pCache->Read.aFieldVal[idxField##_CACHE_IDX] = 0; \
5429 ++cReadFields; \
5430 } while (0)
5431
5432 PVMCSCACHE pCache = &pVCpu->hm.s.vmx.VMCSCache;
5433 uint32_t cReadFields = 0;
5434
5435 /*
5436 * Don't remove the #if 0'd fields in this code. They're listed here for consistency
5437 * and serve to indicate exceptions to the rules.
5438 */
5439
5440 /* Guest-natural selector base fields. */
5441#if 0
5442 /* These are 32-bit in practice. See Intel spec. 2.5 "Control Registers". */
5443 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_CR0);
5444 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_CR4);
5445#endif
5446 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_ES_BASE);
5447 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_CS_BASE);
5448 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_SS_BASE);
5449 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_DS_BASE);
5450 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_FS_BASE);
5451 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_GS_BASE);
5452 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_LDTR_BASE);
5453 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_TR_BASE);
5454 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_GDTR_BASE);
5455 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_IDTR_BASE);
5456 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_RSP);
5457 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_RIP);
5458#if 0
5459 /* Unused natural width guest-state fields. */
5460 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_PENDING_DEBUG_XCPTS);
5461 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_CR3); /* Handled in Nested Paging case */
5462#endif
5463 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_SYSENTER_ESP);
5464 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_SYSENTER_EIP);
5465
5466 /* 64-bit guest-state fields; unused as we use two 32-bit VMREADs for
5467 these 64-bit fields (using "FULL" and "HIGH" fields). */
5468#if 0
5469 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_VMCS_LINK_PTR_FULL);
5470 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_DEBUGCTL_FULL);
5471 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PAT_FULL);
5472 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_EFER_FULL);
5473 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PERF_GLOBAL_CTRL_FULL);
5474 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PDPTE0_FULL);
5475 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PDPTE1_FULL);
5476 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PDPTE2_FULL);
5477 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS64_GUEST_PDPTE3_FULL);
5478#endif
5479
5480 /* Natural width guest-state fields. */
5481 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_RO_EXIT_QUALIFICATION);
5482 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_RO_GUEST_LINEAR_ADDR);
5483
5484 if (pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging)
5485 {
5486 VMXLOCAL_INIT_READ_CACHE_FIELD(pCache, VMX_VMCS_GUEST_CR3);
5487 AssertMsg(cReadFields == VMX_VMCS_MAX_NESTED_PAGING_CACHE_IDX, ("cReadFields=%u expected %u\n", cReadFields,
5488 VMX_VMCS_MAX_NESTED_PAGING_CACHE_IDX));
5489 pCache->Read.cValidEntries = VMX_VMCS_MAX_NESTED_PAGING_CACHE_IDX;
5490 }
5491 else
5492 {
5493 AssertMsg(cReadFields == VMX_VMCS_MAX_CACHE_IDX, ("cReadFields=%u expected %u\n", cReadFields, VMX_VMCS_MAX_CACHE_IDX));
5494 pCache->Read.cValidEntries = VMX_VMCS_MAX_CACHE_IDX;
5495 }
5496
5497#undef VMXLOCAL_INIT_READ_CACHE_FIELD
5498 return VINF_SUCCESS;
5499}
5500
5501
5502/**
5503 * Writes a field into the VMCS. This can either directly invoke a VMWRITE or
5504 * queue up the VMWRITE by using the VMCS write cache (on 32-bit hosts, except
5505 * darwin, running 64-bit guests).
5506 *
5507 * @returns VBox status code.
5508 * @param pVCpu The cross context virtual CPU structure.
5509 * @param idxField The VMCS field encoding.
5510 * @param u64Val 16, 32 or 64-bit value.
5511 */
5512VMMR0DECL(int) VMXWriteVmcs64Ex(PVMCPU pVCpu, uint32_t idxField, uint64_t u64Val)
5513{
5514 int rc;
5515 switch (idxField)
5516 {
5517 /*
5518 * These fields consists of a "FULL" and a "HIGH" part which can be written to individually.
5519 */
5520 /* 64-bit Control fields. */
5521 case VMX_VMCS64_CTRL_IO_BITMAP_A_FULL:
5522 case VMX_VMCS64_CTRL_IO_BITMAP_B_FULL:
5523 case VMX_VMCS64_CTRL_MSR_BITMAP_FULL:
5524 case VMX_VMCS64_CTRL_EXIT_MSR_STORE_FULL:
5525 case VMX_VMCS64_CTRL_EXIT_MSR_LOAD_FULL:
5526 case VMX_VMCS64_CTRL_ENTRY_MSR_LOAD_FULL:
5527 case VMX_VMCS64_CTRL_EXEC_VMCS_PTR_FULL:
5528 case VMX_VMCS64_CTRL_TSC_OFFSET_FULL:
5529 case VMX_VMCS64_CTRL_VIRT_APIC_PAGEADDR_FULL:
5530 case VMX_VMCS64_CTRL_APIC_ACCESSADDR_FULL:
5531 case VMX_VMCS64_CTRL_VMFUNC_CTRLS_FULL:
5532 case VMX_VMCS64_CTRL_EPTP_FULL:
5533 case VMX_VMCS64_CTRL_EPTP_LIST_FULL:
5534 /* 64-bit Guest-state fields. */
5535 case VMX_VMCS64_GUEST_VMCS_LINK_PTR_FULL:
5536 case VMX_VMCS64_GUEST_DEBUGCTL_FULL:
5537 case VMX_VMCS64_GUEST_PAT_FULL:
5538 case VMX_VMCS64_GUEST_EFER_FULL:
5539 case VMX_VMCS64_GUEST_PERF_GLOBAL_CTRL_FULL:
5540 case VMX_VMCS64_GUEST_PDPTE0_FULL:
5541 case VMX_VMCS64_GUEST_PDPTE1_FULL:
5542 case VMX_VMCS64_GUEST_PDPTE2_FULL:
5543 case VMX_VMCS64_GUEST_PDPTE3_FULL:
5544 /* 64-bit Host-state fields. */
5545 case VMX_VMCS64_HOST_PAT_FULL:
5546 case VMX_VMCS64_HOST_EFER_FULL:
5547 case VMX_VMCS64_HOST_PERF_GLOBAL_CTRL_FULL:
5548 {
5549 rc = VMXWriteVmcs32(idxField, RT_LO_U32(u64Val));
5550 rc |= VMXWriteVmcs32(idxField + 1, RT_HI_U32(u64Val));
5551 break;
5552 }
5553
5554 /*
5555 * These fields do not have high and low parts. Queue up the VMWRITE by using the VMCS write-cache (for 64-bit
5556 * values). When we switch the host to 64-bit mode for running 64-bit guests, these VMWRITEs get executed then.
5557 */
5558 /* Natural-width Guest-state fields. */
5559 case VMX_VMCS_GUEST_CR3:
5560 case VMX_VMCS_GUEST_ES_BASE:
5561 case VMX_VMCS_GUEST_CS_BASE:
5562 case VMX_VMCS_GUEST_SS_BASE:
5563 case VMX_VMCS_GUEST_DS_BASE:
5564 case VMX_VMCS_GUEST_FS_BASE:
5565 case VMX_VMCS_GUEST_GS_BASE:
5566 case VMX_VMCS_GUEST_LDTR_BASE:
5567 case VMX_VMCS_GUEST_TR_BASE:
5568 case VMX_VMCS_GUEST_GDTR_BASE:
5569 case VMX_VMCS_GUEST_IDTR_BASE:
5570 case VMX_VMCS_GUEST_RSP:
5571 case VMX_VMCS_GUEST_RIP:
5572 case VMX_VMCS_GUEST_SYSENTER_ESP:
5573 case VMX_VMCS_GUEST_SYSENTER_EIP:
5574 {
5575 if (!(RT_HI_U32(u64Val)))
5576 {
5577 /* If this field is 64-bit, VT-x will zero out the top bits. */
5578 rc = VMXWriteVmcs32(idxField, RT_LO_U32(u64Val));
5579 }
5580 else
5581 {
5582 /* Assert that only the 32->64 switcher case should ever come here. */
5583 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests);
5584 rc = VMXWriteCachedVmcsEx(pVCpu, idxField, u64Val);
5585 }
5586 break;
5587 }
5588
5589 default:
5590 {
5591 AssertMsgFailed(("VMXWriteVmcs64Ex: Invalid field %#RX32 (pVCpu=%p u64Val=%#RX64)\n", idxField, pVCpu, u64Val));
5592 rc = VERR_INVALID_PARAMETER;
5593 break;
5594 }
5595 }
5596 AssertRCReturn(rc, rc);
5597 return rc;
5598}
5599
5600
5601/**
5602 * Queue up a VMWRITE by using the VMCS write cache.
5603 * This is only used on 32-bit hosts (except darwin) for 64-bit guests.
5604 *
5605 * @param pVCpu The cross context virtual CPU structure.
5606 * @param idxField The VMCS field encoding.
5607 * @param u64Val 16, 32 or 64-bit value.
5608 */
5609VMMR0DECL(int) VMXWriteCachedVmcsEx(PVMCPU pVCpu, uint32_t idxField, uint64_t u64Val)
5610{
5611 AssertPtr(pVCpu);
5612 PVMCSCACHE pCache = &pVCpu->hm.s.vmx.VMCSCache;
5613
5614 AssertMsgReturn(pCache->Write.cValidEntries < VMCSCACHE_MAX_ENTRY - 1,
5615 ("entries=%u\n", pCache->Write.cValidEntries), VERR_ACCESS_DENIED);
5616
5617 /* Make sure there are no duplicates. */
5618 for (uint32_t i = 0; i < pCache->Write.cValidEntries; i++)
5619 {
5620 if (pCache->Write.aField[i] == idxField)
5621 {
5622 pCache->Write.aFieldVal[i] = u64Val;
5623 return VINF_SUCCESS;
5624 }
5625 }
5626
5627 pCache->Write.aField[pCache->Write.cValidEntries] = idxField;
5628 pCache->Write.aFieldVal[pCache->Write.cValidEntries] = u64Val;
5629 pCache->Write.cValidEntries++;
5630 return VINF_SUCCESS;
5631}
5632#endif /* HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS) */
5633
5634
5635/**
5636 * Sets up the usage of TSC-offsetting and updates the VMCS.
5637 *
5638 * If offsetting is not possible, cause VM-exits on RDTSC(P)s. Also sets up the
5639 * VMX preemption timer.
5640 *
5641 * @returns VBox status code.
5642 * @param pVCpu The cross context virtual CPU structure.
5643 *
5644 * @remarks No-long-jump zone!!!
5645 */
5646static void hmR0VmxUpdateTscOffsettingAndPreemptTimer(PVMCPU pVCpu)
5647{
5648 bool fOffsettedTsc;
5649 bool fParavirtTsc;
5650 PVM pVM = pVCpu->CTX_SUFF(pVM);
5651 uint64_t uTscOffset;
5652 if (pVM->hm.s.vmx.fUsePreemptTimer)
5653 {
5654 uint64_t cTicksToDeadline = TMCpuTickGetDeadlineAndTscOffset(pVM, pVCpu, &uTscOffset, &fOffsettedTsc, &fParavirtTsc);
5655
5656 /* Make sure the returned values have sane upper and lower boundaries. */
5657 uint64_t u64CpuHz = SUPGetCpuHzFromGipBySetIndex(g_pSUPGlobalInfoPage, pVCpu->iHostCpuSet);
5658 cTicksToDeadline = RT_MIN(cTicksToDeadline, u64CpuHz / 64); /* 1/64th of a second */
5659 cTicksToDeadline = RT_MAX(cTicksToDeadline, u64CpuHz / 2048); /* 1/2048th of a second */
5660 cTicksToDeadline >>= pVM->hm.s.vmx.cPreemptTimerShift;
5661
5662 uint32_t cPreemptionTickCount = (uint32_t)RT_MIN(cTicksToDeadline, UINT32_MAX - 16);
5663 int rc = VMXWriteVmcs32(VMX_VMCS32_PREEMPT_TIMER_VALUE, cPreemptionTickCount);
5664 AssertRC(rc);
5665 }
5666 else
5667 fOffsettedTsc = TMCpuTickCanUseRealTSC(pVM, pVCpu, &uTscOffset, &fParavirtTsc);
5668
5669 if (fParavirtTsc)
5670 {
5671 /* Currently neither Hyper-V nor KVM need to update their paravirt. TSC
5672 information before every VM-entry, hence disable it for performance sake. */
5673#if 0
5674 int rc = GIMR0UpdateParavirtTsc(pVM, 0 /* u64Offset */);
5675 AssertRC(rc);
5676#endif
5677 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscParavirt);
5678 }
5679
5680 uint32_t uProcCtls = pVCpu->hm.s.vmx.u32ProcCtls;
5681 if ( fOffsettedTsc
5682 && RT_LIKELY(!pVCpu->hm.s.fDebugWantRdTscExit))
5683 {
5684 if (pVCpu->hm.s.vmx.u64TscOffset != uTscOffset)
5685 {
5686 int rc = VMXWriteVmcs64(VMX_VMCS64_CTRL_TSC_OFFSET_FULL, uTscOffset);
5687 AssertRC(rc);
5688 pVCpu->hm.s.vmx.u64TscOffset = uTscOffset;
5689 }
5690
5691 if (uProcCtls & VMX_PROC_CTLS_RDTSC_EXIT)
5692 {
5693 uProcCtls &= ~VMX_PROC_CTLS_RDTSC_EXIT;
5694 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, uProcCtls);
5695 AssertRC(rc);
5696 pVCpu->hm.s.vmx.u32ProcCtls = uProcCtls;
5697 }
5698 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscOffset);
5699 }
5700 else
5701 {
5702 /* We can't use TSC-offsetting (non-fixed TSC, warp drive active etc.), VM-exit on RDTSC(P). */
5703 if (!(uProcCtls & VMX_PROC_CTLS_RDTSC_EXIT))
5704 {
5705 uProcCtls |= VMX_PROC_CTLS_RDTSC_EXIT;
5706 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, uProcCtls);
5707 AssertRC(rc);
5708 pVCpu->hm.s.vmx.u32ProcCtls = uProcCtls;
5709 }
5710 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscIntercept);
5711 }
5712}
5713
5714
5715/**
5716 * Gets the IEM exception flags for the specified vector and IDT vectoring /
5717 * VM-exit interruption info type.
5718 *
5719 * @returns The IEM exception flags.
5720 * @param uVector The event vector.
5721 * @param uVmxVectorType The VMX event type.
5722 *
5723 * @remarks This function currently only constructs flags required for
5724 * IEMEvaluateRecursiveXcpt and not the complete flags (e.g, error-code
5725 * and CR2 aspects of an exception are not included).
5726 */
5727static uint32_t hmR0VmxGetIemXcptFlags(uint8_t uVector, uint32_t uVmxVectorType)
5728{
5729 uint32_t fIemXcptFlags;
5730 switch (uVmxVectorType)
5731 {
5732 case VMX_IDT_VECTORING_INFO_TYPE_HW_XCPT:
5733 case VMX_IDT_VECTORING_INFO_TYPE_NMI:
5734 fIemXcptFlags = IEM_XCPT_FLAGS_T_CPU_XCPT;
5735 break;
5736
5737 case VMX_IDT_VECTORING_INFO_TYPE_EXT_INT:
5738 fIemXcptFlags = IEM_XCPT_FLAGS_T_EXT_INT;
5739 break;
5740
5741 case VMX_IDT_VECTORING_INFO_TYPE_PRIV_SW_XCPT:
5742 fIemXcptFlags = IEM_XCPT_FLAGS_T_SOFT_INT | IEM_XCPT_FLAGS_ICEBP_INSTR;
5743 break;
5744
5745 case VMX_IDT_VECTORING_INFO_TYPE_SW_XCPT:
5746 {
5747 fIemXcptFlags = IEM_XCPT_FLAGS_T_SOFT_INT;
5748 if (uVector == X86_XCPT_BP)
5749 fIemXcptFlags |= IEM_XCPT_FLAGS_BP_INSTR;
5750 else if (uVector == X86_XCPT_OF)
5751 fIemXcptFlags |= IEM_XCPT_FLAGS_OF_INSTR;
5752 else
5753 {
5754 fIemXcptFlags = 0;
5755 AssertMsgFailed(("Unexpected vector for software int. uVector=%#x", uVector));
5756 }
5757 break;
5758 }
5759
5760 case VMX_IDT_VECTORING_INFO_TYPE_SW_INT:
5761 fIemXcptFlags = IEM_XCPT_FLAGS_T_SOFT_INT;
5762 break;
5763
5764 default:
5765 fIemXcptFlags = 0;
5766 AssertMsgFailed(("Unexpected vector type! uVmxVectorType=%#x uVector=%#x", uVmxVectorType, uVector));
5767 break;
5768 }
5769 return fIemXcptFlags;
5770}
5771
5772
5773/**
5774 * Sets an event as a pending event to be injected into the guest.
5775 *
5776 * @param pVCpu The cross context virtual CPU structure.
5777 * @param u32IntInfo The VM-entry interruption-information field.
5778 * @param cbInstr The VM-entry instruction length in bytes (for software
5779 * interrupts, exceptions and privileged software
5780 * exceptions).
5781 * @param u32ErrCode The VM-entry exception error code.
5782 * @param GCPtrFaultAddress The fault-address (CR2) in case it's a
5783 * page-fault.
5784 *
5785 * @remarks Statistics counter assumes this is a guest event being injected or
5786 * re-injected into the guest, i.e. 'StatInjectPendingReflect' is
5787 * always incremented.
5788 */
5789DECLINLINE(void) hmR0VmxSetPendingEvent(PVMCPU pVCpu, uint32_t u32IntInfo, uint32_t cbInstr, uint32_t u32ErrCode,
5790 RTGCUINTPTR GCPtrFaultAddress)
5791{
5792 Assert(!pVCpu->hm.s.Event.fPending);
5793 pVCpu->hm.s.Event.fPending = true;
5794 pVCpu->hm.s.Event.u64IntInfo = u32IntInfo;
5795 pVCpu->hm.s.Event.u32ErrCode = u32ErrCode;
5796 pVCpu->hm.s.Event.cbInstr = cbInstr;
5797 pVCpu->hm.s.Event.GCPtrFaultAddress = GCPtrFaultAddress;
5798}
5799
5800
5801/**
5802 * Sets a double-fault (\#DF) exception as pending-for-injection into the VM.
5803 *
5804 * @param pVCpu The cross context virtual CPU structure.
5805 */
5806DECLINLINE(void) hmR0VmxSetPendingXcptDF(PVMCPU pVCpu)
5807{
5808 uint32_t const u32IntInfo = RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VECTOR, X86_XCPT_DF)
5809 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_TYPE, VMX_EXIT_INT_INFO_TYPE_HW_XCPT)
5810 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_ERR_CODE_VALID, 1)
5811 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VALID, 1);
5812 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrFaultAddress */);
5813}
5814
5815
5816/**
5817 * Sets an invalid-opcode (\#UD) exception as pending-for-injection into the VM.
5818 *
5819 * @param pVCpu The cross context virtual CPU structure.
5820 */
5821DECLINLINE(void) hmR0VmxSetPendingXcptUD(PVMCPU pVCpu)
5822{
5823 uint32_t const u32IntInfo = RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VECTOR, X86_XCPT_UD)
5824 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_TYPE, VMX_EXIT_INT_INFO_TYPE_HW_XCPT)
5825 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_ERR_CODE_VALID, 0)
5826 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VALID, 1);
5827 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrFaultAddress */);
5828}
5829
5830
5831/**
5832 * Sets a debug (\#DB) exception as pending-for-injection into the VM.
5833 *
5834 * @param pVCpu The cross context virtual CPU structure.
5835 */
5836DECLINLINE(void) hmR0VmxSetPendingXcptDB(PVMCPU pVCpu)
5837{
5838 uint32_t const u32IntInfo = RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VECTOR, X86_XCPT_DB)
5839 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_TYPE, VMX_EXIT_INT_INFO_TYPE_HW_XCPT)
5840 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_ERR_CODE_VALID, 0)
5841 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VALID, 1);
5842 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrFaultAddress */);
5843}
5844
5845
5846#ifdef VBOX_WITH_NESTED_HWVIRT_VMX
5847/**
5848 * Sets a general-protection (\#GP) exception as pending-for-injection into the VM.
5849 *
5850 * @param pVCpu The cross context virtual CPU structure.
5851 * @param u32ErrCode The error code for the general-protection exception.
5852 */
5853DECLINLINE(void) hmR0VmxSetPendingXcptGP(PVMCPU pVCpu, uint32_t u32ErrCode)
5854{
5855 uint32_t const u32IntInfo = RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VECTOR, X86_XCPT_GP)
5856 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_TYPE, VMX_EXIT_INT_INFO_TYPE_HW_XCPT)
5857 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_ERR_CODE_VALID, 1)
5858 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VALID, 1);
5859 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, u32ErrCode, 0 /* GCPtrFaultAddress */);
5860}
5861
5862
5863/**
5864 * Sets a stack (\#SS) exception as pending-for-injection into the VM.
5865 *
5866 * @param pVCpu The cross context virtual CPU structure.
5867 * @param u32ErrCode The error code for the stack exception.
5868 */
5869DECLINLINE(void) hmR0VmxSetPendingXcptSS(PVMCPU pVCpu, uint32_t u32ErrCode)
5870{
5871 uint32_t const u32IntInfo = RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VECTOR, X86_XCPT_SS)
5872 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_TYPE, VMX_EXIT_INT_INFO_TYPE_HW_XCPT)
5873 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_ERR_CODE_VALID, 1)
5874 | RT_BF_MAKE(VMX_BF_ENTRY_INT_INFO_VALID, 1);
5875 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, u32ErrCode, 0 /* GCPtrFaultAddress */);
5876}
5877
5878
5879/**
5880 * Decodes the memory operand of an instruction that caused a VM-exit.
5881 *
5882 * The VM-exit qualification field provides the displacement field for memory
5883 * operand instructions, if any.
5884 *
5885 * @returns Strict VBox status code (i.e. informational status codes too).
5886 * @retval VINF_SUCCESS if the operand was successfully decoded.
5887 * @retval VINF_HM_PENDING_XCPT if an exception was raised while decoding the
5888 * operand.
5889 * @param pVCpu The cross context virtual CPU structure.
5890 * @param uExitInstrInfo The VM-exit instruction information field.
5891 * @param enmMemAccess The memory operand's access type (read or write).
5892 * @param GCPtrDisp The instruction displacement field, if any. For
5893 * RIP-relative addressing pass RIP + displacement here.
5894 * @param pGCPtrMem Where to store the effective destination memory address.
5895 */
5896static VBOXSTRICTRC hmR0VmxDecodeMemOperand(PVMCPU pVCpu, uint32_t uExitInstrInfo, RTGCPTR GCPtrDisp, VMXMEMACCESS enmMemAccess,
5897 PRTGCPTR pGCPtrMem)
5898{
5899 Assert(pGCPtrMem);
5900 Assert(!CPUMIsGuestInRealOrV86Mode(pVCpu));
5901 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_RIP | CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK | CPUMCTX_EXTRN_EFER
5902 | CPUMCTX_EXTRN_CR0);
5903
5904 static uint64_t const s_auAddrSizeMasks[] = { UINT64_C(0xffff), UINT64_C(0xffffffff), UINT64_C(0xffffffffffffffff) };
5905 static uint64_t const s_auAccessSizeMasks[] = { sizeof(uint16_t), sizeof(uint32_t), sizeof(uint64_t) };
5906 AssertCompile(RT_ELEMENTS(s_auAccessSizeMasks) == RT_ELEMENTS(s_auAddrSizeMasks));
5907
5908 VMXEXITINSTRINFO ExitInstrInfo;
5909 ExitInstrInfo.u = uExitInstrInfo;
5910 uint8_t const uAddrSize = ExitInstrInfo.All.u3AddrSize;
5911 uint8_t const iSegReg = ExitInstrInfo.All.iSegReg;
5912 bool const fIdxRegValid = !ExitInstrInfo.All.fIdxRegInvalid;
5913 uint8_t const iIdxReg = ExitInstrInfo.All.iIdxReg;
5914 uint8_t const uScale = ExitInstrInfo.All.u2Scaling;
5915 bool const fBaseRegValid = !ExitInstrInfo.All.fBaseRegInvalid;
5916 uint8_t const iBaseReg = ExitInstrInfo.All.iBaseReg;
5917 bool const fIsMemOperand = !ExitInstrInfo.All.fIsRegOperand;
5918 bool const fIsLongMode = CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx);
5919
5920 /*
5921 * Validate instruction information.
5922 * This shouldn't happen on real hardware but useful while testing our nested hardware-virtualization code.
5923 */
5924 AssertLogRelMsgReturn(uAddrSize < RT_ELEMENTS(s_auAddrSizeMasks),
5925 ("Invalid address size. ExitInstrInfo=%#RX32\n", ExitInstrInfo.u), VERR_VMX_IPE_1);
5926 AssertLogRelMsgReturn(iSegReg < X86_SREG_COUNT,
5927 ("Invalid segment register. ExitInstrInfo=%#RX32\n", ExitInstrInfo.u), VERR_VMX_IPE_2);
5928 AssertLogRelMsgReturn(fIsMemOperand,
5929 ("Expected memory operand. ExitInstrInfo=%#RX32\n", ExitInstrInfo.u), VERR_VMX_IPE_3);
5930
5931 /*
5932 * Compute the complete effective address.
5933 *
5934 * See AMD instruction spec. 1.4.2 "SIB Byte Format"
5935 * See AMD spec. 4.5.2 "Segment Registers".
5936 */
5937 RTGCPTR GCPtrMem = GCPtrDisp;
5938 if (fBaseRegValid)
5939 GCPtrMem += pVCpu->cpum.GstCtx.aGRegs[iBaseReg].u64;
5940 if (fIdxRegValid)
5941 GCPtrMem += pVCpu->cpum.GstCtx.aGRegs[iIdxReg].u64 << uScale;
5942
5943 RTGCPTR const GCPtrOff = GCPtrMem;
5944 if ( !fIsLongMode
5945 || iSegReg >= X86_SREG_FS)
5946 GCPtrMem += pVCpu->cpum.GstCtx.aSRegs[iSegReg].u64Base;
5947 GCPtrMem &= s_auAddrSizeMasks[uAddrSize];
5948
5949 /*
5950 * Validate effective address.
5951 * See AMD spec. 4.5.3 "Segment Registers in 64-Bit Mode".
5952 */
5953 uint8_t const cbAccess = s_auAccessSizeMasks[uAddrSize];
5954 Assert(cbAccess > 0);
5955 if (fIsLongMode)
5956 {
5957 if (X86_IS_CANONICAL(GCPtrMem))
5958 {
5959 *pGCPtrMem = GCPtrMem;
5960 return VINF_SUCCESS;
5961 }
5962
5963 /** @todo r=ramshankar: We should probably raise \#SS or \#GP. See AMD spec. 4.12.2
5964 * "Data Limit Checks in 64-bit Mode". */
5965 Log4Func(("Long mode effective address is not canonical GCPtrMem=%#RX64\n", GCPtrMem));
5966 hmR0VmxSetPendingXcptGP(pVCpu, 0);
5967 return VINF_HM_PENDING_XCPT;
5968 }
5969
5970 /*
5971 * This is a watered down version of iemMemApplySegment().
5972 * Parts that are not applicable for VMX instructions like real-or-v8086 mode
5973 * and segment CPL/DPL checks are skipped.
5974 */
5975 RTGCPTR32 const GCPtrFirst32 = (RTGCPTR32)GCPtrOff;
5976 RTGCPTR32 const GCPtrLast32 = GCPtrFirst32 + cbAccess - 1;
5977 PCCPUMSELREG pSel = &pVCpu->cpum.GstCtx.aSRegs[iSegReg];
5978
5979 /* Check if the segment is present and usable. */
5980 if ( pSel->Attr.n.u1Present
5981 && !pSel->Attr.n.u1Unusable)
5982 {
5983 Assert(pSel->Attr.n.u1DescType);
5984 if (!(pSel->Attr.n.u4Type & X86_SEL_TYPE_CODE))
5985 {
5986 /* Check permissions for the data segment. */
5987 if ( enmMemAccess == VMXMEMACCESS_WRITE
5988 && !(pSel->Attr.n.u4Type & X86_SEL_TYPE_WRITE))
5989 {
5990 Log4Func(("Data segment access invalid. iSegReg=%#x Attr=%#RX32\n", iSegReg, pSel->Attr.u));
5991 hmR0VmxSetPendingXcptGP(pVCpu, iSegReg);
5992 return VINF_HM_PENDING_XCPT;
5993 }
5994
5995 /* Check limits if it's a normal data segment. */
5996 if (!(pSel->Attr.n.u4Type & X86_SEL_TYPE_DOWN))
5997 {
5998 if ( GCPtrFirst32 > pSel->u32Limit
5999 || GCPtrLast32 > pSel->u32Limit)
6000 {
6001 Log4Func(("Data segment limit exceeded."
6002 "iSegReg=%#x GCPtrFirst32=%#RX32 GCPtrLast32=%#RX32 u32Limit=%#RX32\n", iSegReg, GCPtrFirst32,
6003 GCPtrLast32, pSel->u32Limit));
6004 if (iSegReg == X86_SREG_SS)
6005 hmR0VmxSetPendingXcptSS(pVCpu, 0);
6006 else
6007 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6008 return VINF_HM_PENDING_XCPT;
6009 }
6010 }
6011 else
6012 {
6013 /* Check limits if it's an expand-down data segment.
6014 Note! The upper boundary is defined by the B bit, not the G bit! */
6015 if ( GCPtrFirst32 < pSel->u32Limit + UINT32_C(1)
6016 || GCPtrLast32 > (pSel->Attr.n.u1DefBig ? UINT32_MAX : UINT32_C(0xffff)))
6017 {
6018 Log4Func(("Expand-down data segment limit exceeded."
6019 "iSegReg=%#x GCPtrFirst32=%#RX32 GCPtrLast32=%#RX32 u32Limit=%#RX32\n", iSegReg, GCPtrFirst32,
6020 GCPtrLast32, pSel->u32Limit));
6021 if (iSegReg == X86_SREG_SS)
6022 hmR0VmxSetPendingXcptSS(pVCpu, 0);
6023 else
6024 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6025 return VINF_HM_PENDING_XCPT;
6026 }
6027 }
6028 }
6029 else
6030 {
6031 /* Check permissions for the code segment. */
6032 if ( enmMemAccess == VMXMEMACCESS_WRITE
6033 || ( enmMemAccess == VMXMEMACCESS_READ
6034 && !(pSel->Attr.n.u4Type & X86_SEL_TYPE_READ)))
6035 {
6036 Log4Func(("Code segment access invalid. Attr=%#RX32\n", pSel->Attr.u));
6037 Assert(!CPUMIsGuestInRealOrV86ModeEx(&pVCpu->cpum.GstCtx));
6038 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6039 return VINF_HM_PENDING_XCPT;
6040 }
6041
6042 /* Check limits for the code segment (normal/expand-down not applicable for code segments). */
6043 if ( GCPtrFirst32 > pSel->u32Limit
6044 || GCPtrLast32 > pSel->u32Limit)
6045 {
6046 Log4Func(("Code segment limit exceeded. GCPtrFirst32=%#RX32 GCPtrLast32=%#RX32 u32Limit=%#RX32\n",
6047 GCPtrFirst32, GCPtrLast32, pSel->u32Limit));
6048 if (iSegReg == X86_SREG_SS)
6049 hmR0VmxSetPendingXcptSS(pVCpu, 0);
6050 else
6051 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6052 return VINF_HM_PENDING_XCPT;
6053 }
6054 }
6055 }
6056 else
6057 {
6058 Log4Func(("Not present or unusable segment. iSegReg=%#x Attr=%#RX32\n", iSegReg, pSel->Attr.u));
6059 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6060 return VINF_HM_PENDING_XCPT;
6061 }
6062
6063 *pGCPtrMem = GCPtrMem;
6064 return VINF_SUCCESS;
6065}
6066
6067
6068/**
6069 * Perform the relevant VMX instruction checks for VM-exits that occurred due to the
6070 * guest attempting to execute a VMX instruction.
6071 *
6072 * @returns Strict VBox status code (i.e. informational status codes too).
6073 * @retval VINF_SUCCESS if we should continue handling the VM-exit.
6074 * @retval VINF_HM_PENDING_XCPT if an exception was raised.
6075 *
6076 * @param pVCpu The cross context virtual CPU structure.
6077 * @param uExitReason The VM-exit reason.
6078 *
6079 * @todo NstVmx: Document other error codes when VM-exit is implemented.
6080 * @remarks No-long-jump zone!!!
6081 */
6082static VBOXSTRICTRC hmR0VmxCheckExitDueToVmxInstr(PVMCPU pVCpu, uint32_t uExitReason)
6083{
6084 HMVMX_CPUMCTX_ASSERT(pVCpu, CPUMCTX_EXTRN_CR4 | CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_RFLAGS | CPUMCTX_EXTRN_SS
6085 | CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_EFER);
6086
6087 if ( CPUMIsGuestInRealOrV86ModeEx(&pVCpu->cpum.GstCtx)
6088 || ( CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx)
6089 && !CPUMIsGuestIn64BitCodeEx(&pVCpu->cpum.GstCtx)))
6090 {
6091 Log4Func(("In real/v86-mode or long-mode outside 64-bit code segment -> #UD\n"));
6092 hmR0VmxSetPendingXcptUD(pVCpu);
6093 return VINF_HM_PENDING_XCPT;
6094 }
6095
6096 if (uExitReason == VMX_EXIT_VMXON)
6097 {
6098 /*
6099 * We check CR4.VMXE because it is required to be always set while in VMX operation
6100 * by physical CPUs and our CR4 read shadow is only consulted when executing specific
6101 * instructions (CLTS, LMSW, MOV CR, and SMSW) and thus doesn't affect CPU operation
6102 * otherwise (i.e. physical CPU won't automatically #UD if Cr4Shadow.VMXE is 0).
6103 */
6104 if (!CPUMIsGuestVmxEnabled(&pVCpu->cpum.GstCtx))
6105 {
6106 Log4Func(("CR4.VMXE is not set -> #UD\n"));
6107 hmR0VmxSetPendingXcptUD(pVCpu);
6108 return VINF_HM_PENDING_XCPT;
6109 }
6110 }
6111 else if (!CPUMIsGuestInVmxRootMode(&pVCpu->cpum.GstCtx))
6112 {
6113 /*
6114 * The guest has not entered VMX operation but attempted to execute a VMX instruction
6115 * (other than VMXON), we need to raise a #UD.
6116 */
6117 Log4Func(("Not in VMX root mode -> #UD\n"));
6118 hmR0VmxSetPendingXcptUD(pVCpu);
6119 return VINF_HM_PENDING_XCPT;
6120 }
6121
6122 if (CPUMIsGuestInVmxNonRootMode(&pVCpu->cpum.GstCtx))
6123 {
6124 /*
6125 * The nested-guest attempted to execute a VMX instruction, cause a VM-exit and let
6126 * the guest hypervisor deal with it.
6127 */
6128 /** @todo NSTVMX: Trigger a VM-exit */
6129 }
6130
6131 /*
6132 * VMX instructions require CPL 0 except in VMX non-root mode where the VM-exit intercept
6133 * (above) takes preceedence over the CPL check.
6134 */
6135 if (CPUMGetGuestCPL(pVCpu) > 0)
6136 {
6137 Log4Func(("CPL > 0 -> #GP(0)\n"));
6138 hmR0VmxSetPendingXcptGP(pVCpu, 0);
6139 return VINF_HM_PENDING_XCPT;
6140 }
6141
6142 return VINF_SUCCESS;
6143}
6144
6145#endif /* VBOX_WITH_NESTED_HWVIRT_VMX */
6146
6147
6148/**
6149 * Handle a condition that occurred while delivering an event through the guest
6150 * IDT.
6151 *
6152 * @returns Strict VBox status code (i.e. informational status codes too).
6153 * @retval VINF_SUCCESS if we should continue handling the VM-exit.
6154 * @retval VINF_HM_DOUBLE_FAULT if a \#DF condition was detected and we ought
6155 * to continue execution of the guest which will delivery the \#DF.
6156 * @retval VINF_EM_RESET if we detected a triple-fault condition.
6157 * @retval VERR_EM_GUEST_CPU_HANG if we detected a guest CPU hang.
6158 *
6159 * @param pVCpu The cross context virtual CPU structure.
6160 * @param pVmxTransient Pointer to the VMX transient structure.
6161 *
6162 * @remarks No-long-jump zone!!!
6163 */
6164static VBOXSTRICTRC hmR0VmxCheckExitDueToEventDelivery(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
6165{
6166 uint32_t const uExitVector = VMX_EXIT_INT_INFO_VECTOR(pVmxTransient->uExitIntInfo);
6167
6168 int rc2 = hmR0VmxReadIdtVectoringInfoVmcs(pVmxTransient);
6169 rc2 |= hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
6170 AssertRCReturn(rc2, rc2);
6171
6172 VBOXSTRICTRC rcStrict = VINF_SUCCESS;
6173 if (VMX_IDT_VECTORING_INFO_IS_VALID(pVmxTransient->uIdtVectoringInfo))
6174 {
6175 uint32_t const uIdtVectorType = VMX_IDT_VECTORING_INFO_TYPE(pVmxTransient->uIdtVectoringInfo);
6176 uint32_t const uIdtVector = VMX_IDT_VECTORING_INFO_VECTOR(pVmxTransient->uIdtVectoringInfo);
6177
6178 /*
6179 * If the event was a software interrupt (generated with INT n) or a software exception
6180 * (generated by INT3/INTO) or a privileged software exception (generated by INT1), we
6181 * can handle the VM-exit and continue guest execution which will re-execute the
6182 * instruction rather than re-injecting the exception, as that can cause premature
6183 * trips to ring-3 before injection and involve TRPM which currently has no way of
6184 * storing that these exceptions were caused by these instructions (ICEBP's #DB poses
6185 * the problem).
6186 */
6187 IEMXCPTRAISE enmRaise;
6188 IEMXCPTRAISEINFO fRaiseInfo;
6189 if ( uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_SW_INT
6190 || uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_SW_XCPT
6191 || uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_PRIV_SW_XCPT)
6192 {
6193 enmRaise = IEMXCPTRAISE_REEXEC_INSTR;
6194 fRaiseInfo = IEMXCPTRAISEINFO_NONE;
6195 }
6196 else if (VMX_EXIT_INT_INFO_IS_VALID(pVmxTransient->uExitIntInfo))
6197 {
6198 uint32_t const uExitVectorType = VMX_IDT_VECTORING_INFO_TYPE(pVmxTransient->uExitIntInfo);
6199 uint32_t const fIdtVectorFlags = hmR0VmxGetIemXcptFlags(uIdtVector, uIdtVectorType);
6200 uint32_t const fExitVectorFlags = hmR0VmxGetIemXcptFlags(uExitVector, uExitVectorType);
6201 /** @todo Make AssertMsgReturn as just AssertMsg later. */
6202 AssertMsgReturn(uExitVectorType == VMX_EXIT_INT_INFO_TYPE_HW_XCPT,
6203 ("hmR0VmxCheckExitDueToEventDelivery: Unexpected VM-exit interruption info. %#x!\n",
6204 uExitVectorType), VERR_VMX_IPE_5);
6205
6206 enmRaise = IEMEvaluateRecursiveXcpt(pVCpu, fIdtVectorFlags, uIdtVector, fExitVectorFlags, uExitVector, &fRaiseInfo);
6207
6208 /* Determine a vectoring #PF condition, see comment in hmR0VmxExitXcptPF(). */
6209 if (fRaiseInfo & (IEMXCPTRAISEINFO_EXT_INT_PF | IEMXCPTRAISEINFO_NMI_PF))
6210 {
6211 pVmxTransient->fVectoringPF = true;
6212 enmRaise = IEMXCPTRAISE_PREV_EVENT;
6213 }
6214 }
6215 else
6216 {
6217 /*
6218 * If an exception or hardware interrupt delivery caused an EPT violation/misconfig or APIC access
6219 * VM-exit, then the VM-exit interruption-information will not be valid and we end up here.
6220 * It is sufficient to reflect the original event to the guest after handling the VM-exit.
6221 */
6222 Assert( uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_HW_XCPT
6223 || uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_NMI
6224 || uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_EXT_INT);
6225 enmRaise = IEMXCPTRAISE_PREV_EVENT;
6226 fRaiseInfo = IEMXCPTRAISEINFO_NONE;
6227 }
6228
6229 /*
6230 * On CPUs that support Virtual NMIs, if this VM-exit (be it an exception or EPT violation/misconfig
6231 * etc.) occurred while delivering the NMI, we need to clear the block-by-NMI field in the guest
6232 * interruptibility-state before re-delivering the NMI after handling the VM-exit. Otherwise the
6233 * subsequent VM-entry would fail.
6234 *
6235 * See Intel spec. 30.7.1.2 "Resuming Guest Software after Handling an Exception". See @bugref{7445}.
6236 */
6237 if ( VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS)
6238 && uIdtVectorType == VMX_IDT_VECTORING_INFO_TYPE_NMI
6239 && ( enmRaise == IEMXCPTRAISE_PREV_EVENT
6240 || (fRaiseInfo & IEMXCPTRAISEINFO_NMI_PF))
6241 && (pVCpu->hm.s.vmx.u32PinCtls & VMX_PIN_CTLS_VIRT_NMI))
6242 {
6243 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_BLOCK_NMIS);
6244 }
6245
6246 switch (enmRaise)
6247 {
6248 case IEMXCPTRAISE_CURRENT_XCPT:
6249 {
6250 Log4Func(("IDT: Pending secondary Xcpt: uIdtVectoringInfo=%#RX64 uExitIntInfo=%#RX64\n",
6251 pVmxTransient->uIdtVectoringInfo, pVmxTransient->uExitIntInfo));
6252 Assert(rcStrict == VINF_SUCCESS);
6253 break;
6254 }
6255
6256 case IEMXCPTRAISE_PREV_EVENT:
6257 {
6258 uint32_t u32ErrCode;
6259 if (VMX_IDT_VECTORING_INFO_IS_ERROR_CODE_VALID(pVmxTransient->uIdtVectoringInfo))
6260 {
6261 rc2 = hmR0VmxReadIdtVectoringErrorCodeVmcs(pVmxTransient);
6262 AssertRCReturn(rc2, rc2);
6263 u32ErrCode = pVmxTransient->uIdtVectoringErrorCode;
6264 }
6265 else
6266 u32ErrCode = 0;
6267
6268 /* If uExitVector is #PF, CR2 value will be updated from the VMCS if it's a guest #PF, see hmR0VmxExitXcptPF(). */
6269 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingReflect);
6270 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_IDT_INFO(pVmxTransient->uIdtVectoringInfo),
6271 0 /* cbInstr */, u32ErrCode, pVCpu->cpum.GstCtx.cr2);
6272
6273 Log4Func(("IDT: Pending vectoring event %#RX64 Err=%#RX32\n", pVCpu->hm.s.Event.u64IntInfo,
6274 pVCpu->hm.s.Event.u32ErrCode));
6275 Assert(rcStrict == VINF_SUCCESS);
6276 break;
6277 }
6278
6279 case IEMXCPTRAISE_REEXEC_INSTR:
6280 Assert(rcStrict == VINF_SUCCESS);
6281 break;
6282
6283 case IEMXCPTRAISE_DOUBLE_FAULT:
6284 {
6285 /*
6286 * Determing a vectoring double #PF condition. Used later, when PGM evaluates the
6287 * second #PF as a guest #PF (and not a shadow #PF) and needs to be converted into a #DF.
6288 */
6289 if (fRaiseInfo & IEMXCPTRAISEINFO_PF_PF)
6290 {
6291 pVmxTransient->fVectoringDoublePF = true;
6292 Log4Func(("IDT: Vectoring double #PF %#RX64 cr2=%#RX64\n", pVCpu->hm.s.Event.u64IntInfo,
6293 pVCpu->cpum.GstCtx.cr2));
6294 rcStrict = VINF_SUCCESS;
6295 }
6296 else
6297 {
6298 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingReflect);
6299 hmR0VmxSetPendingXcptDF(pVCpu);
6300 Log4Func(("IDT: Pending vectoring #DF %#RX64 uIdtVector=%#x uExitVector=%#x\n", pVCpu->hm.s.Event.u64IntInfo,
6301 uIdtVector, uExitVector));
6302 rcStrict = VINF_HM_DOUBLE_FAULT;
6303 }
6304 break;
6305 }
6306
6307 case IEMXCPTRAISE_TRIPLE_FAULT:
6308 {
6309 Log4Func(("IDT: Pending vectoring triple-fault uIdt=%#x uExit=%#x\n", uIdtVector, uExitVector));
6310 rcStrict = VINF_EM_RESET;
6311 break;
6312 }
6313
6314 case IEMXCPTRAISE_CPU_HANG:
6315 {
6316 Log4Func(("IDT: Bad guest! Entering CPU hang. fRaiseInfo=%#x\n", fRaiseInfo));
6317 rcStrict = VERR_EM_GUEST_CPU_HANG;
6318 break;
6319 }
6320
6321 default:
6322 {
6323 AssertMsgFailed(("IDT: vcpu[%RU32] Unexpected/invalid value! enmRaise=%#x\n", pVCpu->idCpu, enmRaise));
6324 rcStrict = VERR_VMX_IPE_2;
6325 break;
6326 }
6327 }
6328 }
6329 else if ( VMX_EXIT_INT_INFO_IS_VALID(pVmxTransient->uExitIntInfo)
6330 && VMX_EXIT_INT_INFO_IS_NMI_UNBLOCK_IRET(pVmxTransient->uExitIntInfo)
6331 && uExitVector != X86_XCPT_DF
6332 && (pVCpu->hm.s.vmx.u32PinCtls & VMX_PIN_CTLS_VIRT_NMI))
6333 {
6334 /*
6335 * Execution of IRET caused this fault when NMI blocking was in effect (i.e we're in the guest NMI handler).
6336 * We need to set the block-by-NMI field so that NMIs remain blocked until the IRET execution is restarted.
6337 * See Intel spec. 30.7.1.2 "Resuming guest software after handling an exception".
6338 */
6339 if (!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS))
6340 {
6341 Log4Func(("Setting VMCPU_FF_BLOCK_NMIS. fValid=%RTbool uExitReason=%u\n",
6342 VMX_EXIT_INT_INFO_IS_VALID(pVmxTransient->uExitIntInfo), pVmxTransient->uExitReason));
6343 VMCPU_FF_SET(pVCpu, VMCPU_FF_BLOCK_NMIS);
6344 }
6345 }
6346
6347 Assert( rcStrict == VINF_SUCCESS || rcStrict == VINF_HM_DOUBLE_FAULT
6348 || rcStrict == VINF_EM_RESET || rcStrict == VERR_EM_GUEST_CPU_HANG);
6349 return rcStrict;
6350}
6351
6352
6353/**
6354 * Imports a guest segment register from the current VMCS into
6355 * the guest-CPU context.
6356 *
6357 * @returns VBox status code.
6358 * @param pVCpu The cross context virtual CPU structure.
6359 * @param idxSel Index of the selector in the VMCS.
6360 * @param idxLimit Index of the segment limit in the VMCS.
6361 * @param idxBase Index of the segment base in the VMCS.
6362 * @param idxAccess Index of the access rights of the segment in the VMCS.
6363 * @param pSelReg Pointer to the segment selector.
6364 *
6365 * @remarks Called with interrupts and/or preemption disabled, try not to assert and
6366 * do not log!
6367 *
6368 * @remarks Never call this function directly!!! Use the
6369 * HMVMX_IMPORT_SREG() macro as that takes care
6370 * of whether to read from the VMCS cache or not.
6371 */
6372static int hmR0VmxImportGuestSegmentReg(PVMCPU pVCpu, uint32_t idxSel, uint32_t idxLimit, uint32_t idxBase, uint32_t idxAccess,
6373 PCPUMSELREG pSelReg)
6374{
6375 NOREF(pVCpu);
6376
6377 uint32_t u32Sel;
6378 uint32_t u32Limit;
6379 uint32_t u32Attr;
6380 uint64_t u64Base;
6381 int rc = VMXReadVmcs32(idxSel, &u32Sel);
6382 rc |= VMXReadVmcs32(idxLimit, &u32Limit);
6383 rc |= VMXReadVmcs32(idxAccess, &u32Attr);
6384 rc |= VMXReadVmcsGstNByIdxVal(idxBase, &u64Base);
6385 AssertRCReturn(rc, rc);
6386
6387 pSelReg->Sel = (uint16_t)u32Sel;
6388 pSelReg->ValidSel = (uint16_t)u32Sel;
6389 pSelReg->fFlags = CPUMSELREG_FLAGS_VALID;
6390 pSelReg->u32Limit = u32Limit;
6391 pSelReg->u64Base = u64Base;
6392 pSelReg->Attr.u = u32Attr;
6393
6394 /*
6395 * If VT-x marks the segment as unusable, most other bits remain undefined:
6396 * - For CS the L, D and G bits have meaning.
6397 * - For SS the DPL has meaning (it -is- the CPL for Intel and VBox).
6398 * - For the remaining data segments no bits are defined.
6399 *
6400 * The present bit and the unusable bit has been observed to be set at the
6401 * same time (the selector was supposed to be invalid as we started executing
6402 * a V8086 interrupt in ring-0).
6403 *
6404 * What should be important for the rest of the VBox code, is that the P bit is
6405 * cleared. Some of the other VBox code recognizes the unusable bit, but
6406 * AMD-V certainly don't, and REM doesn't really either. So, to be on the
6407 * safe side here, we'll strip off P and other bits we don't care about. If
6408 * any code breaks because Attr.u != 0 when Sel < 4, it should be fixed.
6409 *
6410 * See Intel spec. 27.3.2 "Saving Segment Registers and Descriptor-Table Registers".
6411 */
6412 if (pSelReg->Attr.u & X86DESCATTR_UNUSABLE)
6413 {
6414 Assert(idxSel != VMX_VMCS16_GUEST_TR_SEL); /* TR is the only selector that can never be unusable. */
6415
6416 /* Masking off: X86DESCATTR_P, X86DESCATTR_LIMIT_HIGH, and X86DESCATTR_AVL. The latter two are really irrelevant. */
6417 pSelReg->Attr.u &= X86DESCATTR_UNUSABLE | X86DESCATTR_L | X86DESCATTR_D | X86DESCATTR_G
6418 | X86DESCATTR_DPL | X86DESCATTR_TYPE | X86DESCATTR_DT;
6419#ifdef VBOX_STRICT
6420 VMMRZCallRing3Disable(pVCpu);
6421 Log4Func(("Unusable idxSel=%#x attr=%#x -> %#x\n", idxSel, u32Sel, pSelReg->Attr.u));
6422# ifdef DEBUG_bird
6423 AssertMsg((u32Attr & ~X86DESCATTR_P) == pSelReg->Attr.u,
6424 ("%#x: %#x != %#x (sel=%#x base=%#llx limit=%#x)\n",
6425 idxSel, u32Sel, pSelReg->Attr.u, pSelReg->Sel, pSelReg->u64Base, pSelReg->u32Limit));
6426# endif
6427 VMMRZCallRing3Enable(pVCpu);
6428#endif
6429 }
6430 return VINF_SUCCESS;
6431}
6432
6433
6434/**
6435 * Imports the guest RIP from the VMCS back into the guest-CPU context.
6436 *
6437 * @returns VBox status code.
6438 * @param pVCpu The cross context virtual CPU structure.
6439 *
6440 * @remarks Called with interrupts and/or preemption disabled, should not assert!
6441 * @remarks Do -not- call this function directly, use hmR0VmxImportGuestState()
6442 * instead!!!
6443 */
6444DECLINLINE(int) hmR0VmxImportGuestRip(PVMCPU pVCpu)
6445{
6446 uint64_t u64Val;
6447 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
6448 if (pCtx->fExtrn & CPUMCTX_EXTRN_RIP)
6449 {
6450 int rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_RIP, &u64Val);
6451 if (RT_SUCCESS(rc))
6452 {
6453 pCtx->rip = u64Val;
6454 EMR0HistoryUpdatePC(pVCpu, pCtx->rip, false);
6455 pCtx->fExtrn &= ~CPUMCTX_EXTRN_RIP;
6456 }
6457 return rc;
6458 }
6459 return VINF_SUCCESS;
6460}
6461
6462
6463/**
6464 * Imports the guest RFLAGS from the VMCS back into the guest-CPU context.
6465 *
6466 * @returns VBox status code.
6467 * @param pVCpu The cross context virtual CPU structure.
6468 *
6469 * @remarks Called with interrupts and/or preemption disabled, should not assert!
6470 * @remarks Do -not- call this function directly, use hmR0VmxImportGuestState()
6471 * instead!!!
6472 */
6473DECLINLINE(int) hmR0VmxImportGuestRFlags(PVMCPU pVCpu)
6474{
6475 uint32_t u32Val;
6476 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
6477 if (pCtx->fExtrn & CPUMCTX_EXTRN_RFLAGS)
6478 {
6479 int rc = VMXReadVmcs32(VMX_VMCS_GUEST_RFLAGS, &u32Val);
6480 if (RT_SUCCESS(rc))
6481 {
6482 pCtx->eflags.u32 = u32Val;
6483
6484 /* Restore eflags for real-on-v86-mode hack. */
6485 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6486 {
6487 pCtx->eflags.Bits.u1VM = 0;
6488 pCtx->eflags.Bits.u2IOPL = pVCpu->hm.s.vmx.RealMode.Eflags.Bits.u2IOPL;
6489 }
6490 }
6491 pCtx->fExtrn &= ~CPUMCTX_EXTRN_RFLAGS;
6492 return rc;
6493 }
6494 return VINF_SUCCESS;
6495}
6496
6497
6498/**
6499 * Imports the guest interruptibility-state from the VMCS back into the guest-CPU
6500 * context.
6501 *
6502 * @returns VBox status code.
6503 * @param pVCpu The cross context virtual CPU structure.
6504 *
6505 * @remarks Called with interrupts and/or preemption disabled, try not to assert and
6506 * do not log!
6507 * @remarks Do -not- call this function directly, use hmR0VmxImportGuestState()
6508 * instead!!!
6509 */
6510DECLINLINE(int) hmR0VmxImportGuestIntrState(PVMCPU pVCpu)
6511{
6512 uint32_t u32Val;
6513 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
6514 int rc = VMXReadVmcs32(VMX_VMCS32_GUEST_INT_STATE, &u32Val);
6515 AssertRCReturn(rc, rc);
6516
6517 /*
6518 * We additionally have a requirement to import RIP, RFLAGS depending on whether we
6519 * might need them in hmR0VmxEvaluatePendingEvent().
6520 */
6521 if (!u32Val)
6522 {
6523 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
6524 {
6525 rc = hmR0VmxImportGuestRip(pVCpu);
6526 rc |= hmR0VmxImportGuestRFlags(pVCpu);
6527 AssertRCReturn(rc, rc);
6528 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
6529 }
6530
6531 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS))
6532 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_BLOCK_NMIS);
6533 }
6534 else
6535 {
6536 rc = hmR0VmxImportGuestRip(pVCpu);
6537 rc |= hmR0VmxImportGuestRFlags(pVCpu);
6538 AssertRCReturn(rc, rc);
6539
6540 if (u32Val & ( VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS
6541 | VMX_VMCS_GUEST_INT_STATE_BLOCK_STI))
6542 {
6543 EMSetInhibitInterruptsPC(pVCpu, pCtx->rip);
6544 }
6545 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
6546 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
6547
6548 if (u32Val & VMX_VMCS_GUEST_INT_STATE_BLOCK_NMI)
6549 {
6550 if (!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS))
6551 VMCPU_FF_SET(pVCpu, VMCPU_FF_BLOCK_NMIS);
6552 }
6553 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS))
6554 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_BLOCK_NMIS);
6555 }
6556
6557 return VINF_SUCCESS;
6558}
6559
6560
6561/**
6562 * Worker for VMXR0ImportStateOnDemand.
6563 *
6564 * @returns VBox status code.
6565 * @param pVCpu The cross context virtual CPU structure.
6566 * @param fWhat What to import, CPUMCTX_EXTRN_XXX.
6567 */
6568static int hmR0VmxImportGuestState(PVMCPU pVCpu, uint64_t fWhat)
6569{
6570#define VMXLOCAL_BREAK_RC(a_rc) \
6571 if (RT_FAILURE(a_rc)) \
6572 break
6573
6574 int rc = VINF_SUCCESS;
6575 PVM pVM = pVCpu->CTX_SUFF(pVM);
6576 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
6577 uint64_t u64Val;
6578 uint32_t u32Val;
6579
6580 Log4Func(("fExtrn=%#RX64 fWhat=%#RX64\n", pCtx->fExtrn, fWhat));
6581 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatImportGuestState, x);
6582
6583 /*
6584 * We disable interrupts to make the updating of the state and in particular
6585 * the fExtrn modification atomic wrt to preemption hooks.
6586 */
6587 RTCCUINTREG const fEFlags = ASMIntDisableFlags();
6588
6589 fWhat &= pCtx->fExtrn;
6590 if (fWhat)
6591 {
6592 do
6593 {
6594 if (fWhat & CPUMCTX_EXTRN_RIP)
6595 {
6596 rc = hmR0VmxImportGuestRip(pVCpu);
6597 VMXLOCAL_BREAK_RC(rc);
6598 }
6599
6600 if (fWhat & CPUMCTX_EXTRN_RFLAGS)
6601 {
6602 rc = hmR0VmxImportGuestRFlags(pVCpu);
6603 VMXLOCAL_BREAK_RC(rc);
6604 }
6605
6606 if (fWhat & CPUMCTX_EXTRN_HM_VMX_INT_STATE)
6607 {
6608 rc = hmR0VmxImportGuestIntrState(pVCpu);
6609 VMXLOCAL_BREAK_RC(rc);
6610 }
6611
6612 if (fWhat & CPUMCTX_EXTRN_RSP)
6613 {
6614 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_RSP, &u64Val);
6615 VMXLOCAL_BREAK_RC(rc);
6616 pCtx->rsp = u64Val;
6617 }
6618
6619 if (fWhat & CPUMCTX_EXTRN_SREG_MASK)
6620 {
6621 if (fWhat & CPUMCTX_EXTRN_CS)
6622 {
6623 rc = HMVMX_IMPORT_SREG(CS, &pCtx->cs);
6624 rc |= hmR0VmxImportGuestRip(pVCpu);
6625 VMXLOCAL_BREAK_RC(rc);
6626 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6627 pCtx->cs.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrCS.u;
6628 EMR0HistoryUpdatePC(pVCpu, pCtx->cs.u64Base + pCtx->rip, true);
6629 }
6630 if (fWhat & CPUMCTX_EXTRN_SS)
6631 {
6632 rc = HMVMX_IMPORT_SREG(SS, &pCtx->ss);
6633 VMXLOCAL_BREAK_RC(rc);
6634 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6635 pCtx->ss.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrSS.u;
6636 }
6637 if (fWhat & CPUMCTX_EXTRN_DS)
6638 {
6639 rc = HMVMX_IMPORT_SREG(DS, &pCtx->ds);
6640 VMXLOCAL_BREAK_RC(rc);
6641 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6642 pCtx->ds.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrDS.u;
6643 }
6644 if (fWhat & CPUMCTX_EXTRN_ES)
6645 {
6646 rc = HMVMX_IMPORT_SREG(ES, &pCtx->es);
6647 VMXLOCAL_BREAK_RC(rc);
6648 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6649 pCtx->es.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrES.u;
6650 }
6651 if (fWhat & CPUMCTX_EXTRN_FS)
6652 {
6653 rc = HMVMX_IMPORT_SREG(FS, &pCtx->fs);
6654 VMXLOCAL_BREAK_RC(rc);
6655 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6656 pCtx->fs.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrFS.u;
6657 }
6658 if (fWhat & CPUMCTX_EXTRN_GS)
6659 {
6660 rc = HMVMX_IMPORT_SREG(GS, &pCtx->gs);
6661 VMXLOCAL_BREAK_RC(rc);
6662 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6663 pCtx->gs.Attr.u = pVCpu->hm.s.vmx.RealMode.AttrGS.u;
6664 }
6665 }
6666
6667 if (fWhat & CPUMCTX_EXTRN_TABLE_MASK)
6668 {
6669 if (fWhat & CPUMCTX_EXTRN_LDTR)
6670 {
6671 rc = HMVMX_IMPORT_SREG(LDTR, &pCtx->ldtr);
6672 VMXLOCAL_BREAK_RC(rc);
6673 }
6674
6675 if (fWhat & CPUMCTX_EXTRN_GDTR)
6676 {
6677 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_GDTR_BASE, &u64Val);
6678 rc |= VMXReadVmcs32(VMX_VMCS32_GUEST_GDTR_LIMIT, &u32Val);
6679 VMXLOCAL_BREAK_RC(rc);
6680 pCtx->gdtr.pGdt = u64Val;
6681 pCtx->gdtr.cbGdt = u32Val;
6682 }
6683
6684 /* Guest IDTR. */
6685 if (fWhat & CPUMCTX_EXTRN_IDTR)
6686 {
6687 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_IDTR_BASE, &u64Val);
6688 rc |= VMXReadVmcs32(VMX_VMCS32_GUEST_IDTR_LIMIT, &u32Val);
6689 VMXLOCAL_BREAK_RC(rc);
6690 pCtx->idtr.pIdt = u64Val;
6691 pCtx->idtr.cbIdt = u32Val;
6692 }
6693
6694 /* Guest TR. */
6695 if (fWhat & CPUMCTX_EXTRN_TR)
6696 {
6697 /* Real-mode emulation using virtual-8086 mode has the fake TSS (pRealModeTSS) in TR, don't save that one. */
6698 if (!pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
6699 {
6700 rc = HMVMX_IMPORT_SREG(TR, &pCtx->tr);
6701 VMXLOCAL_BREAK_RC(rc);
6702 }
6703 }
6704 }
6705
6706 if (fWhat & CPUMCTX_EXTRN_SYSENTER_MSRS)
6707 {
6708 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_SYSENTER_EIP, &pCtx->SysEnter.eip);
6709 rc |= VMXReadVmcsGstN(VMX_VMCS_GUEST_SYSENTER_ESP, &pCtx->SysEnter.esp);
6710 rc |= VMXReadVmcs32(VMX_VMCS32_GUEST_SYSENTER_CS, &u32Val);
6711 pCtx->SysEnter.cs = u32Val;
6712 VMXLOCAL_BREAK_RC(rc);
6713 }
6714
6715#if HC_ARCH_BITS == 64
6716 if (fWhat & CPUMCTX_EXTRN_KERNEL_GS_BASE)
6717 {
6718 if ( pVM->hm.s.fAllow64BitGuests
6719 && (pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST))
6720 pCtx->msrKERNELGSBASE = ASMRdMsr(MSR_K8_KERNEL_GS_BASE);
6721 }
6722
6723 if (fWhat & CPUMCTX_EXTRN_SYSCALL_MSRS)
6724 {
6725 if ( pVM->hm.s.fAllow64BitGuests
6726 && (pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST))
6727 {
6728 pCtx->msrLSTAR = ASMRdMsr(MSR_K8_LSTAR);
6729 pCtx->msrSTAR = ASMRdMsr(MSR_K6_STAR);
6730 pCtx->msrSFMASK = ASMRdMsr(MSR_K8_SF_MASK);
6731 }
6732 }
6733#endif
6734
6735 if ( (fWhat & (CPUMCTX_EXTRN_TSC_AUX | CPUMCTX_EXTRN_OTHER_MSRS))
6736#if HC_ARCH_BITS == 32
6737 || (fWhat & (CPUMCTX_EXTRN_KERNEL_GS_BASE | CPUMCTX_EXTRN_SYSCALL_MSRS))
6738#endif
6739 )
6740 {
6741 PCVMXAUTOMSR pMsr = (PVMXAUTOMSR)pVCpu->hm.s.vmx.pvGuestMsr;
6742 uint32_t const cMsrs = pVCpu->hm.s.vmx.cMsrs;
6743 for (uint32_t i = 0; i < cMsrs; i++, pMsr++)
6744 {
6745 switch (pMsr->u32Msr)
6746 {
6747#if HC_ARCH_BITS == 32
6748 case MSR_K8_LSTAR: pCtx->msrLSTAR = pMsr->u64Value; break;
6749 case MSR_K6_STAR: pCtx->msrSTAR = pMsr->u64Value; break;
6750 case MSR_K8_SF_MASK: pCtx->msrSFMASK = pMsr->u64Value; break;
6751 case MSR_K8_KERNEL_GS_BASE: pCtx->msrKERNELGSBASE = pMsr->u64Value; break;
6752#endif
6753 case MSR_IA32_SPEC_CTRL: CPUMSetGuestSpecCtrl(pVCpu, pMsr->u64Value); break;
6754 case MSR_K8_TSC_AUX: CPUMSetGuestTscAux(pVCpu, pMsr->u64Value); break;
6755 case MSR_K6_EFER: /* EFER can't be changed without causing a VM-exit */ break;
6756 default:
6757 {
6758 pVCpu->hm.s.u32HMError = pMsr->u32Msr;
6759 ASMSetFlags(fEFlags);
6760 AssertMsgFailed(("Unexpected MSR in auto-load/store area. uMsr=%#RX32 cMsrs=%u\n", pMsr->u32Msr,
6761 cMsrs));
6762 return VERR_HM_UNEXPECTED_LD_ST_MSR;
6763 }
6764 }
6765 }
6766 }
6767
6768 if (fWhat & CPUMCTX_EXTRN_DR7)
6769 {
6770 if (!pVCpu->hm.s.fUsingHyperDR7)
6771 {
6772 /* Upper 32-bits are always zero. See Intel spec. 2.7.3 "Loading and Storing Debug Registers". */
6773 rc = VMXReadVmcs32(VMX_VMCS_GUEST_DR7, &u32Val);
6774 VMXLOCAL_BREAK_RC(rc);
6775 pCtx->dr[7] = u32Val;
6776 }
6777 }
6778
6779 if (fWhat & CPUMCTX_EXTRN_CR_MASK)
6780 {
6781 uint32_t u32Shadow;
6782 if (fWhat & CPUMCTX_EXTRN_CR0)
6783 {
6784 rc = VMXReadVmcs32(VMX_VMCS_GUEST_CR0, &u32Val);
6785 rc |= VMXReadVmcs32(VMX_VMCS_CTRL_CR0_READ_SHADOW, &u32Shadow);
6786 VMXLOCAL_BREAK_RC(rc);
6787 u32Val = (u32Val & ~pVCpu->hm.s.vmx.u32Cr0Mask)
6788 | (u32Shadow & pVCpu->hm.s.vmx.u32Cr0Mask);
6789 VMMRZCallRing3Disable(pVCpu); /* Calls into PGM which has Log statements. */
6790 CPUMSetGuestCR0(pVCpu, u32Val);
6791 VMMRZCallRing3Enable(pVCpu);
6792 }
6793
6794 if (fWhat & CPUMCTX_EXTRN_CR4)
6795 {
6796 rc = VMXReadVmcs32(VMX_VMCS_GUEST_CR4, &u32Val);
6797 rc |= VMXReadVmcs32(VMX_VMCS_CTRL_CR4_READ_SHADOW, &u32Shadow);
6798 VMXLOCAL_BREAK_RC(rc);
6799 u32Val = (u32Val & ~pVCpu->hm.s.vmx.u32Cr4Mask)
6800 | (u32Shadow & pVCpu->hm.s.vmx.u32Cr4Mask);
6801 CPUMSetGuestCR4(pVCpu, u32Val);
6802 }
6803
6804 if (fWhat & CPUMCTX_EXTRN_CR3)
6805 {
6806 /* CR0.PG bit changes are always intercepted, so it's up to date. */
6807 if ( pVM->hm.s.vmx.fUnrestrictedGuest
6808 || ( pVM->hm.s.fNestedPaging
6809 && CPUMIsGuestPagingEnabledEx(pCtx)))
6810 {
6811 rc = VMXReadVmcsGstN(VMX_VMCS_GUEST_CR3, &u64Val);
6812 if (pCtx->cr3 != u64Val)
6813 {
6814 CPUMSetGuestCR3(pVCpu, u64Val);
6815 VMCPU_FF_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3);
6816 }
6817
6818 /* If the guest is in PAE mode, sync back the PDPE's into the guest state.
6819 Note: CR4.PAE, CR0.PG, EFER bit changes are always intercepted, so they're up to date. */
6820 if (CPUMIsGuestInPAEModeEx(pCtx))
6821 {
6822 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE0_FULL, &pVCpu->hm.s.aPdpes[0].u);
6823 rc |= VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE1_FULL, &pVCpu->hm.s.aPdpes[1].u);
6824 rc |= VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE2_FULL, &pVCpu->hm.s.aPdpes[2].u);
6825 rc |= VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE3_FULL, &pVCpu->hm.s.aPdpes[3].u);
6826 VMXLOCAL_BREAK_RC(rc);
6827 VMCPU_FF_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES);
6828 }
6829 }
6830 }
6831 }
6832 } while (0);
6833
6834 if (RT_SUCCESS(rc))
6835 {
6836 /* Update fExtrn. */
6837 pCtx->fExtrn &= ~fWhat;
6838
6839 /* If everything has been imported, clear the HM keeper bit. */
6840 if (!(pCtx->fExtrn & HMVMX_CPUMCTX_EXTRN_ALL))
6841 {
6842 pCtx->fExtrn &= ~CPUMCTX_EXTRN_KEEPER_HM;
6843 Assert(!pCtx->fExtrn);
6844 }
6845 }
6846 }
6847 else
6848 AssertMsg(!pCtx->fExtrn || (pCtx->fExtrn & HMVMX_CPUMCTX_EXTRN_ALL), ("%#RX64\n", pCtx->fExtrn));
6849
6850 ASMSetFlags(fEFlags);
6851
6852 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatImportGuestState, x);
6853
6854 /*
6855 * Honor any pending CR3 updates.
6856 *
6857 * Consider this scenario: VM-exit -> VMMRZCallRing3Enable() -> do stuff that causes a longjmp -> hmR0VmxCallRing3Callback()
6858 * -> VMMRZCallRing3Disable() -> hmR0VmxImportGuestState() -> Sets VMCPU_FF_HM_UPDATE_CR3 pending -> return from the longjmp
6859 * -> continue with VM-exit handling -> hmR0VmxImportGuestState() and here we are.
6860 *
6861 * The reason for such complicated handling is because VM-exits that call into PGM expect CR3 to be up-to-date and thus
6862 * if any CR3-saves -before- the VM-exit (longjmp) postponed the CR3 update via the force-flag, any VM-exit handler that
6863 * calls into PGM when it re-saves CR3 will end up here and we call PGMUpdateCR3(). This is why the code below should
6864 * -NOT- check if CPUMCTX_EXTRN_CR3 is set!
6865 *
6866 * The longjmp exit path can't check these CR3 force-flags and call code that takes a lock again. We cover for it here.
6867 */
6868 if (VMMRZCallRing3IsEnabled(pVCpu))
6869 {
6870 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3))
6871 {
6872 Assert(!(ASMAtomicUoReadU64(&pCtx->fExtrn) & CPUMCTX_EXTRN_CR3));
6873 PGMUpdateCR3(pVCpu, CPUMGetGuestCR3(pVCpu));
6874 }
6875
6876 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES))
6877 PGMGstUpdatePaePdpes(pVCpu, &pVCpu->hm.s.aPdpes[0]);
6878
6879 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3));
6880 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES));
6881 }
6882
6883 return VINF_SUCCESS;
6884#undef VMXLOCAL_BREAK_RC
6885}
6886
6887
6888/**
6889 * Saves the guest state from the VMCS into the guest-CPU context.
6890 *
6891 * @returns VBox status code.
6892 * @param pVCpu The cross context virtual CPU structure.
6893 * @param fWhat What to import, CPUMCTX_EXTRN_XXX.
6894 */
6895VMMR0DECL(int) VMXR0ImportStateOnDemand(PVMCPU pVCpu, uint64_t fWhat)
6896{
6897 return hmR0VmxImportGuestState(pVCpu, fWhat);
6898}
6899
6900
6901/**
6902 * Check per-VM and per-VCPU force flag actions that require us to go back to
6903 * ring-3 for one reason or another.
6904 *
6905 * @returns Strict VBox status code (i.e. informational status codes too)
6906 * @retval VINF_SUCCESS if we don't have any actions that require going back to
6907 * ring-3.
6908 * @retval VINF_PGM_SYNC_CR3 if we have pending PGM CR3 sync.
6909 * @retval VINF_EM_PENDING_REQUEST if we have pending requests (like hardware
6910 * interrupts)
6911 * @retval VINF_PGM_POOL_FLUSH_PENDING if PGM is doing a pool flush and requires
6912 * all EMTs to be in ring-3.
6913 * @retval VINF_EM_RAW_TO_R3 if there is pending DMA requests.
6914 * @retval VINF_EM_NO_MEMORY PGM is out of memory, we need to return
6915 * to the EM loop.
6916 *
6917 * @param pVCpu The cross context virtual CPU structure.
6918 * @param fStepping Running in hmR0VmxRunGuestCodeStep().
6919 */
6920static VBOXSTRICTRC hmR0VmxCheckForceFlags(PVMCPU pVCpu, bool fStepping)
6921{
6922 Assert(VMMRZCallRing3IsEnabled(pVCpu));
6923
6924 /*
6925 * Anything pending? Should be more likely than not if we're doing a good job.
6926 */
6927 PVM pVM = pVCpu->CTX_SUFF(pVM);
6928 if ( !fStepping
6929 ? !VM_FF_IS_ANY_SET(pVM, VM_FF_HP_R0_PRE_HM_MASK)
6930 && !VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_HP_R0_PRE_HM_MASK)
6931 : !VM_FF_IS_ANY_SET(pVM, VM_FF_HP_R0_PRE_HM_STEP_MASK)
6932 && !VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_HP_R0_PRE_HM_STEP_MASK) )
6933 return VINF_SUCCESS;
6934
6935 /* Pending PGM C3 sync. */
6936 if (VMCPU_FF_IS_ANY_SET(pVCpu,VMCPU_FF_PGM_SYNC_CR3 | VMCPU_FF_PGM_SYNC_CR3_NON_GLOBAL))
6937 {
6938 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
6939 Assert(!(ASMAtomicUoReadU64(&pCtx->fExtrn) & (CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_CR3 | CPUMCTX_EXTRN_CR4)));
6940 VBOXSTRICTRC rcStrict2 = PGMSyncCR3(pVCpu, pCtx->cr0, pCtx->cr3, pCtx->cr4,
6941 VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_PGM_SYNC_CR3));
6942 if (rcStrict2 != VINF_SUCCESS)
6943 {
6944 AssertRC(VBOXSTRICTRC_VAL(rcStrict2));
6945 Log4Func(("PGMSyncCR3 forcing us back to ring-3. rc2=%d\n", VBOXSTRICTRC_VAL(rcStrict2)));
6946 return rcStrict2;
6947 }
6948 }
6949
6950 /* Pending HM-to-R3 operations (critsects, timers, EMT rendezvous etc.) */
6951 if ( VM_FF_IS_ANY_SET(pVM, VM_FF_HM_TO_R3_MASK)
6952 || VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_HM_TO_R3_MASK))
6953 {
6954 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHmToR3FF);
6955 int rc2 = RT_LIKELY(!VM_FF_IS_SET(pVM, VM_FF_PGM_NO_MEMORY)) ? VINF_EM_RAW_TO_R3 : VINF_EM_NO_MEMORY;
6956 Log4Func(("HM_TO_R3 forcing us back to ring-3. rc=%d\n", rc2));
6957 return rc2;
6958 }
6959
6960 /* Pending VM request packets, such as hardware interrupts. */
6961 if ( VM_FF_IS_SET(pVM, VM_FF_REQUEST)
6962 || VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_REQUEST))
6963 {
6964 Log4Func(("Pending VM request forcing us back to ring-3\n"));
6965 return VINF_EM_PENDING_REQUEST;
6966 }
6967
6968 /* Pending PGM pool flushes. */
6969 if (VM_FF_IS_SET(pVM, VM_FF_PGM_POOL_FLUSH_PENDING))
6970 {
6971 Log4Func(("PGM pool flush pending forcing us back to ring-3\n"));
6972 return VINF_PGM_POOL_FLUSH_PENDING;
6973 }
6974
6975 /* Pending DMA requests. */
6976 if (VM_FF_IS_SET(pVM, VM_FF_PDM_DMA))
6977 {
6978 Log4Func(("Pending DMA request forcing us back to ring-3\n"));
6979 return VINF_EM_RAW_TO_R3;
6980 }
6981
6982 return VINF_SUCCESS;
6983}
6984
6985
6986/**
6987 * Converts any TRPM trap into a pending HM event. This is typically used when
6988 * entering from ring-3 (not longjmp returns).
6989 *
6990 * @param pVCpu The cross context virtual CPU structure.
6991 */
6992static void hmR0VmxTrpmTrapToPendingEvent(PVMCPU pVCpu)
6993{
6994 Assert(TRPMHasTrap(pVCpu));
6995 Assert(!pVCpu->hm.s.Event.fPending);
6996
6997 uint8_t uVector;
6998 TRPMEVENT enmTrpmEvent;
6999 RTGCUINT uErrCode;
7000 RTGCUINTPTR GCPtrFaultAddress;
7001 uint8_t cbInstr;
7002
7003 int rc = TRPMQueryTrapAll(pVCpu, &uVector, &enmTrpmEvent, &uErrCode, &GCPtrFaultAddress, &cbInstr);
7004 AssertRC(rc);
7005
7006 /* Refer Intel spec. 24.8.3 "VM-entry Controls for Event Injection" for the format of u32IntInfo. */
7007 uint32_t u32IntInfo = uVector | VMX_EXIT_INT_INFO_VALID;
7008 if (enmTrpmEvent == TRPM_TRAP)
7009 {
7010 switch (uVector)
7011 {
7012 case X86_XCPT_NMI:
7013 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_NMI << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7014 break;
7015
7016 case X86_XCPT_BP:
7017 case X86_XCPT_OF:
7018 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_SW_XCPT << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7019 break;
7020
7021 case X86_XCPT_PF:
7022 case X86_XCPT_DF:
7023 case X86_XCPT_TS:
7024 case X86_XCPT_NP:
7025 case X86_XCPT_SS:
7026 case X86_XCPT_GP:
7027 case X86_XCPT_AC:
7028 u32IntInfo |= VMX_EXIT_INT_INFO_ERROR_CODE_VALID;
7029 RT_FALL_THRU();
7030 default:
7031 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_HW_XCPT << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7032 break;
7033 }
7034 }
7035 else if (enmTrpmEvent == TRPM_HARDWARE_INT)
7036 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_EXT_INT << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7037 else if (enmTrpmEvent == TRPM_SOFTWARE_INT)
7038 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_SW_INT << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7039 else
7040 AssertMsgFailed(("Invalid TRPM event type %d\n", enmTrpmEvent));
7041
7042 rc = TRPMResetTrap(pVCpu);
7043 AssertRC(rc);
7044 Log4(("TRPM->HM event: u32IntInfo=%#RX32 enmTrpmEvent=%d cbInstr=%u uErrCode=%#RX32 GCPtrFaultAddress=%#RGv\n",
7045 u32IntInfo, enmTrpmEvent, cbInstr, uErrCode, GCPtrFaultAddress));
7046
7047 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, cbInstr, uErrCode, GCPtrFaultAddress);
7048}
7049
7050
7051/**
7052 * Converts the pending HM event into a TRPM trap.
7053 *
7054 * @param pVCpu The cross context virtual CPU structure.
7055 */
7056static void hmR0VmxPendingEventToTrpmTrap(PVMCPU pVCpu)
7057{
7058 Assert(pVCpu->hm.s.Event.fPending);
7059
7060 uint32_t uVectorType = VMX_IDT_VECTORING_INFO_TYPE(pVCpu->hm.s.Event.u64IntInfo);
7061 uint32_t uVector = VMX_IDT_VECTORING_INFO_VECTOR(pVCpu->hm.s.Event.u64IntInfo);
7062 bool fErrorCodeValid = VMX_IDT_VECTORING_INFO_IS_ERROR_CODE_VALID(pVCpu->hm.s.Event.u64IntInfo);
7063 uint32_t uErrorCode = pVCpu->hm.s.Event.u32ErrCode;
7064
7065 /* If a trap was already pending, we did something wrong! */
7066 Assert(TRPMQueryTrap(pVCpu, NULL /* pu8TrapNo */, NULL /* pEnmType */) == VERR_TRPM_NO_ACTIVE_TRAP);
7067
7068 TRPMEVENT enmTrapType;
7069 switch (uVectorType)
7070 {
7071 case VMX_IDT_VECTORING_INFO_TYPE_EXT_INT:
7072 enmTrapType = TRPM_HARDWARE_INT;
7073 break;
7074
7075 case VMX_IDT_VECTORING_INFO_TYPE_SW_INT:
7076 enmTrapType = TRPM_SOFTWARE_INT;
7077 break;
7078
7079 case VMX_IDT_VECTORING_INFO_TYPE_NMI:
7080 case VMX_IDT_VECTORING_INFO_TYPE_PRIV_SW_XCPT:
7081 case VMX_IDT_VECTORING_INFO_TYPE_SW_XCPT: /* #BP and #OF */
7082 case VMX_IDT_VECTORING_INFO_TYPE_HW_XCPT:
7083 enmTrapType = TRPM_TRAP;
7084 break;
7085
7086 default:
7087 AssertMsgFailed(("Invalid trap type %#x\n", uVectorType));
7088 enmTrapType = TRPM_32BIT_HACK;
7089 break;
7090 }
7091
7092 Log4(("HM event->TRPM: uVector=%#x enmTrapType=%d\n", uVector, enmTrapType));
7093
7094 int rc = TRPMAssertTrap(pVCpu, uVector, enmTrapType);
7095 AssertRC(rc);
7096
7097 if (fErrorCodeValid)
7098 TRPMSetErrorCode(pVCpu, uErrorCode);
7099
7100 if ( uVectorType == VMX_IDT_VECTORING_INFO_TYPE_HW_XCPT
7101 && uVector == X86_XCPT_PF)
7102 {
7103 TRPMSetFaultAddress(pVCpu, pVCpu->hm.s.Event.GCPtrFaultAddress);
7104 }
7105 else if ( uVectorType == VMX_IDT_VECTORING_INFO_TYPE_SW_INT
7106 || uVectorType == VMX_IDT_VECTORING_INFO_TYPE_SW_XCPT
7107 || uVectorType == VMX_IDT_VECTORING_INFO_TYPE_PRIV_SW_XCPT)
7108 {
7109 AssertMsg( uVectorType == VMX_IDT_VECTORING_INFO_TYPE_SW_INT
7110 || (uVector == X86_XCPT_BP || uVector == X86_XCPT_OF),
7111 ("Invalid vector: uVector=%#x uVectorType=%#x\n", uVector, uVectorType));
7112 TRPMSetInstrLength(pVCpu, pVCpu->hm.s.Event.cbInstr);
7113 }
7114
7115 /* Clear the events from the VMCS. */
7116 VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO, 0);
7117
7118 /* We're now done converting the pending event. */
7119 pVCpu->hm.s.Event.fPending = false;
7120}
7121
7122
7123/**
7124 * Does the necessary state syncing before returning to ring-3 for any reason
7125 * (longjmp, preemption, voluntary exits to ring-3) from VT-x.
7126 *
7127 * @returns VBox status code.
7128 * @param pVCpu The cross context virtual CPU structure.
7129 * @param fImportState Whether to import the guest state from the VMCS back
7130 * to the guest-CPU context.
7131 *
7132 * @remarks No-long-jmp zone!!!
7133 */
7134static int hmR0VmxLeave(PVMCPU pVCpu, bool fImportState)
7135{
7136 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
7137 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
7138
7139 RTCPUID idCpu = RTMpCpuId();
7140 Log4Func(("HostCpuId=%u\n", idCpu));
7141
7142 /*
7143 * !!! IMPORTANT !!!
7144 * If you modify code here, check whether hmR0VmxCallRing3Callback() needs to be updated too.
7145 */
7146
7147 /* Save the guest state if necessary. */
7148 if (fImportState)
7149 {
7150 int rc = hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
7151 AssertRCReturn(rc, rc);
7152 }
7153
7154 /* Restore host FPU state if necessary. We will resync on next R0 reentry. */
7155 CPUMR0FpuStateMaybeSaveGuestAndRestoreHost(pVCpu);
7156 Assert(!CPUMIsGuestFPUStateActive(pVCpu));
7157
7158 /* Restore host debug registers if necessary. We will resync on next R0 reentry. */
7159#ifdef VBOX_STRICT
7160 if (CPUMIsHyperDebugStateActive(pVCpu))
7161 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_MOV_DR_EXIT);
7162#endif
7163 CPUMR0DebugStateMaybeSaveGuestAndRestoreHost(pVCpu, true /* save DR6 */);
7164 Assert(!CPUMIsGuestDebugStateActive(pVCpu) && !CPUMIsGuestDebugStateActivePending(pVCpu));
7165 Assert(!CPUMIsHyperDebugStateActive(pVCpu) && !CPUMIsHyperDebugStateActivePending(pVCpu));
7166
7167#if HC_ARCH_BITS == 64
7168 /* Restore host-state bits that VT-x only restores partially. */
7169 if ( (pVCpu->hm.s.vmx.fRestoreHostFlags & VMX_RESTORE_HOST_REQUIRED)
7170 && (pVCpu->hm.s.vmx.fRestoreHostFlags & ~VMX_RESTORE_HOST_REQUIRED))
7171 {
7172 Log4Func(("Restoring Host State: fRestoreHostFlags=%#RX32 HostCpuId=%u\n", pVCpu->hm.s.vmx.fRestoreHostFlags, idCpu));
7173 VMXRestoreHostState(pVCpu->hm.s.vmx.fRestoreHostFlags, &pVCpu->hm.s.vmx.RestoreHost);
7174 }
7175 pVCpu->hm.s.vmx.fRestoreHostFlags = 0;
7176#endif
7177
7178 /* Restore the lazy host MSRs as we're leaving VT-x context. */
7179 if (pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST)
7180 {
7181 /* We shouldn't restore the host MSRs without saving the guest MSRs first. */
7182 if (!fImportState)
7183 {
7184 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_KERNEL_GS_BASE | CPUMCTX_EXTRN_SYSCALL_MSRS);
7185 AssertRCReturn(rc, rc);
7186 }
7187 hmR0VmxLazyRestoreHostMsrs(pVCpu);
7188 Assert(!pVCpu->hm.s.vmx.fLazyMsrs);
7189 }
7190 else
7191 pVCpu->hm.s.vmx.fLazyMsrs = 0;
7192
7193 /* Update auto-load/store host MSRs values when we re-enter VT-x (as we could be on a different CPU). */
7194 pVCpu->hm.s.vmx.fUpdatedHostMsrs = false;
7195
7196 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatEntry);
7197 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatImportGuestState);
7198 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExportGuestState);
7199 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatPreExit);
7200 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExitHandling);
7201 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExitIO);
7202 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExitMovCRx);
7203 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExitXcptNmi);
7204 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchLongJmpToR3);
7205
7206 VMCPU_CMPXCHG_STATE(pVCpu, VMCPUSTATE_STARTED_HM, VMCPUSTATE_STARTED_EXEC);
7207
7208 /** @todo This partially defeats the purpose of having preemption hooks.
7209 * The problem is, deregistering the hooks should be moved to a place that
7210 * lasts until the EMT is about to be destroyed not everytime while leaving HM
7211 * context.
7212 */
7213 if (pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_ACTIVE)
7214 {
7215 int rc = VMXClearVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
7216 AssertRCReturn(rc, rc);
7217
7218 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_CLEAR;
7219 Log4Func(("Cleared Vmcs. HostCpuId=%u\n", idCpu));
7220 }
7221 Assert(!(pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_LAUNCHED));
7222 NOREF(idCpu);
7223
7224 return VINF_SUCCESS;
7225}
7226
7227
7228/**
7229 * Leaves the VT-x session.
7230 *
7231 * @returns VBox status code.
7232 * @param pVCpu The cross context virtual CPU structure.
7233 *
7234 * @remarks No-long-jmp zone!!!
7235 */
7236static int hmR0VmxLeaveSession(PVMCPU pVCpu)
7237{
7238 HM_DISABLE_PREEMPT(pVCpu);
7239 HMVMX_ASSERT_CPU_SAFE(pVCpu);
7240 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
7241 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
7242
7243 /* When thread-context hooks are used, we can avoid doing the leave again if we had been preempted before
7244 and done this from the VMXR0ThreadCtxCallback(). */
7245 if (!pVCpu->hm.s.fLeaveDone)
7246 {
7247 int rc2 = hmR0VmxLeave(pVCpu, true /* fImportState */);
7248 AssertRCReturnStmt(rc2, HM_RESTORE_PREEMPT(), rc2);
7249 pVCpu->hm.s.fLeaveDone = true;
7250 }
7251 Assert(!pVCpu->cpum.GstCtx.fExtrn);
7252
7253 /*
7254 * !!! IMPORTANT !!!
7255 * If you modify code here, make sure to check whether hmR0VmxCallRing3Callback() needs to be updated too.
7256 */
7257
7258 /* Deregister hook now that we've left HM context before re-enabling preemption. */
7259 /** @todo Deregistering here means we need to VMCLEAR always
7260 * (longjmp/exit-to-r3) in VT-x which is not efficient, eliminate need
7261 * for calling VMMR0ThreadCtxHookDisable here! */
7262 VMMR0ThreadCtxHookDisable(pVCpu);
7263
7264 /* Leave HM context. This takes care of local init (term). */
7265 int rc = HMR0LeaveCpu(pVCpu);
7266
7267 HM_RESTORE_PREEMPT();
7268 return rc;
7269}
7270
7271
7272/**
7273 * Does the necessary state syncing before doing a longjmp to ring-3.
7274 *
7275 * @returns VBox status code.
7276 * @param pVCpu The cross context virtual CPU structure.
7277 *
7278 * @remarks No-long-jmp zone!!!
7279 */
7280DECLINLINE(int) hmR0VmxLongJmpToRing3(PVMCPU pVCpu)
7281{
7282 return hmR0VmxLeaveSession(pVCpu);
7283}
7284
7285
7286/**
7287 * Take necessary actions before going back to ring-3.
7288 *
7289 * An action requires us to go back to ring-3. This function does the necessary
7290 * steps before we can safely return to ring-3. This is not the same as longjmps
7291 * to ring-3, this is voluntary and prepares the guest so it may continue
7292 * executing outside HM (recompiler/IEM).
7293 *
7294 * @returns VBox status code.
7295 * @param pVCpu The cross context virtual CPU structure.
7296 * @param rcExit The reason for exiting to ring-3. Can be
7297 * VINF_VMM_UNKNOWN_RING3_CALL.
7298 */
7299static int hmR0VmxExitToRing3(PVMCPU pVCpu, VBOXSTRICTRC rcExit)
7300{
7301 Assert(pVCpu);
7302 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
7303
7304 if (RT_UNLIKELY(rcExit == VERR_VMX_INVALID_VMCS_PTR))
7305 {
7306 VMXGetActivatedVmcs(&pVCpu->hm.s.vmx.LastError.u64VmcsPhys);
7307 pVCpu->hm.s.vmx.LastError.u32VmcsRev = *(uint32_t *)pVCpu->hm.s.vmx.pvVmcs;
7308 pVCpu->hm.s.vmx.LastError.idEnteredCpu = pVCpu->hm.s.idEnteredCpu;
7309 /* LastError.idCurrentCpu was updated in hmR0VmxPreRunGuestCommitted(). */
7310 }
7311
7312 /* Please, no longjumps here (any logging shouldn't flush jump back to ring-3). NO LOGGING BEFORE THIS POINT! */
7313 VMMRZCallRing3Disable(pVCpu);
7314 Log4Func(("rcExit=%d\n", VBOXSTRICTRC_VAL(rcExit)));
7315
7316 /* We need to do this only while truly exiting the "inner loop" back to ring-3 and -not- for any longjmp to ring3. */
7317 if (pVCpu->hm.s.Event.fPending)
7318 {
7319 hmR0VmxPendingEventToTrpmTrap(pVCpu);
7320 Assert(!pVCpu->hm.s.Event.fPending);
7321 }
7322
7323 /* Clear interrupt-window and NMI-window controls as we re-evaluate it when we return from ring-3. */
7324 hmR0VmxClearIntNmiWindowsVmcs(pVCpu);
7325
7326 /* If we're emulating an instruction, we shouldn't have any TRPM traps pending
7327 and if we're injecting an event we should have a TRPM trap pending. */
7328 AssertMsg(rcExit != VINF_EM_RAW_INJECT_TRPM_EVENT || TRPMHasTrap(pVCpu), ("%Rrc\n", VBOXSTRICTRC_VAL(rcExit)));
7329#ifndef DEBUG_bird /* Triggered after firing an NMI against NT4SP1, possibly a triple fault in progress. */
7330 AssertMsg(rcExit != VINF_EM_RAW_EMULATE_INSTR || !TRPMHasTrap(pVCpu), ("%Rrc\n", VBOXSTRICTRC_VAL(rcExit)));
7331#endif
7332
7333 /* Save guest state and restore host state bits. */
7334 int rc = hmR0VmxLeaveSession(pVCpu);
7335 AssertRCReturn(rc, rc);
7336 STAM_COUNTER_DEC(&pVCpu->hm.s.StatSwitchLongJmpToR3);
7337 /* Thread-context hooks are unregistered at this point!!! */
7338
7339 /* Sync recompiler state. */
7340 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_TO_R3);
7341 CPUMSetChangedFlags(pVCpu, CPUM_CHANGED_SYSENTER_MSR
7342 | CPUM_CHANGED_LDTR
7343 | CPUM_CHANGED_GDTR
7344 | CPUM_CHANGED_IDTR
7345 | CPUM_CHANGED_TR
7346 | CPUM_CHANGED_HIDDEN_SEL_REGS);
7347 if ( pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging
7348 && CPUMIsGuestPagingEnabledEx(&pVCpu->cpum.GstCtx))
7349 {
7350 CPUMSetChangedFlags(pVCpu, CPUM_CHANGED_GLOBAL_TLB_FLUSH);
7351 }
7352
7353 Assert(!pVCpu->hm.s.fClearTrapFlag);
7354
7355 /* Update the exit-to-ring 3 reason. */
7356 pVCpu->hm.s.rcLastExitToR3 = VBOXSTRICTRC_VAL(rcExit);
7357
7358 /* On our way back from ring-3 reload the guest state if there is a possibility of it being changed. */
7359 if (rcExit != VINF_EM_RAW_INTERRUPT)
7360 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
7361
7362 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchExitToR3);
7363
7364 /* We do -not- want any longjmp notifications after this! We must return to ring-3 ASAP. */
7365 VMMRZCallRing3RemoveNotification(pVCpu);
7366 VMMRZCallRing3Enable(pVCpu);
7367
7368 return rc;
7369}
7370
7371
7372/**
7373 * VMMRZCallRing3() callback wrapper which saves the guest state before we
7374 * longjump to ring-3 and possibly get preempted.
7375 *
7376 * @returns VBox status code.
7377 * @param pVCpu The cross context virtual CPU structure.
7378 * @param enmOperation The operation causing the ring-3 longjump.
7379 * @param pvUser User argument, currently unused, NULL.
7380 */
7381static DECLCALLBACK(int) hmR0VmxCallRing3Callback(PVMCPU pVCpu, VMMCALLRING3 enmOperation, void *pvUser)
7382{
7383 RT_NOREF(pvUser);
7384 if (enmOperation == VMMCALLRING3_VM_R0_ASSERTION)
7385 {
7386 /*
7387 * !!! IMPORTANT !!!
7388 * If you modify code here, check whether hmR0VmxLeave() and hmR0VmxLeaveSession() needs to be updated too.
7389 * This is a stripped down version which gets out ASAP, trying to not trigger any further assertions.
7390 */
7391 VMMRZCallRing3RemoveNotification(pVCpu);
7392 VMMRZCallRing3Disable(pVCpu);
7393 RTTHREADPREEMPTSTATE PreemptState = RTTHREADPREEMPTSTATE_INITIALIZER;
7394 RTThreadPreemptDisable(&PreemptState);
7395
7396 hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
7397 CPUMR0FpuStateMaybeSaveGuestAndRestoreHost(pVCpu);
7398 CPUMR0DebugStateMaybeSaveGuestAndRestoreHost(pVCpu, true /* save DR6 */);
7399
7400#if HC_ARCH_BITS == 64
7401 /* Restore host-state bits that VT-x only restores partially. */
7402 if ( (pVCpu->hm.s.vmx.fRestoreHostFlags & VMX_RESTORE_HOST_REQUIRED)
7403 && (pVCpu->hm.s.vmx.fRestoreHostFlags & ~VMX_RESTORE_HOST_REQUIRED))
7404 VMXRestoreHostState(pVCpu->hm.s.vmx.fRestoreHostFlags, &pVCpu->hm.s.vmx.RestoreHost);
7405 pVCpu->hm.s.vmx.fRestoreHostFlags = 0;
7406#endif
7407
7408 /* Restore the lazy host MSRs as we're leaving VT-x context. */
7409 if (pVCpu->hm.s.vmx.fLazyMsrs & VMX_LAZY_MSRS_LOADED_GUEST)
7410 hmR0VmxLazyRestoreHostMsrs(pVCpu);
7411
7412 /* Update auto-load/store host MSRs values when we re-enter VT-x (as we could be on a different CPU). */
7413 pVCpu->hm.s.vmx.fUpdatedHostMsrs = false;
7414 VMCPU_CMPXCHG_STATE(pVCpu, VMCPUSTATE_STARTED_HM, VMCPUSTATE_STARTED_EXEC);
7415 if (pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_ACTIVE)
7416 {
7417 VMXClearVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
7418 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_CLEAR;
7419 }
7420
7421 /** @todo eliminate the need for calling VMMR0ThreadCtxHookDisable here! */
7422 VMMR0ThreadCtxHookDisable(pVCpu);
7423 HMR0LeaveCpu(pVCpu);
7424 RTThreadPreemptRestore(&PreemptState);
7425 return VINF_SUCCESS;
7426 }
7427
7428 Assert(pVCpu);
7429 Assert(pvUser);
7430 Assert(VMMRZCallRing3IsEnabled(pVCpu));
7431 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
7432
7433 VMMRZCallRing3Disable(pVCpu);
7434 Assert(VMMR0IsLogFlushDisabled(pVCpu));
7435
7436 Log4Func((" -> hmR0VmxLongJmpToRing3 enmOperation=%d\n", enmOperation));
7437
7438 int rc = hmR0VmxLongJmpToRing3(pVCpu);
7439 AssertRCReturn(rc, rc);
7440
7441 VMMRZCallRing3Enable(pVCpu);
7442 return VINF_SUCCESS;
7443}
7444
7445
7446/**
7447 * Sets the interrupt-window exiting control in the VMCS which instructs VT-x to
7448 * cause a VM-exit as soon as the guest is in a state to receive interrupts.
7449 *
7450 * @param pVCpu The cross context virtual CPU structure.
7451 */
7452DECLINLINE(void) hmR0VmxSetIntWindowExitVmcs(PVMCPU pVCpu)
7453{
7454 if (RT_LIKELY(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_INT_WINDOW_EXIT))
7455 {
7456 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_INT_WINDOW_EXIT))
7457 {
7458 pVCpu->hm.s.vmx.u32ProcCtls |= VMX_PROC_CTLS_INT_WINDOW_EXIT;
7459 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
7460 AssertRC(rc);
7461 Log4Func(("Setup interrupt-window exiting\n"));
7462 }
7463 } /* else we will deliver interrupts whenever the guest exits next and is in a state to receive events. */
7464}
7465
7466
7467/**
7468 * Clears the interrupt-window exiting control in the VMCS.
7469 *
7470 * @param pVCpu The cross context virtual CPU structure.
7471 */
7472DECLINLINE(void) hmR0VmxClearIntWindowExitVmcs(PVMCPU pVCpu)
7473{
7474 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_INT_WINDOW_EXIT);
7475 pVCpu->hm.s.vmx.u32ProcCtls &= ~VMX_PROC_CTLS_INT_WINDOW_EXIT;
7476 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
7477 AssertRC(rc);
7478 Log4Func(("Cleared interrupt-window exiting\n"));
7479}
7480
7481
7482/**
7483 * Sets the NMI-window exiting control in the VMCS which instructs VT-x to
7484 * cause a VM-exit as soon as the guest is in a state to receive NMIs.
7485 *
7486 * @param pVCpu The cross context virtual CPU structure.
7487 */
7488DECLINLINE(void) hmR0VmxSetNmiWindowExitVmcs(PVMCPU pVCpu)
7489{
7490 if (RT_LIKELY(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.Msrs.ProcCtls.n.allowed1 & VMX_PROC_CTLS_NMI_WINDOW_EXIT))
7491 {
7492 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_NMI_WINDOW_EXIT))
7493 {
7494 pVCpu->hm.s.vmx.u32ProcCtls |= VMX_PROC_CTLS_NMI_WINDOW_EXIT;
7495 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
7496 AssertRC(rc);
7497 Log4Func(("Setup NMI-window exiting\n"));
7498 }
7499 } /* else we will deliver NMIs whenever we VM-exit next, even possibly nesting NMIs. Can't be helped on ancient CPUs. */
7500}
7501
7502
7503/**
7504 * Clears the NMI-window exiting control in the VMCS.
7505 *
7506 * @param pVCpu The cross context virtual CPU structure.
7507 */
7508DECLINLINE(void) hmR0VmxClearNmiWindowExitVmcs(PVMCPU pVCpu)
7509{
7510 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_NMI_WINDOW_EXIT);
7511 pVCpu->hm.s.vmx.u32ProcCtls &= ~VMX_PROC_CTLS_NMI_WINDOW_EXIT;
7512 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
7513 AssertRC(rc);
7514 Log4Func(("Cleared NMI-window exiting\n"));
7515}
7516
7517
7518/**
7519 * Evaluates the event to be delivered to the guest and sets it as the pending
7520 * event.
7521 *
7522 * @returns The VT-x guest-interruptibility state.
7523 * @param pVCpu The cross context virtual CPU structure.
7524 */
7525static uint32_t hmR0VmxEvaluatePendingEvent(PVMCPU pVCpu)
7526{
7527 /* Get the current interruptibility-state of the guest and then figure out what can be injected. */
7528 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
7529 uint32_t const fIntrState = hmR0VmxGetGuestIntrState(pVCpu);
7530 bool const fBlockMovSS = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS);
7531 bool const fBlockSti = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI);
7532 bool const fBlockNmi = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_NMI);
7533
7534 Assert(!fBlockSti || !(ASMAtomicUoReadU64(&pCtx->fExtrn) & CPUMCTX_EXTRN_RFLAGS));
7535 Assert(!(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_SMI)); /* We don't support block-by-SMI yet.*/
7536 Assert(!fBlockSti || pCtx->eflags.Bits.u1IF); /* Cannot set block-by-STI when interrupts are disabled. */
7537 Assert(!TRPMHasTrap(pVCpu));
7538
7539 if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_UPDATE_APIC))
7540 APICUpdatePendingInterrupts(pVCpu);
7541
7542 /*
7543 * Toggling of interrupt force-flags here is safe since we update TRPM on premature exits
7544 * to ring-3 before executing guest code, see hmR0VmxExitToRing3(). We must NOT restore these force-flags.
7545 */
7546 /** @todo SMI. SMIs take priority over NMIs. */
7547 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INTERRUPT_NMI)) /* NMI. NMIs take priority over regular interrupts. */
7548 {
7549 /* On some CPUs block-by-STI also blocks NMIs. See Intel spec. 26.3.1.5 "Checks On Guest Non-Register State". */
7550 if ( !pVCpu->hm.s.Event.fPending
7551 && !fBlockNmi
7552 && !fBlockSti
7553 && !fBlockMovSS)
7554 {
7555 Log4Func(("Pending NMI\n"));
7556 uint32_t u32IntInfo = X86_XCPT_NMI | VMX_EXIT_INT_INFO_VALID;
7557 u32IntInfo |= (VMX_EXIT_INT_INFO_TYPE_NMI << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7558
7559 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrFaultAddress */);
7560 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INTERRUPT_NMI);
7561 }
7562 else
7563 hmR0VmxSetNmiWindowExitVmcs(pVCpu);
7564 }
7565 /*
7566 * Check if the guest can receive external interrupts (PIC/APIC). Once PDMGetInterrupt() returns
7567 * a valid interrupt we must- deliver the interrupt. We can no longer re-request it from the APIC.
7568 */
7569 else if ( VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_INTERRUPT_APIC | VMCPU_FF_INTERRUPT_PIC)
7570 && !pVCpu->hm.s.fSingleInstruction)
7571 {
7572 Assert(!DBGFIsStepping(pVCpu));
7573 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_RFLAGS);
7574 AssertRCReturn(rc, 0);
7575 bool const fBlockInt = !(pCtx->eflags.u32 & X86_EFL_IF);
7576 if ( !pVCpu->hm.s.Event.fPending
7577 && !fBlockInt
7578 && !fBlockSti
7579 && !fBlockMovSS)
7580 {
7581 uint8_t u8Interrupt;
7582 rc = PDMGetInterrupt(pVCpu, &u8Interrupt);
7583 if (RT_SUCCESS(rc))
7584 {
7585 Log4Func(("Pending external interrupt u8Interrupt=%#x\n", u8Interrupt));
7586 uint32_t u32IntInfo = u8Interrupt
7587 | VMX_EXIT_INT_INFO_VALID
7588 | (VMX_EXIT_INT_INFO_TYPE_EXT_INT << VMX_EXIT_INT_INFO_TYPE_SHIFT);
7589
7590 hmR0VmxSetPendingEvent(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrfaultAddress */);
7591 }
7592 else if (rc == VERR_APIC_INTR_MASKED_BY_TPR)
7593 {
7594 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW)
7595 hmR0VmxApicSetTprThreshold(pVCpu, u8Interrupt >> 4);
7596 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchTprMaskedIrq);
7597
7598 /*
7599 * If the CPU doesn't have TPR shadowing, we will always get a VM-exit on TPR changes and
7600 * APICSetTpr() will end up setting the VMCPU_FF_INTERRUPT_APIC if required, so there is no
7601 * need to re-set this force-flag here.
7602 */
7603 }
7604 else
7605 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchGuestIrq);
7606 }
7607 else
7608 hmR0VmxSetIntWindowExitVmcs(pVCpu);
7609 }
7610
7611 return fIntrState;
7612}
7613
7614
7615/**
7616 * Injects any pending events into the guest if the guest is in a state to
7617 * receive them.
7618 *
7619 * @returns Strict VBox status code (i.e. informational status codes too).
7620 * @param pVCpu The cross context virtual CPU structure.
7621 * @param fIntrState The VT-x guest-interruptibility state.
7622 * @param fStepping Running in hmR0VmxRunGuestCodeStep() and we should
7623 * return VINF_EM_DBG_STEPPED if the event was
7624 * dispatched directly.
7625 */
7626static VBOXSTRICTRC hmR0VmxInjectPendingEvent(PVMCPU pVCpu, uint32_t fIntrState, bool fStepping)
7627{
7628 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
7629 Assert(VMMRZCallRing3IsEnabled(pVCpu));
7630
7631 bool const fBlockMovSS = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS);
7632 bool const fBlockSti = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI);
7633
7634 Assert(!fBlockSti || !(ASMAtomicUoReadU64(&pVCpu->cpum.GstCtx.fExtrn) & CPUMCTX_EXTRN_RFLAGS));
7635 Assert(!(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_SMI)); /* We don't support block-by-SMI yet.*/
7636 Assert(!fBlockSti || pVCpu->cpum.GstCtx.eflags.Bits.u1IF); /* Cannot set block-by-STI when interrupts are disabled. */
7637 Assert(!TRPMHasTrap(pVCpu));
7638
7639 VBOXSTRICTRC rcStrict = VINF_SUCCESS;
7640 if (pVCpu->hm.s.Event.fPending)
7641 {
7642 /*
7643 * Do -not- clear any interrupt-window exiting control here. We might have an interrupt
7644 * pending even while injecting an event and in this case, we want a VM-exit as soon as
7645 * the guest is ready for the next interrupt, see @bugref{6208#c45}.
7646 *
7647 * See Intel spec. 26.6.5 "Interrupt-Window Exiting and Virtual-Interrupt Delivery".
7648 */
7649 uint32_t const uIntType = VMX_ENTRY_INT_INFO_TYPE(pVCpu->hm.s.Event.u64IntInfo);
7650#ifdef VBOX_STRICT
7651 if (uIntType == VMX_ENTRY_INT_INFO_TYPE_EXT_INT)
7652 {
7653 bool const fBlockInt = !(pVCpu->cpum.GstCtx.eflags.u32 & X86_EFL_IF);
7654 Assert(!fBlockInt);
7655 Assert(!fBlockSti);
7656 Assert(!fBlockMovSS);
7657 }
7658 else if (uIntType == VMX_ENTRY_INT_INFO_TYPE_NMI)
7659 {
7660 bool const fBlockNmi = RT_BOOL(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_NMI);
7661 Assert(!fBlockSti);
7662 Assert(!fBlockMovSS);
7663 Assert(!fBlockNmi);
7664 }
7665#endif
7666 Log4(("Injecting pending event vcpu[%RU32] u64IntInfo=%#RX64 Type=%#RX32\n", pVCpu->idCpu, pVCpu->hm.s.Event.u64IntInfo,
7667 uIntType));
7668
7669 /*
7670 * Inject the event and get any changes to the guest-interruptibility state.
7671 *
7672 * The guest-interruptibility state may need to be updated if we inject the event
7673 * into the guest IDT ourselves (for real-on-v86 guest injecting software interrupts).
7674 */
7675 rcStrict = hmR0VmxInjectEventVmcs(pVCpu, pVCpu->hm.s.Event.u64IntInfo, pVCpu->hm.s.Event.cbInstr,
7676 pVCpu->hm.s.Event.u32ErrCode, pVCpu->hm.s.Event.GCPtrFaultAddress, fStepping,
7677 &fIntrState);
7678 AssertRCReturn(VBOXSTRICTRC_VAL(rcStrict), rcStrict);
7679
7680 if (uIntType == VMX_ENTRY_INT_INFO_TYPE_EXT_INT)
7681 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectInterrupt);
7682 else
7683 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectXcpt);
7684 }
7685
7686 /*
7687 * Update the guest-interruptibility state.
7688 *
7689 * This is required for the real-on-v86 software interrupt injection case above, as well as
7690 * updates to the guest state from ring-3 or IEM/REM.
7691 */
7692 int rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_INT_STATE, fIntrState);
7693 AssertRCReturn(rc, rc);
7694
7695 /*
7696 * There's no need to clear the VM-entry interruption-information field here if we're not
7697 * injecting anything. VT-x clears the valid bit on every VM-exit.
7698 *
7699 * See Intel spec. 24.8.3 "VM-Entry Controls for Event Injection".
7700 */
7701
7702 Assert(rcStrict == VINF_SUCCESS || rcStrict == VINF_EM_RESET || (rcStrict == VINF_EM_DBG_STEPPED && fStepping));
7703 NOREF(fBlockMovSS); NOREF(fBlockSti);
7704 return rcStrict;
7705}
7706
7707
7708/**
7709 * Injects a double-fault (\#DF) exception into the VM.
7710 *
7711 * @returns Strict VBox status code (i.e. informational status codes too).
7712 * @param pVCpu The cross context virtual CPU structure.
7713 * @param fStepping Whether we're running in hmR0VmxRunGuestCodeStep()
7714 * and should return VINF_EM_DBG_STEPPED if the event
7715 * is injected directly (register modified by us, not
7716 * by hardware on VM-entry).
7717 * @param pfIntrState Pointer to the current guest interruptibility-state.
7718 * This interruptibility-state will be updated if
7719 * necessary. This cannot not be NULL.
7720 */
7721DECLINLINE(VBOXSTRICTRC) hmR0VmxInjectXcptDF(PVMCPU pVCpu, bool fStepping, uint32_t *pfIntrState)
7722{
7723 uint32_t const u32IntInfo = X86_XCPT_DF | VMX_EXIT_INT_INFO_VALID
7724 | (VMX_EXIT_INT_INFO_TYPE_HW_XCPT << VMX_EXIT_INT_INFO_TYPE_SHIFT)
7725 | VMX_EXIT_INT_INFO_ERROR_CODE_VALID;
7726 return hmR0VmxInjectEventVmcs(pVCpu, u32IntInfo, 0 /* cbInstr */, 0 /* u32ErrCode */, 0 /* GCPtrFaultAddress */, fStepping,
7727 pfIntrState);
7728}
7729
7730
7731/**
7732 * Injects a general-protection (\#GP) fault into the VM.
7733 *
7734 * @returns Strict VBox status code (i.e. informational status codes too).
7735 * @param pVCpu The cross context virtual CPU structure.
7736 * @param fErrorCodeValid Whether the error code is valid (depends on the CPU
7737 * mode, i.e. in real-mode it's not valid).
7738 * @param u32ErrorCode The error code associated with the \#GP.
7739 * @param fStepping Whether we're running in
7740 * hmR0VmxRunGuestCodeStep() and should return
7741 * VINF_EM_DBG_STEPPED if the event is injected
7742 * directly (register modified by us, not by
7743 * hardware on VM-entry).
7744 * @param pfIntrState Pointer to the current guest interruptibility-state.
7745 * This interruptibility-state will be updated if
7746 * necessary. This cannot not be NULL.
7747 */
7748DECLINLINE(VBOXSTRICTRC) hmR0VmxInjectXcptGP(PVMCPU pVCpu, bool fErrorCodeValid, uint32_t u32ErrorCode, bool fStepping,
7749 uint32_t *pfIntrState)
7750{
7751 uint32_t const u32IntInfo = X86_XCPT_GP | VMX_EXIT_INT_INFO_VALID
7752 | (VMX_EXIT_INT_INFO_TYPE_HW_XCPT << VMX_EXIT_INT_INFO_TYPE_SHIFT)
7753 | (fErrorCodeValid ? VMX_EXIT_INT_INFO_ERROR_CODE_VALID : 0);
7754 return hmR0VmxInjectEventVmcs(pVCpu, u32IntInfo, 0 /* cbInstr */, u32ErrorCode, 0 /* GCPtrFaultAddress */, fStepping,
7755 pfIntrState);
7756}
7757
7758
7759/**
7760 * Pushes a 2-byte value onto the real-mode (in virtual-8086 mode) guest's
7761 * stack.
7762 *
7763 * @returns Strict VBox status code (i.e. informational status codes too).
7764 * @retval VINF_EM_RESET if pushing a value to the stack caused a triple-fault.
7765 * @param pVCpu The cross context virtual CPU structure.
7766 * @param uValue The value to push to the guest stack.
7767 */
7768static VBOXSTRICTRC hmR0VmxRealModeGuestStackPush(PVMCPU pVCpu, uint16_t uValue)
7769{
7770 /*
7771 * The stack limit is 0xffff in real-on-virtual 8086 mode. Real-mode with weird stack limits cannot be run in
7772 * virtual 8086 mode in VT-x. See Intel spec. 26.3.1.2 "Checks on Guest Segment Registers".
7773 * See Intel Instruction reference for PUSH and Intel spec. 22.33.1 "Segment Wraparound".
7774 */
7775 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
7776 if (pCtx->sp == 1)
7777 return VINF_EM_RESET;
7778 pCtx->sp -= sizeof(uint16_t); /* May wrap around which is expected behaviour. */
7779 int rc = PGMPhysSimpleWriteGCPhys(pVCpu->CTX_SUFF(pVM), pCtx->ss.u64Base + pCtx->sp, &uValue, sizeof(uint16_t));
7780 AssertRC(rc);
7781 return rc;
7782}
7783
7784
7785/**
7786 * Injects an event into the guest upon VM-entry by updating the relevant fields
7787 * in the VM-entry area in the VMCS.
7788 *
7789 * @returns Strict VBox status code (i.e. informational status codes too).
7790 * @retval VINF_SUCCESS if the event is successfully injected into the VMCS.
7791 * @retval VINF_EM_RESET if event injection resulted in a triple-fault.
7792 *
7793 * @param pVCpu The cross context virtual CPU structure.
7794 * @param u64IntInfo The VM-entry interruption-information field.
7795 * @param cbInstr The VM-entry instruction length in bytes (for
7796 * software interrupts, exceptions and privileged
7797 * software exceptions).
7798 * @param u32ErrCode The VM-entry exception error code.
7799 * @param GCPtrFaultAddress The page-fault address for \#PF exceptions.
7800 * @param pfIntrState Pointer to the current guest interruptibility-state.
7801 * This interruptibility-state will be updated if
7802 * necessary. This cannot not be NULL.
7803 * @param fStepping Whether we're running in
7804 * hmR0VmxRunGuestCodeStep() and should return
7805 * VINF_EM_DBG_STEPPED if the event is injected
7806 * directly (register modified by us, not by
7807 * hardware on VM-entry).
7808 */
7809static VBOXSTRICTRC hmR0VmxInjectEventVmcs(PVMCPU pVCpu, uint64_t u64IntInfo, uint32_t cbInstr, uint32_t u32ErrCode,
7810 RTGCUINTREG GCPtrFaultAddress, bool fStepping, uint32_t *pfIntrState)
7811{
7812 /* Intel spec. 24.8.3 "VM-Entry Controls for Event Injection" specifies the interruption-information field to be 32-bits. */
7813 AssertMsg(!RT_HI_U32(u64IntInfo), ("%#RX64\n", u64IntInfo));
7814 Assert(pfIntrState);
7815
7816 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
7817 uint32_t u32IntInfo = (uint32_t)u64IntInfo;
7818 uint32_t const uVector = VMX_ENTRY_INT_INFO_VECTOR(u32IntInfo);
7819 uint32_t const uIntType = VMX_ENTRY_INT_INFO_TYPE(u32IntInfo);
7820
7821#ifdef VBOX_STRICT
7822 /*
7823 * Validate the error-code-valid bit for hardware exceptions.
7824 * No error codes for exceptions in real-mode.
7825 *
7826 * See Intel spec. 20.1.4 "Interrupt and Exception Handling"
7827 */
7828 if ( uIntType == VMX_EXIT_INT_INFO_TYPE_HW_XCPT
7829 && !CPUMIsGuestInRealModeEx(pCtx))
7830 {
7831 switch (uVector)
7832 {
7833 case X86_XCPT_PF:
7834 case X86_XCPT_DF:
7835 case X86_XCPT_TS:
7836 case X86_XCPT_NP:
7837 case X86_XCPT_SS:
7838 case X86_XCPT_GP:
7839 case X86_XCPT_AC:
7840 AssertMsg(VMX_ENTRY_INT_INFO_IS_ERROR_CODE_VALID(u32IntInfo),
7841 ("Error-code-valid bit not set for exception that has an error code uVector=%#x\n", uVector));
7842 RT_FALL_THRU();
7843 default:
7844 break;
7845 }
7846 }
7847#endif
7848
7849 /* Cannot inject an NMI when block-by-MOV SS is in effect. */
7850 Assert( uIntType != VMX_EXIT_INT_INFO_TYPE_NMI
7851 || !(*pfIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS));
7852
7853 STAM_COUNTER_INC(&pVCpu->hm.s.paStatInjectedIrqsR0[uVector & MASK_INJECT_IRQ_STAT]);
7854
7855 /*
7856 * Hardware interrupts & exceptions cannot be delivered through the software interrupt
7857 * redirection bitmap to the real mode task in virtual-8086 mode. We must jump to the
7858 * interrupt handler in the (real-mode) guest.
7859 *
7860 * See Intel spec. 20.3 "Interrupt and Exception handling in Virtual-8086 Mode".
7861 * See Intel spec. 20.1.4 "Interrupt and Exception Handling" for real-mode interrupt handling.
7862 */
7863 if (CPUMIsGuestInRealModeEx(pCtx)) /* CR0.PE bit changes are always intercepted, so it's up to date. */
7864 {
7865 if (pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fUnrestrictedGuest)
7866 {
7867 /*
7868 * For unrestricted execution enabled CPUs running real-mode guests, we must not
7869 * set the deliver-error-code bit.
7870 *
7871 * See Intel spec. 26.2.1.3 "VM-Entry Control Fields".
7872 */
7873 u32IntInfo &= ~VMX_ENTRY_INT_INFO_ERROR_CODE_VALID;
7874 }
7875 else
7876 {
7877 PVM pVM = pVCpu->CTX_SUFF(pVM);
7878 Assert(PDMVmmDevHeapIsEnabled(pVM));
7879 Assert(pVM->hm.s.vmx.pRealModeTSS);
7880
7881 /* We require RIP, RSP, RFLAGS, CS, IDTR, import them. */
7882 int rc2 = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_SREG_MASK | CPUMCTX_EXTRN_TABLE_MASK | CPUMCTX_EXTRN_RIP
7883 | CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_RFLAGS);
7884 AssertRCReturn(rc2, rc2);
7885
7886 /* Check if the interrupt handler is present in the IVT (real-mode IDT). IDT limit is (4N - 1). */
7887 size_t const cbIdtEntry = sizeof(X86IDTR16);
7888 if (uVector * cbIdtEntry + (cbIdtEntry - 1) > pCtx->idtr.cbIdt)
7889 {
7890 /* If we are trying to inject a #DF with no valid IDT entry, return a triple-fault. */
7891 if (uVector == X86_XCPT_DF)
7892 return VINF_EM_RESET;
7893
7894 /* If we're injecting a #GP with no valid IDT entry, inject a double-fault. */
7895 if (uVector == X86_XCPT_GP)
7896 return hmR0VmxInjectXcptDF(pVCpu, fStepping, pfIntrState);
7897
7898 /*
7899 * If we're injecting an event with no valid IDT entry, inject a #GP.
7900 * No error codes for exceptions in real-mode.
7901 *
7902 * See Intel spec. 20.1.4 "Interrupt and Exception Handling"
7903 */
7904 return hmR0VmxInjectXcptGP(pVCpu, false /* fErrCodeValid */, 0 /* u32ErrCode */, fStepping, pfIntrState);
7905 }
7906
7907 /* Software exceptions (#BP and #OF exceptions thrown as a result of INT3 or INTO) */
7908 uint16_t uGuestIp = pCtx->ip;
7909 if (uIntType == VMX_ENTRY_INT_INFO_TYPE_SW_XCPT)
7910 {
7911 Assert(uVector == X86_XCPT_BP || uVector == X86_XCPT_OF);
7912 /* #BP and #OF are both benign traps, we need to resume the next instruction. */
7913 uGuestIp = pCtx->ip + (uint16_t)cbInstr;
7914 }
7915 else if (uIntType == VMX_ENTRY_INT_INFO_TYPE_SW_INT)
7916 uGuestIp = pCtx->ip + (uint16_t)cbInstr;
7917
7918 /* Get the code segment selector and offset from the IDT entry for the interrupt handler. */
7919 X86IDTR16 IdtEntry;
7920 RTGCPHYS GCPhysIdtEntry = (RTGCPHYS)pCtx->idtr.pIdt + uVector * cbIdtEntry;
7921 rc2 = PGMPhysSimpleReadGCPhys(pVM, &IdtEntry, GCPhysIdtEntry, cbIdtEntry);
7922 AssertRCReturn(rc2, rc2);
7923
7924 /* Construct the stack frame for the interrupt/exception handler. */
7925 VBOXSTRICTRC rcStrict;
7926 rcStrict = hmR0VmxRealModeGuestStackPush(pVCpu, pCtx->eflags.u32);
7927 if (rcStrict == VINF_SUCCESS)
7928 rcStrict = hmR0VmxRealModeGuestStackPush(pVCpu, pCtx->cs.Sel);
7929 if (rcStrict == VINF_SUCCESS)
7930 rcStrict = hmR0VmxRealModeGuestStackPush(pVCpu, uGuestIp);
7931
7932 /* Clear the required eflag bits and jump to the interrupt/exception handler. */
7933 if (rcStrict == VINF_SUCCESS)
7934 {
7935 pCtx->eflags.u32 &= ~(X86_EFL_IF | X86_EFL_TF | X86_EFL_RF | X86_EFL_AC);
7936 pCtx->rip = IdtEntry.offSel;
7937 pCtx->cs.Sel = IdtEntry.uSel;
7938 pCtx->cs.ValidSel = IdtEntry.uSel;
7939 pCtx->cs.u64Base = IdtEntry.uSel << cbIdtEntry;
7940 if ( uIntType == VMX_ENTRY_INT_INFO_TYPE_HW_XCPT
7941 && uVector == X86_XCPT_PF)
7942 pCtx->cr2 = GCPtrFaultAddress;
7943
7944 /* If any other guest-state bits are changed here, make sure to update
7945 hmR0VmxPreRunGuestCommitted() when thread-context hooks are used. */
7946 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_CS | HM_CHANGED_GUEST_CR2
7947 | HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS
7948 | HM_CHANGED_GUEST_RSP);
7949
7950 /* We're clearing interrupts, which means no block-by-STI interrupt-inhibition. */
7951 if (*pfIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI)
7952 {
7953 Assert( uIntType != VMX_ENTRY_INT_INFO_TYPE_NMI
7954 && uIntType != VMX_ENTRY_INT_INFO_TYPE_EXT_INT);
7955 Log4Func(("Clearing inhibition due to STI\n"));
7956 *pfIntrState &= ~VMX_VMCS_GUEST_INT_STATE_BLOCK_STI;
7957 }
7958 Log4(("Injecting real-mode: u32IntInfo=%#x u32ErrCode=%#x cbInstr=%#x Eflags=%#x CS:EIP=%04x:%04x\n",
7959 u32IntInfo, u32ErrCode, cbInstr, pCtx->eflags.u, pCtx->cs.Sel, pCtx->eip));
7960
7961 /* The event has been truly dispatched. Mark it as no longer pending so we don't attempt to 'undo'
7962 it, if we are returning to ring-3 before executing guest code. */
7963 pVCpu->hm.s.Event.fPending = false;
7964
7965 /* Make hmR0VmxPreRunGuest() return if we're stepping since we've changed cs:rip. */
7966 if (fStepping)
7967 rcStrict = VINF_EM_DBG_STEPPED;
7968 }
7969 AssertMsg(rcStrict == VINF_SUCCESS || rcStrict == VINF_EM_RESET || (rcStrict == VINF_EM_DBG_STEPPED && fStepping),
7970 ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
7971 return rcStrict;
7972 }
7973 }
7974
7975 /* Validate. */
7976 Assert(VMX_ENTRY_INT_INFO_IS_VALID(u32IntInfo)); /* Bit 31 (Valid bit) must be set by caller. */
7977 Assert(!(u32IntInfo & VMX_BF_ENTRY_INT_INFO_RSVD_12_30_MASK)); /* Bits 30:12 MBZ. */
7978
7979 /* Inject. */
7980 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO, u32IntInfo);
7981 if (VMX_ENTRY_INT_INFO_IS_ERROR_CODE_VALID(u32IntInfo))
7982 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_EXCEPTION_ERRCODE, u32ErrCode);
7983 rc |= VMXWriteVmcs32(VMX_VMCS32_CTRL_ENTRY_INSTR_LENGTH, cbInstr);
7984 AssertRCReturn(rc, rc);
7985
7986 /* Update CR2. */
7987 if ( VMX_ENTRY_INT_INFO_TYPE(u32IntInfo) == VMX_EXIT_INT_INFO_TYPE_HW_XCPT
7988 && uVector == X86_XCPT_PF)
7989 pCtx->cr2 = GCPtrFaultAddress;
7990
7991 Log4(("Injecting u32IntInfo=%#x u32ErrCode=%#x cbInstr=%#x CR2=%#RX64\n", u32IntInfo, u32ErrCode, cbInstr, pCtx->cr2));
7992
7993 return VINF_SUCCESS;
7994}
7995
7996
7997/**
7998 * Clears the interrupt-window exiting control in the VMCS and if necessary
7999 * clears the current event in the VMCS as well.
8000 *
8001 * @returns VBox status code.
8002 * @param pVCpu The cross context virtual CPU structure.
8003 *
8004 * @remarks Use this function only to clear events that have not yet been
8005 * delivered to the guest but are injected in the VMCS!
8006 * @remarks No-long-jump zone!!!
8007 */
8008static void hmR0VmxClearIntNmiWindowsVmcs(PVMCPU pVCpu)
8009{
8010 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_INT_WINDOW_EXIT)
8011 {
8012 hmR0VmxClearIntWindowExitVmcs(pVCpu);
8013 Log4Func(("Cleared interrupt window\n"));
8014 }
8015
8016 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_NMI_WINDOW_EXIT)
8017 {
8018 hmR0VmxClearNmiWindowExitVmcs(pVCpu);
8019 Log4Func(("Cleared NMI window\n"));
8020 }
8021}
8022
8023
8024/**
8025 * Enters the VT-x session.
8026 *
8027 * @returns VBox status code.
8028 * @param pVCpu The cross context virtual CPU structure.
8029 * @param pHostCpu Pointer to the global CPU info struct.
8030 */
8031VMMR0DECL(int) VMXR0Enter(PVMCPU pVCpu, PHMGLOBALCPUINFO pHostCpu)
8032{
8033 AssertPtr(pVCpu);
8034 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fSupported);
8035 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8036 RT_NOREF(pHostCpu);
8037
8038 LogFlowFunc(("pVCpu=%p\n", pVCpu));
8039 Assert((pVCpu->hm.s.fCtxChanged & (HM_CHANGED_HOST_CONTEXT | HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE))
8040 == (HM_CHANGED_HOST_CONTEXT | HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE));
8041
8042#ifdef VBOX_STRICT
8043 /* At least verify VMX is enabled, since we can't check if we're in VMX root mode without #GP'ing. */
8044 RTCCUINTREG uHostCR4 = ASMGetCR4();
8045 if (!(uHostCR4 & X86_CR4_VMXE))
8046 {
8047 LogRelFunc(("X86_CR4_VMXE bit in CR4 is not set!\n"));
8048 return VERR_VMX_X86_CR4_VMXE_CLEARED;
8049 }
8050#endif
8051
8052 /*
8053 * Load the VCPU's VMCS as the current (and active) one.
8054 */
8055 Assert(pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_CLEAR);
8056 int rc = VMXActivateVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
8057 if (RT_FAILURE(rc))
8058 return rc;
8059
8060 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_ACTIVE;
8061 pVCpu->hm.s.fLeaveDone = false;
8062 Log4Func(("Activated Vmcs. HostCpuId=%u\n", RTMpCpuId()));
8063
8064 return VINF_SUCCESS;
8065}
8066
8067
8068/**
8069 * The thread-context callback (only on platforms which support it).
8070 *
8071 * @param enmEvent The thread-context event.
8072 * @param pVCpu The cross context virtual CPU structure.
8073 * @param fGlobalInit Whether global VT-x/AMD-V init. was used.
8074 * @thread EMT(pVCpu)
8075 */
8076VMMR0DECL(void) VMXR0ThreadCtxCallback(RTTHREADCTXEVENT enmEvent, PVMCPU pVCpu, bool fGlobalInit)
8077{
8078 NOREF(fGlobalInit);
8079
8080 switch (enmEvent)
8081 {
8082 case RTTHREADCTXEVENT_OUT:
8083 {
8084 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8085 Assert(VMMR0ThreadCtxHookIsEnabled(pVCpu));
8086 VMCPU_ASSERT_EMT(pVCpu);
8087
8088 /* No longjmps (logger flushes, locks) in this fragile context. */
8089 VMMRZCallRing3Disable(pVCpu);
8090 Log4Func(("Preempting: HostCpuId=%u\n", RTMpCpuId()));
8091
8092 /*
8093 * Restore host-state (FPU, debug etc.)
8094 */
8095 if (!pVCpu->hm.s.fLeaveDone)
8096 {
8097 /*
8098 * Do -not- import the guest-state here as we might already be in the middle of importing
8099 * it, esp. bad if we're holding the PGM lock, see comment in hmR0VmxImportGuestState().
8100 */
8101 hmR0VmxLeave(pVCpu, false /* fImportState */);
8102 pVCpu->hm.s.fLeaveDone = true;
8103 }
8104
8105 /* Leave HM context, takes care of local init (term). */
8106 int rc = HMR0LeaveCpu(pVCpu);
8107 AssertRC(rc); NOREF(rc);
8108
8109 /* Restore longjmp state. */
8110 VMMRZCallRing3Enable(pVCpu);
8111 STAM_REL_COUNTER_INC(&pVCpu->hm.s.StatSwitchPreempt);
8112 break;
8113 }
8114
8115 case RTTHREADCTXEVENT_IN:
8116 {
8117 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8118 Assert(VMMR0ThreadCtxHookIsEnabled(pVCpu));
8119 VMCPU_ASSERT_EMT(pVCpu);
8120
8121 /* No longjmps here, as we don't want to trigger preemption (& its hook) while resuming. */
8122 VMMRZCallRing3Disable(pVCpu);
8123 Log4Func(("Resumed: HostCpuId=%u\n", RTMpCpuId()));
8124
8125 /* Initialize the bare minimum state required for HM. This takes care of
8126 initializing VT-x if necessary (onlined CPUs, local init etc.) */
8127 int rc = hmR0EnterCpu(pVCpu);
8128 AssertRC(rc);
8129 Assert((pVCpu->hm.s.fCtxChanged & (HM_CHANGED_HOST_CONTEXT | HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE))
8130 == (HM_CHANGED_HOST_CONTEXT | HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE));
8131
8132 /* Load the active VMCS as the current one. */
8133 if (pVCpu->hm.s.vmx.uVmcsState & HMVMX_VMCS_STATE_CLEAR)
8134 {
8135 rc = VMXActivateVmcs(pVCpu->hm.s.vmx.HCPhysVmcs);
8136 AssertRC(rc); NOREF(rc);
8137 pVCpu->hm.s.vmx.uVmcsState = HMVMX_VMCS_STATE_ACTIVE;
8138 Log4Func(("Resumed: Activated Vmcs. HostCpuId=%u\n", RTMpCpuId()));
8139 }
8140 pVCpu->hm.s.fLeaveDone = false;
8141
8142 /* Restore longjmp state. */
8143 VMMRZCallRing3Enable(pVCpu);
8144 break;
8145 }
8146
8147 default:
8148 break;
8149 }
8150}
8151
8152
8153/**
8154 * Exports the host state into the VMCS host-state area.
8155 * Sets up the VM-exit MSR-load area.
8156 *
8157 * The CPU state will be loaded from these fields on every successful VM-exit.
8158 *
8159 * @returns VBox status code.
8160 * @param pVCpu The cross context virtual CPU structure.
8161 *
8162 * @remarks No-long-jump zone!!!
8163 */
8164static int hmR0VmxExportHostState(PVMCPU pVCpu)
8165{
8166 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8167
8168 int rc = VINF_SUCCESS;
8169 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_HOST_CONTEXT)
8170 {
8171 rc = hmR0VmxExportHostControlRegs();
8172 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8173
8174 rc = hmR0VmxExportHostSegmentRegs(pVCpu);
8175 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8176
8177 rc = hmR0VmxExportHostMsrs(pVCpu);
8178 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8179
8180 pVCpu->hm.s.fCtxChanged &= ~HM_CHANGED_HOST_CONTEXT;
8181 }
8182 return rc;
8183}
8184
8185
8186/**
8187 * Saves the host state in the VMCS host-state.
8188 *
8189 * @returns VBox status code.
8190 * @param pVCpu The cross context virtual CPU structure.
8191 *
8192 * @remarks No-long-jump zone!!!
8193 */
8194VMMR0DECL(int) VMXR0ExportHostState(PVMCPU pVCpu)
8195{
8196 AssertPtr(pVCpu);
8197 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8198
8199 /*
8200 * Export the host state here while entering HM context.
8201 * When thread-context hooks are used, we might get preempted and have to re-save the host
8202 * state but most of the time we won't be, so do it here before we disable interrupts.
8203 */
8204 return hmR0VmxExportHostState(pVCpu);
8205}
8206
8207
8208/**
8209 * Exports the guest state into the VMCS guest-state area.
8210 *
8211 * The will typically be done before VM-entry when the guest-CPU state and the
8212 * VMCS state may potentially be out of sync.
8213 *
8214 * Sets up the VM-entry MSR-load and VM-exit MSR-store areas. Sets up the
8215 * VM-entry controls.
8216 * Sets up the appropriate VMX non-root function to execute guest code based on
8217 * the guest CPU mode.
8218 *
8219 * @returns VBox strict status code.
8220 * @retval VINF_EM_RESCHEDULE_REM if we try to emulate non-paged guest code
8221 * without unrestricted guest access and the VMMDev is not presently
8222 * mapped (e.g. EFI32).
8223 *
8224 * @param pVCpu The cross context virtual CPU structure.
8225 *
8226 * @remarks No-long-jump zone!!!
8227 */
8228static VBOXSTRICTRC hmR0VmxExportGuestState(PVMCPU pVCpu)
8229{
8230 AssertPtr(pVCpu);
8231 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
8232
8233 LogFlowFunc(("pVCpu=%p\n", pVCpu));
8234
8235 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatExportGuestState, x);
8236
8237 /* Determine real-on-v86 mode. */
8238 pVCpu->hm.s.vmx.RealMode.fRealOnV86Active = false;
8239 if ( !pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fUnrestrictedGuest
8240 && CPUMIsGuestInRealModeEx(&pVCpu->cpum.GstCtx))
8241 pVCpu->hm.s.vmx.RealMode.fRealOnV86Active = true;
8242
8243 /*
8244 * Any ordering dependency among the sub-functions below must be explicitly stated using comments.
8245 * Ideally, assert that the cross-dependent bits are up-to-date at the point of using it.
8246 */
8247 int rc = hmR0VmxSelectVMRunHandler(pVCpu);
8248 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8249
8250 /* This needs to be done after hmR0VmxSelectVMRunHandler() as changing pfnStartVM may require VM-entry control updates. */
8251 rc = hmR0VmxExportGuestEntryCtls(pVCpu);
8252 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8253
8254 /* This needs to be done after hmR0VmxSelectVMRunHandler() as changing pfnStartVM may require VM-exit control updates. */
8255 rc = hmR0VmxExportGuestExitCtls(pVCpu);
8256 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8257
8258 rc = hmR0VmxExportGuestCR0(pVCpu);
8259 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8260
8261 VBOXSTRICTRC rcStrict = hmR0VmxExportGuestCR3AndCR4(pVCpu);
8262 if (rcStrict == VINF_SUCCESS)
8263 { /* likely */ }
8264 else
8265 {
8266 Assert(rcStrict == VINF_EM_RESCHEDULE_REM || RT_FAILURE_NP(rcStrict));
8267 return rcStrict;
8268 }
8269
8270 rc = hmR0VmxExportGuestSegmentRegs(pVCpu);
8271 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8272
8273 /* This needs to be done after hmR0VmxExportGuestEntryCtls() and hmR0VmxExportGuestExitCtls() as it
8274 may alter controls if we determine we don't have to swap EFER after all. */
8275 rc = hmR0VmxExportGuestMsrs(pVCpu);
8276 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8277
8278 rc = hmR0VmxExportGuestApicTpr(pVCpu);
8279 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8280
8281 rc = hmR0VmxExportGuestXcptIntercepts(pVCpu);
8282 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8283
8284 rc = hmR0VmxExportGuestRip(pVCpu);
8285 rc |= hmR0VmxExportGuestRsp(pVCpu);
8286 rc |= hmR0VmxExportGuestRflags(pVCpu);
8287 AssertLogRelMsgRCReturn(rc, ("rc=%Rrc\n", rc), rc);
8288
8289 /* Clear any bits that may be set but exported unconditionally or unused/reserved bits. */
8290 ASMAtomicUoAndU64(&pVCpu->hm.s.fCtxChanged, ~( (HM_CHANGED_GUEST_GPRS_MASK & ~HM_CHANGED_GUEST_RSP)
8291 | HM_CHANGED_GUEST_CR2
8292 | (HM_CHANGED_GUEST_DR_MASK & ~HM_CHANGED_GUEST_DR7)
8293 | HM_CHANGED_GUEST_X87
8294 | HM_CHANGED_GUEST_SSE_AVX
8295 | HM_CHANGED_GUEST_OTHER_XSAVE
8296 | HM_CHANGED_GUEST_XCRx
8297 | HM_CHANGED_GUEST_KERNEL_GS_BASE /* Part of lazy or auto load-store MSRs. */
8298 | HM_CHANGED_GUEST_SYSCALL_MSRS /* Part of lazy or auto load-store MSRs. */
8299 | HM_CHANGED_GUEST_TSC_AUX
8300 | HM_CHANGED_GUEST_OTHER_MSRS
8301 | HM_CHANGED_GUEST_HWVIRT
8302 | (HM_CHANGED_KEEPER_STATE_MASK & ~HM_CHANGED_VMX_MASK)));
8303
8304 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExportGuestState, x);
8305 return rc;
8306}
8307
8308
8309/**
8310 * Exports the state shared between the host and guest into the VMCS.
8311 *
8312 * @param pVCpu The cross context virtual CPU structure.
8313 *
8314 * @remarks No-long-jump zone!!!
8315 */
8316static void hmR0VmxExportSharedState(PVMCPU pVCpu)
8317{
8318 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8319 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
8320
8321 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_GUEST_DR_MASK)
8322 {
8323 int rc = hmR0VmxExportSharedDebugState(pVCpu);
8324 AssertRC(rc);
8325 pVCpu->hm.s.fCtxChanged &= ~HM_CHANGED_GUEST_DR_MASK;
8326
8327 /* Loading shared debug bits might have changed eflags.TF bit for debugging purposes. */
8328 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_GUEST_RFLAGS)
8329 {
8330 rc = hmR0VmxExportGuestRflags(pVCpu);
8331 AssertRC(rc);
8332 }
8333 }
8334
8335 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_VMX_GUEST_LAZY_MSRS)
8336 {
8337 hmR0VmxLazyLoadGuestMsrs(pVCpu);
8338 pVCpu->hm.s.fCtxChanged &= ~HM_CHANGED_VMX_GUEST_LAZY_MSRS;
8339 }
8340
8341 AssertMsg(!(pVCpu->hm.s.fCtxChanged & HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE),
8342 ("fCtxChanged=%#RX64\n", pVCpu->hm.s.fCtxChanged));
8343}
8344
8345
8346/**
8347 * Worker for loading the guest-state bits in the inner VT-x execution loop.
8348 *
8349 * @returns Strict VBox status code (i.e. informational status codes too).
8350 * @retval VINF_EM_RESCHEDULE_REM if we try to emulate non-paged guest code
8351 * without unrestricted guest access and the VMMDev is not presently
8352 * mapped (e.g. EFI32).
8353 *
8354 * @param pVCpu The cross context virtual CPU structure.
8355 *
8356 * @remarks No-long-jump zone!!!
8357 */
8358static VBOXSTRICTRC hmR0VmxExportGuestStateOptimal(PVMCPU pVCpu)
8359{
8360 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
8361 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
8362 Assert(VMMR0IsLogFlushDisabled(pVCpu));
8363
8364#ifdef HMVMX_ALWAYS_SYNC_FULL_GUEST_STATE
8365 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
8366#endif
8367
8368 /*
8369 * For many exits it's only RIP that changes and hence try to export it first
8370 * without going through a lot of change flag checks.
8371 */
8372 VBOXSTRICTRC rcStrict;
8373 uint64_t fCtxChanged = ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged);
8374 RT_UNTRUSTED_NONVOLATILE_COPY_FENCE();
8375 if ((fCtxChanged & (HM_CHANGED_ALL_GUEST & ~HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE)) == HM_CHANGED_GUEST_RIP)
8376 {
8377 rcStrict = hmR0VmxExportGuestRip(pVCpu);
8378 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
8379 { /* likely */}
8380 else
8381 AssertMsgFailedReturn(("hmR0VmxExportGuestRip failed! rc=%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)), rcStrict);
8382 STAM_COUNTER_INC(&pVCpu->hm.s.StatExportMinimal);
8383 }
8384 else if (fCtxChanged & (HM_CHANGED_ALL_GUEST & ~HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE))
8385 {
8386 rcStrict = hmR0VmxExportGuestState(pVCpu);
8387 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
8388 { /* likely */}
8389 else
8390 {
8391 AssertMsg(rcStrict == VINF_EM_RESCHEDULE_REM, ("hmR0VmxExportGuestState failed! rc=%Rrc\n",
8392 VBOXSTRICTRC_VAL(rcStrict)));
8393 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
8394 return rcStrict;
8395 }
8396 STAM_COUNTER_INC(&pVCpu->hm.s.StatExportFull);
8397 }
8398 else
8399 rcStrict = VINF_SUCCESS;
8400
8401#ifdef VBOX_STRICT
8402 /* All the guest state bits should be loaded except maybe the host context and/or the shared host/guest bits. */
8403 fCtxChanged = ASMAtomicUoReadU64(&pVCpu->hm.s.fCtxChanged);
8404 RT_UNTRUSTED_NONVOLATILE_COPY_FENCE();
8405 AssertMsg(!(fCtxChanged & (HM_CHANGED_ALL_GUEST & ~HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE)),
8406 ("fCtxChanged=%#RX64\n", fCtxChanged));
8407#endif
8408 return rcStrict;
8409}
8410
8411
8412/**
8413 * Does the preparations before executing guest code in VT-x.
8414 *
8415 * This may cause longjmps to ring-3 and may even result in rescheduling to the
8416 * recompiler/IEM. We must be cautious what we do here regarding committing
8417 * guest-state information into the VMCS assuming we assuredly execute the
8418 * guest in VT-x mode.
8419 *
8420 * If we fall back to the recompiler/IEM after updating the VMCS and clearing
8421 * the common-state (TRPM/forceflags), we must undo those changes so that the
8422 * recompiler/IEM can (and should) use them when it resumes guest execution.
8423 * Otherwise such operations must be done when we can no longer exit to ring-3.
8424 *
8425 * @returns Strict VBox status code (i.e. informational status codes too).
8426 * @retval VINF_SUCCESS if we can proceed with running the guest, interrupts
8427 * have been disabled.
8428 * @retval VINF_EM_RESET if a triple-fault occurs while injecting a
8429 * double-fault into the guest.
8430 * @retval VINF_EM_DBG_STEPPED if @a fStepping is true and an event was
8431 * dispatched directly.
8432 * @retval VINF_* scheduling changes, we have to go back to ring-3.
8433 *
8434 * @param pVCpu The cross context virtual CPU structure.
8435 * @param pVmxTransient Pointer to the VMX transient structure.
8436 * @param fStepping Set if called from hmR0VmxRunGuestCodeStep(). Makes
8437 * us ignore some of the reasons for returning to
8438 * ring-3, and return VINF_EM_DBG_STEPPED if event
8439 * dispatching took place.
8440 */
8441static VBOXSTRICTRC hmR0VmxPreRunGuest(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, bool fStepping)
8442{
8443 Assert(VMMRZCallRing3IsEnabled(pVCpu));
8444
8445#ifdef VBOX_WITH_NESTED_HWVIRT_ONLY_IN_IEM
8446 if (CPUMIsGuestInVmxNonRootMode(&pVCpu->cpum.GstCtx))
8447 {
8448 Log2(("hmR0VmxPreRunGuest: Rescheduling to IEM due to nested-hwvirt or forced IEM exec -> VINF_EM_RESCHEDULE_REM\n"));
8449 RT_NOREF3(pVCpu, pVmxTransient, fStepping);
8450 return VINF_EM_RESCHEDULE_REM;
8451 }
8452#endif
8453
8454#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE_IN_R0
8455 PGMRZDynMapFlushAutoSet(pVCpu);
8456#endif
8457
8458 /* Check force flag actions that might require us to go back to ring-3. */
8459 VBOXSTRICTRC rcStrict = hmR0VmxCheckForceFlags(pVCpu, fStepping);
8460 if (rcStrict == VINF_SUCCESS)
8461 { /* FFs doesn't get set all the time. */ }
8462 else
8463 return rcStrict;
8464
8465 /*
8466 * Setup the virtualized-APIC accesses.
8467 *
8468 * Note! This can cause a longjumps to R3 due to the acquisition of the PGM lock
8469 * in both PGMHandlerPhysicalReset() and IOMMMIOMapMMIOHCPage(), see @bugref{8721}.
8470 *
8471 * This is the reason we do it here and not in hmR0VmxExportGuestState().
8472 */
8473 PVM pVM = pVCpu->CTX_SUFF(pVM);
8474 if ( !pVCpu->hm.s.vmx.u64MsrApicBase
8475 && (pVCpu->hm.s.vmx.u32ProcCtls2 & VMX_PROC_CTLS2_VIRT_APIC_ACCESS)
8476 && PDMHasApic(pVM))
8477 {
8478 uint64_t const u64MsrApicBase = APICGetBaseMsrNoCheck(pVCpu);
8479 Assert(u64MsrApicBase);
8480 Assert(pVM->hm.s.vmx.HCPhysApicAccess);
8481
8482 RTGCPHYS const GCPhysApicBase = u64MsrApicBase & PAGE_BASE_GC_MASK;
8483
8484 /* Unalias any existing mapping. */
8485 int rc = PGMHandlerPhysicalReset(pVM, GCPhysApicBase);
8486 AssertRCReturn(rc, rc);
8487
8488 /* Map the HC APIC-access page in place of the MMIO page, also updates the shadow page tables if necessary. */
8489 Log4Func(("Mapped HC APIC-access page at %#RGp\n", GCPhysApicBase));
8490 rc = IOMMMIOMapMMIOHCPage(pVM, pVCpu, GCPhysApicBase, pVM->hm.s.vmx.HCPhysApicAccess, X86_PTE_RW | X86_PTE_P);
8491 AssertRCReturn(rc, rc);
8492
8493 /* Update the per-VCPU cache of the APIC base MSR. */
8494 pVCpu->hm.s.vmx.u64MsrApicBase = u64MsrApicBase;
8495 }
8496
8497 if (TRPMHasTrap(pVCpu))
8498 hmR0VmxTrpmTrapToPendingEvent(pVCpu);
8499 uint32_t fIntrState = hmR0VmxEvaluatePendingEvent(pVCpu);
8500
8501 /*
8502 * Event injection may take locks (currently the PGM lock for real-on-v86 case) and thus
8503 * needs to be done with longjmps or interrupts + preemption enabled. Event injection might
8504 * also result in triple-faulting the VM.
8505 */
8506 rcStrict = hmR0VmxInjectPendingEvent(pVCpu, fIntrState, fStepping);
8507 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
8508 { /* likely */ }
8509 else
8510 {
8511 AssertMsg(rcStrict == VINF_EM_RESET || (rcStrict == VINF_EM_DBG_STEPPED && fStepping),
8512 ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
8513 return rcStrict;
8514 }
8515
8516 /*
8517 * A longjump might result in importing CR3 even for VM-exits that don't necessarily
8518 * import CR3 themselves. We will need to update them here, as even as late as the above
8519 * hmR0VmxInjectPendingEvent() call may lazily import guest-CPU state on demand causing
8520 * the below force flags to be set.
8521 */
8522 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3))
8523 {
8524 Assert(!(ASMAtomicUoReadU64(&pVCpu->cpum.GstCtx.fExtrn) & CPUMCTX_EXTRN_CR3));
8525 int rc2 = PGMUpdateCR3(pVCpu, CPUMGetGuestCR3(pVCpu));
8526 AssertMsgReturn(rc2 == VINF_SUCCESS || rc2 == VINF_PGM_SYNC_CR3,
8527 ("%Rrc\n", rc2), RT_FAILURE_NP(rc2) ? rc2 : VERR_IPE_UNEXPECTED_INFO_STATUS);
8528 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3));
8529 }
8530 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES))
8531 {
8532 PGMGstUpdatePaePdpes(pVCpu, &pVCpu->hm.s.aPdpes[0]);
8533 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES));
8534 }
8535
8536 /*
8537 * No longjmps to ring-3 from this point on!!!
8538 * Asserts() will still longjmp to ring-3 (but won't return), which is intentional, better than a kernel panic.
8539 * This also disables flushing of the R0-logger instance (if any).
8540 */
8541 VMMRZCallRing3Disable(pVCpu);
8542
8543 /*
8544 * Export the guest state bits.
8545 *
8546 * We cannot perform longjmps while loading the guest state because we do not preserve the
8547 * host/guest state (although the VMCS will be preserved) across longjmps which can cause
8548 * CPU migration.
8549 *
8550 * If we are injecting events to a real-on-v86 mode guest, we will have to update
8551 * RIP and some segment registers, i.e. hmR0VmxInjectPendingEvent()->hmR0VmxInjectEventVmcs().
8552 * Hence, loading of the guest state needs to be done -after- injection of events.
8553 */
8554 rcStrict = hmR0VmxExportGuestStateOptimal(pVCpu);
8555 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
8556 { /* likely */ }
8557 else
8558 {
8559 VMMRZCallRing3Enable(pVCpu);
8560 return rcStrict;
8561 }
8562
8563 /*
8564 * We disable interrupts so that we don't miss any interrupts that would flag preemption
8565 * (IPI/timers etc.) when thread-context hooks aren't used and we've been running with
8566 * preemption disabled for a while. Since this is purly to aid the
8567 * RTThreadPreemptIsPending() code, it doesn't matter that it may temporarily reenable and
8568 * disable interrupt on NT.
8569 *
8570 * We need to check for force-flags that could've possible been altered since we last
8571 * checked them (e.g. by PDMGetInterrupt() leaving the PDM critical section,
8572 * see @bugref{6398}).
8573 *
8574 * We also check a couple of other force-flags as a last opportunity to get the EMT back
8575 * to ring-3 before executing guest code.
8576 */
8577 pVmxTransient->fEFlags = ASMIntDisableFlags();
8578
8579 if ( ( !VM_FF_IS_ANY_SET(pVM, VM_FF_EMT_RENDEZVOUS | VM_FF_TM_VIRTUAL_SYNC)
8580 && !VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_HM_TO_R3_MASK))
8581 || ( fStepping /* Optimized for the non-stepping case, so a bit of unnecessary work when stepping. */
8582 && !VMCPU_FF_IS_ANY_SET(pVCpu, VMCPU_FF_HM_TO_R3_MASK & ~(VMCPU_FF_TIMER | VMCPU_FF_PDM_CRITSECT))) )
8583 {
8584 if (!RTThreadPreemptIsPending(NIL_RTTHREAD))
8585 {
8586 pVCpu->hm.s.Event.fPending = false;
8587
8588 /*
8589 * We've injected any pending events. This is really the point of no return (to ring-3).
8590 *
8591 * Note! The caller expects to continue with interrupts & longjmps disabled on successful
8592 * returns from this function, so don't enable them here.
8593 */
8594 return VINF_SUCCESS;
8595 }
8596
8597 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchPendingHostIrq);
8598 rcStrict = VINF_EM_RAW_INTERRUPT;
8599 }
8600 else
8601 {
8602 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHmToR3FF);
8603 rcStrict = VINF_EM_RAW_TO_R3;
8604 }
8605
8606 ASMSetFlags(pVmxTransient->fEFlags);
8607 VMMRZCallRing3Enable(pVCpu);
8608
8609 return rcStrict;
8610}
8611
8612
8613/**
8614 * Prepares to run guest code in VT-x and we've committed to doing so. This
8615 * means there is no backing out to ring-3 or anywhere else at this
8616 * point.
8617 *
8618 * @param pVCpu The cross context virtual CPU structure.
8619 * @param pVmxTransient Pointer to the VMX transient structure.
8620 *
8621 * @remarks Called with preemption disabled.
8622 * @remarks No-long-jump zone!!!
8623 */
8624static void hmR0VmxPreRunGuestCommitted(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
8625{
8626 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
8627 Assert(VMMR0IsLogFlushDisabled(pVCpu));
8628 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
8629
8630 /*
8631 * Indicate start of guest execution and where poking EMT out of guest-context is recognized.
8632 */
8633 VMCPU_ASSERT_STATE(pVCpu, VMCPUSTATE_STARTED_HM);
8634 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_EXEC);
8635
8636 PVM pVM = pVCpu->CTX_SUFF(pVM);
8637 if (!CPUMIsGuestFPUStateActive(pVCpu))
8638 {
8639 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatLoadGuestFpuState, x);
8640 if (CPUMR0LoadGuestFPU(pVM, pVCpu) == VINF_CPUM_HOST_CR0_MODIFIED)
8641 pVCpu->hm.s.fCtxChanged |= HM_CHANGED_HOST_CONTEXT;
8642 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatLoadGuestFpuState, x);
8643 STAM_COUNTER_INC(&pVCpu->hm.s.StatLoadGuestFpu);
8644 }
8645
8646 /*
8647 * Lazy-update of the host MSRs values in the auto-load/store MSR area.
8648 */
8649 if ( !pVCpu->hm.s.vmx.fUpdatedHostMsrs
8650 && pVCpu->hm.s.vmx.cMsrs > 0)
8651 hmR0VmxUpdateAutoLoadStoreHostMsrs(pVCpu);
8652
8653 /*
8654 * Re-save the host state bits as we may've been preempted (only happens when
8655 * thread-context hooks are used or when hmR0VmxSetupVMRunHandler() changes pfnStartVM).
8656 * Note that the 64-on-32 switcher saves the (64-bit) host state into the VMCS and
8657 * if we change the switcher back to 32-bit, we *must* save the 32-bit host state here.
8658 * See @bugref{8432}.
8659 */
8660 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_HOST_CONTEXT)
8661 {
8662 int rc = hmR0VmxExportHostState(pVCpu);
8663 AssertRC(rc);
8664 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchPreemptExportHostState);
8665 }
8666 Assert(!(pVCpu->hm.s.fCtxChanged & HM_CHANGED_HOST_CONTEXT));
8667
8668 /*
8669 * Export the state shared between host and guest (FPU, debug, lazy MSRs).
8670 */
8671 if (pVCpu->hm.s.fCtxChanged & HM_CHANGED_VMX_HOST_GUEST_SHARED_STATE)
8672 hmR0VmxExportSharedState(pVCpu);
8673 AssertMsg(!pVCpu->hm.s.fCtxChanged, ("fCtxChanged=%#RX64\n", pVCpu->hm.s.fCtxChanged));
8674
8675 /* Store status of the shared guest-host state at the time of VM-entry. */
8676#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
8677 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.GstCtx))
8678 {
8679 pVmxTransient->fWasGuestDebugStateActive = CPUMIsGuestDebugStateActivePending(pVCpu);
8680 pVmxTransient->fWasHyperDebugStateActive = CPUMIsHyperDebugStateActivePending(pVCpu);
8681 }
8682 else
8683#endif
8684 {
8685 pVmxTransient->fWasGuestDebugStateActive = CPUMIsGuestDebugStateActive(pVCpu);
8686 pVmxTransient->fWasHyperDebugStateActive = CPUMIsHyperDebugStateActive(pVCpu);
8687 }
8688
8689 /*
8690 * Cache the TPR-shadow for checking on every VM-exit if it might have changed.
8691 */
8692 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW)
8693 pVmxTransient->u8GuestTpr = pVCpu->hm.s.vmx.pbVirtApic[XAPIC_OFF_TPR];
8694
8695 PHMGLOBALCPUINFO pCpu = hmR0GetCurrentCpu();
8696 RTCPUID idCurrentCpu = pCpu->idCpu;
8697 if ( pVmxTransient->fUpdateTscOffsettingAndPreemptTimer
8698 || idCurrentCpu != pVCpu->hm.s.idLastCpu)
8699 {
8700 hmR0VmxUpdateTscOffsettingAndPreemptTimer(pVCpu);
8701 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = false;
8702 }
8703
8704 ASMAtomicWriteBool(&pVCpu->hm.s.fCheckedTLBFlush, true); /* Used for TLB flushing, set this across the world switch. */
8705 hmR0VmxFlushTaggedTlb(pVCpu, pCpu); /* Invalidate the appropriate guest entries from the TLB. */
8706 Assert(idCurrentCpu == pVCpu->hm.s.idLastCpu);
8707 pVCpu->hm.s.vmx.LastError.idCurrentCpu = idCurrentCpu; /* Update the error reporting info. with the current host CPU. */
8708
8709 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatEntry, &pVCpu->hm.s.StatInGC, x);
8710
8711 TMNotifyStartOfExecution(pVCpu); /* Finally, notify TM to resume its clocks as we're about
8712 to start executing. */
8713
8714 /*
8715 * Load the TSC_AUX MSR when we are not intercepting RDTSCP.
8716 */
8717 if (pVCpu->hm.s.vmx.u32ProcCtls2 & VMX_PROC_CTLS2_RDTSCP)
8718 {
8719 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_RDTSC_EXIT))
8720 {
8721 bool fMsrUpdated;
8722 hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_TSC_AUX);
8723 int rc2 = hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_K8_TSC_AUX, CPUMGetGuestTscAux(pVCpu), true /* fUpdateHostMsr */,
8724 &fMsrUpdated);
8725 AssertRC(rc2);
8726 Assert(fMsrUpdated || pVCpu->hm.s.vmx.fUpdatedHostMsrs);
8727 /* Finally, mark that all host MSR values are updated so we don't redo it without leaving VT-x. See @bugref{6956}. */
8728 pVCpu->hm.s.vmx.fUpdatedHostMsrs = true;
8729 }
8730 else
8731 {
8732 hmR0VmxRemoveAutoLoadStoreMsr(pVCpu, MSR_K8_TSC_AUX);
8733 Assert(!pVCpu->hm.s.vmx.cMsrs || pVCpu->hm.s.vmx.fUpdatedHostMsrs);
8734 }
8735 }
8736
8737 if (pVM->cpum.ro.GuestFeatures.fIbrs)
8738 {
8739 bool fMsrUpdated;
8740 hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_OTHER_MSRS);
8741 int rc2 = hmR0VmxAddAutoLoadStoreMsr(pVCpu, MSR_IA32_SPEC_CTRL, CPUMGetGuestSpecCtrl(pVCpu), true /* fUpdateHostMsr */,
8742 &fMsrUpdated);
8743 AssertRC(rc2);
8744 Assert(fMsrUpdated || pVCpu->hm.s.vmx.fUpdatedHostMsrs);
8745 /* Finally, mark that all host MSR values are updated so we don't redo it without leaving VT-x. See @bugref{6956}. */
8746 pVCpu->hm.s.vmx.fUpdatedHostMsrs = true;
8747 }
8748
8749#ifdef VBOX_STRICT
8750 hmR0VmxCheckAutoLoadStoreMsrs(pVCpu);
8751 hmR0VmxCheckHostEferMsr(pVCpu);
8752 AssertRC(hmR0VmxCheckVmcsCtls(pVCpu));
8753#endif
8754#ifdef HMVMX_ALWAYS_CHECK_GUEST_STATE
8755 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS))
8756 {
8757 uint32_t uInvalidReason = hmR0VmxCheckGuestState(pVCpu);
8758 if (uInvalidReason != VMX_IGS_REASON_NOT_FOUND)
8759 Log4(("hmR0VmxCheckGuestState returned %#x\n", uInvalidReason));
8760 }
8761#endif
8762}
8763
8764
8765/**
8766 * Performs some essential restoration of state after running guest code in
8767 * VT-x.
8768 *
8769 * @param pVCpu The cross context virtual CPU structure.
8770 * @param pVmxTransient Pointer to the VMX transient structure.
8771 * @param rcVMRun Return code of VMLAUNCH/VMRESUME.
8772 *
8773 * @remarks Called with interrupts disabled, and returns with interrupts enabled!
8774 *
8775 * @remarks No-long-jump zone!!! This function will however re-enable longjmps
8776 * unconditionally when it is safe to do so.
8777 */
8778static void hmR0VmxPostRunGuest(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, int rcVMRun)
8779{
8780 uint64_t const uHostTsc = ASMReadTSC();
8781 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
8782
8783 ASMAtomicWriteBool(&pVCpu->hm.s.fCheckedTLBFlush, false); /* See HMInvalidatePageOnAllVCpus(): used for TLB flushing. */
8784 ASMAtomicIncU32(&pVCpu->hm.s.cWorldSwitchExits); /* Initialized in vmR3CreateUVM(): used for EMT poking. */
8785 pVCpu->hm.s.fCtxChanged = 0; /* Exits/longjmps to ring-3 requires saving the guest state. */
8786 pVmxTransient->fVmcsFieldsRead = 0; /* Transient fields need to be read from the VMCS. */
8787 pVmxTransient->fVectoringPF = false; /* Vectoring page-fault needs to be determined later. */
8788 pVmxTransient->fVectoringDoublePF = false; /* Vectoring double page-fault needs to be determined later. */
8789
8790 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_RDTSC_EXIT))
8791 TMCpuTickSetLastSeen(pVCpu, uHostTsc + pVCpu->hm.s.vmx.u64TscOffset);
8792
8793 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatInGC, &pVCpu->hm.s.StatPreExit, x);
8794 TMNotifyEndOfExecution(pVCpu); /* Notify TM that the guest is no longer running. */
8795 Assert(!ASMIntAreEnabled());
8796 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_HM);
8797
8798#if HC_ARCH_BITS == 64
8799 pVCpu->hm.s.vmx.fRestoreHostFlags |= VMX_RESTORE_HOST_REQUIRED; /* Host state messed up by VT-x, we must restore. */
8800#endif
8801#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
8802 /* The 64-on-32 switcher maintains uVmcsState on its own and we need to leave it alone here. */
8803 if (pVCpu->hm.s.vmx.pfnStartVM != VMXR0SwitcherStartVM64)
8804 pVCpu->hm.s.vmx.uVmcsState |= HMVMX_VMCS_STATE_LAUNCHED; /* Use VMRESUME instead of VMLAUNCH in the next run. */
8805#else
8806 pVCpu->hm.s.vmx.uVmcsState |= HMVMX_VMCS_STATE_LAUNCHED; /* Use VMRESUME instead of VMLAUNCH in the next run. */
8807#endif
8808#ifdef VBOX_STRICT
8809 hmR0VmxCheckHostEferMsr(pVCpu); /* Verify that VMRUN/VMLAUNCH didn't modify host EFER. */
8810#endif
8811 ASMSetFlags(pVmxTransient->fEFlags); /* Enable interrupts. */
8812
8813 /* Save the basic VM-exit reason. Refer Intel spec. 24.9.1 "Basic VM-exit Information". */
8814 uint32_t uExitReason;
8815 int rc = VMXReadVmcs32(VMX_VMCS32_RO_EXIT_REASON, &uExitReason);
8816 rc |= hmR0VmxReadEntryIntInfoVmcs(pVmxTransient);
8817 AssertRC(rc);
8818 pVmxTransient->uExitReason = VMX_EXIT_REASON_BASIC(uExitReason);
8819 pVmxTransient->fVMEntryFailed = VMX_EXIT_REASON_HAS_ENTRY_FAILED(uExitReason);
8820
8821 if (rcVMRun == VINF_SUCCESS)
8822 {
8823 /*
8824 * Update the VM-exit history array here even if the VM-entry failed due to:
8825 * - Invalid guest state.
8826 * - MSR loading.
8827 * - Machine-check event.
8828 *
8829 * In any of the above cases we will still have a "valid" VM-exit reason
8830 * despite @a fVMEntryFailed being false.
8831 *
8832 * See Intel spec. 26.7 "VM-Entry failures during or after loading guest state".
8833 *
8834 * Note! We don't have CS or RIP at this point. Will probably address that later
8835 * by amending the history entry added here.
8836 */
8837 EMHistoryAddExit(pVCpu, EMEXIT_MAKE_FT(EMEXIT_F_KIND_VMX, pVmxTransient->uExitReason & EMEXIT_F_TYPE_MASK),
8838 UINT64_MAX, uHostTsc);
8839
8840 if (!pVmxTransient->fVMEntryFailed)
8841 {
8842 VMMRZCallRing3Enable(pVCpu);
8843
8844 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_CR3));
8845 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES));
8846
8847#if defined(HMVMX_ALWAYS_SYNC_FULL_GUEST_STATE) || defined(HMVMX_ALWAYS_SAVE_FULL_GUEST_STATE)
8848 rc = hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
8849 AssertRC(rc);
8850#elif defined(HMVMX_ALWAYS_SAVE_GUEST_RFLAGS)
8851 rc = hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_RFLAGS);
8852 AssertRC(rc);
8853#else
8854 /*
8855 * Import the guest-interruptibility state always as we need it while evaluating
8856 * injecting events on re-entry.
8857 *
8858 * We don't import CR0 (when Unrestricted guest execution is unavailable) despite
8859 * checking for real-mode while exporting the state because all bits that cause
8860 * mode changes wrt CR0 are intercepted.
8861 */
8862 rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_HM_VMX_INT_STATE);
8863 AssertRC(rc);
8864#endif
8865
8866 /*
8867 * Sync the TPR shadow with our APIC state.
8868 */
8869 if ( (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW)
8870 && pVmxTransient->u8GuestTpr != pVCpu->hm.s.vmx.pbVirtApic[XAPIC_OFF_TPR])
8871 {
8872 rc = APICSetTpr(pVCpu, pVCpu->hm.s.vmx.pbVirtApic[XAPIC_OFF_TPR]);
8873 AssertRC(rc);
8874 ASMAtomicOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_APIC_TPR);
8875 }
8876
8877 Assert(VMMRZCallRing3IsEnabled(pVCpu));
8878 return;
8879 }
8880 }
8881 else
8882 Log4Func(("VM-entry failure: rcVMRun=%Rrc fVMEntryFailed=%RTbool\n", rcVMRun, pVmxTransient->fVMEntryFailed));
8883
8884 VMMRZCallRing3Enable(pVCpu);
8885}
8886
8887
8888/**
8889 * Runs the guest code using VT-x the normal way.
8890 *
8891 * @returns VBox status code.
8892 * @param pVCpu The cross context virtual CPU structure.
8893 *
8894 * @note Mostly the same as hmR0VmxRunGuestCodeStep().
8895 */
8896static VBOXSTRICTRC hmR0VmxRunGuestCodeNormal(PVMCPU pVCpu)
8897{
8898 VMXTRANSIENT VmxTransient;
8899 VmxTransient.fUpdateTscOffsettingAndPreemptTimer = true;
8900 VBOXSTRICTRC rcStrict = VERR_INTERNAL_ERROR_5;
8901 uint32_t cLoops = 0;
8902
8903 for (;; cLoops++)
8904 {
8905 Assert(!HMR0SuspendPending());
8906 HMVMX_ASSERT_CPU_SAFE(pVCpu);
8907
8908 /* Preparatory work for running guest code, this may force us to return
8909 to ring-3. This bugger disables interrupts on VINF_SUCCESS! */
8910 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatEntry, x);
8911 rcStrict = hmR0VmxPreRunGuest(pVCpu, &VmxTransient, false /* fStepping */);
8912 if (rcStrict != VINF_SUCCESS)
8913 break;
8914
8915 hmR0VmxPreRunGuestCommitted(pVCpu, &VmxTransient);
8916 int rcRun = hmR0VmxRunGuest(pVCpu);
8917
8918 /* Restore any residual host-state and save any bits shared between host
8919 and guest into the guest-CPU state. Re-enables interrupts! */
8920 hmR0VmxPostRunGuest(pVCpu, &VmxTransient, rcRun);
8921
8922 /* Check for errors with running the VM (VMLAUNCH/VMRESUME). */
8923 if (RT_SUCCESS(rcRun))
8924 { /* very likely */ }
8925 else
8926 {
8927 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatPreExit, x);
8928 hmR0VmxReportWorldSwitchError(pVCpu, rcRun, &VmxTransient);
8929 return rcRun;
8930 }
8931
8932 /* Profile the VM-exit. */
8933 AssertMsg(VmxTransient.uExitReason <= VMX_EXIT_MAX, ("%#x\n", VmxTransient.uExitReason));
8934 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitAll);
8935 STAM_COUNTER_INC(&pVCpu->hm.s.paStatExitReasonR0[VmxTransient.uExitReason & MASK_EXITREASON_STAT]);
8936 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatPreExit, &pVCpu->hm.s.StatExitHandling, x);
8937 HMVMX_START_EXIT_DISPATCH_PROF();
8938
8939 VBOXVMM_R0_HMVMX_VMEXIT_NOCTX(pVCpu, &pVCpu->cpum.GstCtx, VmxTransient.uExitReason);
8940
8941 /* Handle the VM-exit. */
8942#ifdef HMVMX_USE_FUNCTION_TABLE
8943 rcStrict = g_apfnVMExitHandlers[VmxTransient.uExitReason](pVCpu, &VmxTransient);
8944#else
8945 rcStrict = hmR0VmxHandleExit(pVCpu, &VmxTransient, VmxTransient.uExitReason);
8946#endif
8947 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitHandling, x);
8948 if (rcStrict == VINF_SUCCESS)
8949 {
8950 if (cLoops <= pVCpu->CTX_SUFF(pVM)->hm.s.cMaxResumeLoops)
8951 continue; /* likely */
8952 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchMaxResumeLoops);
8953 rcStrict = VINF_EM_RAW_INTERRUPT;
8954 }
8955 break;
8956 }
8957
8958 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatEntry, x);
8959 return rcStrict;
8960}
8961
8962
8963
8964/** @name Execution loop for single stepping, DBGF events and expensive Dtrace
8965 * probes.
8966 *
8967 * The following few functions and associated structure contains the bloat
8968 * necessary for providing detailed debug events and dtrace probes as well as
8969 * reliable host side single stepping. This works on the principle of
8970 * "subclassing" the normal execution loop and workers. We replace the loop
8971 * method completely and override selected helpers to add necessary adjustments
8972 * to their core operation.
8973 *
8974 * The goal is to keep the "parent" code lean and mean, so as not to sacrifice
8975 * any performance for debug and analysis features.
8976 *
8977 * @{
8978 */
8979
8980/**
8981 * Transient per-VCPU debug state of VMCS and related info. we save/restore in
8982 * the debug run loop.
8983 */
8984typedef struct VMXRUNDBGSTATE
8985{
8986 /** The RIP we started executing at. This is for detecting that we stepped. */
8987 uint64_t uRipStart;
8988 /** The CS we started executing with. */
8989 uint16_t uCsStart;
8990
8991 /** Whether we've actually modified the 1st execution control field. */
8992 bool fModifiedProcCtls : 1;
8993 /** Whether we've actually modified the 2nd execution control field. */
8994 bool fModifiedProcCtls2 : 1;
8995 /** Whether we've actually modified the exception bitmap. */
8996 bool fModifiedXcptBitmap : 1;
8997
8998 /** We desire the modified the CR0 mask to be cleared. */
8999 bool fClearCr0Mask : 1;
9000 /** We desire the modified the CR4 mask to be cleared. */
9001 bool fClearCr4Mask : 1;
9002 /** Stuff we need in VMX_VMCS32_CTRL_PROC_EXEC. */
9003 uint32_t fCpe1Extra;
9004 /** Stuff we do not want in VMX_VMCS32_CTRL_PROC_EXEC. */
9005 uint32_t fCpe1Unwanted;
9006 /** Stuff we need in VMX_VMCS32_CTRL_PROC_EXEC2. */
9007 uint32_t fCpe2Extra;
9008 /** Extra stuff we need in VMX_VMCS32_CTRL_EXCEPTION_BITMAP. */
9009 uint32_t bmXcptExtra;
9010 /** The sequence number of the Dtrace provider settings the state was
9011 * configured against. */
9012 uint32_t uDtraceSettingsSeqNo;
9013 /** VM-exits to check (one bit per VM-exit). */
9014 uint32_t bmExitsToCheck[3];
9015
9016 /** The initial VMX_VMCS32_CTRL_PROC_EXEC value (helps with restore). */
9017 uint32_t fProcCtlsInitial;
9018 /** The initial VMX_VMCS32_CTRL_PROC_EXEC2 value (helps with restore). */
9019 uint32_t fProcCtls2Initial;
9020 /** The initial VMX_VMCS32_CTRL_EXCEPTION_BITMAP value (helps with restore). */
9021 uint32_t bmXcptInitial;
9022} VMXRUNDBGSTATE;
9023AssertCompileMemberSize(VMXRUNDBGSTATE, bmExitsToCheck, (VMX_EXIT_MAX + 1 + 31) / 32 * 4);
9024typedef VMXRUNDBGSTATE *PVMXRUNDBGSTATE;
9025
9026
9027/**
9028 * Initializes the VMXRUNDBGSTATE structure.
9029 *
9030 * @param pVCpu The cross context virtual CPU structure of the
9031 * calling EMT.
9032 * @param pDbgState The structure to initialize.
9033 */
9034static void hmR0VmxRunDebugStateInit(PVMCPU pVCpu, PVMXRUNDBGSTATE pDbgState)
9035{
9036 pDbgState->uRipStart = pVCpu->cpum.GstCtx.rip;
9037 pDbgState->uCsStart = pVCpu->cpum.GstCtx.cs.Sel;
9038
9039 pDbgState->fModifiedProcCtls = false;
9040 pDbgState->fModifiedProcCtls2 = false;
9041 pDbgState->fModifiedXcptBitmap = false;
9042 pDbgState->fClearCr0Mask = false;
9043 pDbgState->fClearCr4Mask = false;
9044 pDbgState->fCpe1Extra = 0;
9045 pDbgState->fCpe1Unwanted = 0;
9046 pDbgState->fCpe2Extra = 0;
9047 pDbgState->bmXcptExtra = 0;
9048 pDbgState->fProcCtlsInitial = pVCpu->hm.s.vmx.u32ProcCtls;
9049 pDbgState->fProcCtls2Initial = pVCpu->hm.s.vmx.u32ProcCtls2;
9050 pDbgState->bmXcptInitial = pVCpu->hm.s.vmx.u32XcptBitmap;
9051}
9052
9053
9054/**
9055 * Updates the VMSC fields with changes requested by @a pDbgState.
9056 *
9057 * This is performed after hmR0VmxPreRunGuestDebugStateUpdate as well
9058 * immediately before executing guest code, i.e. when interrupts are disabled.
9059 * We don't check status codes here as we cannot easily assert or return in the
9060 * latter case.
9061 *
9062 * @param pVCpu The cross context virtual CPU structure.
9063 * @param pDbgState The debug state.
9064 */
9065static void hmR0VmxPreRunGuestDebugStateApply(PVMCPU pVCpu, PVMXRUNDBGSTATE pDbgState)
9066{
9067 /*
9068 * Ensure desired flags in VMCS control fields are set.
9069 * (Ignoring write failure here, as we're committed and it's just debug extras.)
9070 *
9071 * Note! We load the shadow CR0 & CR4 bits when we flag the clearing, so
9072 * there should be no stale data in pCtx at this point.
9073 */
9074 if ( (pVCpu->hm.s.vmx.u32ProcCtls & pDbgState->fCpe1Extra) != pDbgState->fCpe1Extra
9075 || (pVCpu->hm.s.vmx.u32ProcCtls & pDbgState->fCpe1Unwanted))
9076 {
9077 pVCpu->hm.s.vmx.u32ProcCtls |= pDbgState->fCpe1Extra;
9078 pVCpu->hm.s.vmx.u32ProcCtls &= ~pDbgState->fCpe1Unwanted;
9079 VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
9080 Log6Func(("VMX_VMCS32_CTRL_PROC_EXEC: %#RX32\n", pVCpu->hm.s.vmx.u32ProcCtls));
9081 pDbgState->fModifiedProcCtls = true;
9082 }
9083
9084 if ((pVCpu->hm.s.vmx.u32ProcCtls2 & pDbgState->fCpe2Extra) != pDbgState->fCpe2Extra)
9085 {
9086 pVCpu->hm.s.vmx.u32ProcCtls2 |= pDbgState->fCpe2Extra;
9087 VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC2, pVCpu->hm.s.vmx.u32ProcCtls2);
9088 Log6Func(("VMX_VMCS32_CTRL_PROC_EXEC2: %#RX32\n", pVCpu->hm.s.vmx.u32ProcCtls2));
9089 pDbgState->fModifiedProcCtls2 = true;
9090 }
9091
9092 if ((pVCpu->hm.s.vmx.u32XcptBitmap & pDbgState->bmXcptExtra) != pDbgState->bmXcptExtra)
9093 {
9094 pVCpu->hm.s.vmx.u32XcptBitmap |= pDbgState->bmXcptExtra;
9095 VMXWriteVmcs32(VMX_VMCS32_CTRL_EXCEPTION_BITMAP, pVCpu->hm.s.vmx.u32XcptBitmap);
9096 Log6Func(("VMX_VMCS32_CTRL_EXCEPTION_BITMAP: %#RX32\n", pVCpu->hm.s.vmx.u32XcptBitmap));
9097 pDbgState->fModifiedXcptBitmap = true;
9098 }
9099
9100 if (pDbgState->fClearCr0Mask && pVCpu->hm.s.vmx.u32Cr0Mask != 0)
9101 {
9102 pVCpu->hm.s.vmx.u32Cr0Mask = 0;
9103 VMXWriteVmcs32(VMX_VMCS_CTRL_CR0_MASK, 0);
9104 Log6Func(("VMX_VMCS_CTRL_CR0_MASK: 0\n"));
9105 }
9106
9107 if (pDbgState->fClearCr4Mask && pVCpu->hm.s.vmx.u32Cr4Mask != 0)
9108 {
9109 pVCpu->hm.s.vmx.u32Cr4Mask = 0;
9110 VMXWriteVmcs32(VMX_VMCS_CTRL_CR4_MASK, 0);
9111 Log6Func(("VMX_VMCS_CTRL_CR4_MASK: 0\n"));
9112 }
9113}
9114
9115
9116/**
9117 * Restores VMCS fields that were changed by hmR0VmxPreRunGuestDebugStateApply for
9118 * re-entry next time around.
9119 *
9120 * @returns Strict VBox status code (i.e. informational status codes too).
9121 * @param pVCpu The cross context virtual CPU structure.
9122 * @param pDbgState The debug state.
9123 * @param rcStrict The return code from executing the guest using single
9124 * stepping.
9125 */
9126static VBOXSTRICTRC hmR0VmxRunDebugStateRevert(PVMCPU pVCpu, PVMXRUNDBGSTATE pDbgState, VBOXSTRICTRC rcStrict)
9127{
9128 /*
9129 * Restore VM-exit control settings as we may not reenter this function the
9130 * next time around.
9131 */
9132 /* We reload the initial value, trigger what we can of recalculations the
9133 next time around. From the looks of things, that's all that's required atm. */
9134 if (pDbgState->fModifiedProcCtls)
9135 {
9136 if (!(pDbgState->fProcCtlsInitial & VMX_PROC_CTLS_MOV_DR_EXIT) && CPUMIsHyperDebugStateActive(pVCpu))
9137 pDbgState->fProcCtlsInitial |= VMX_PROC_CTLS_MOV_DR_EXIT; /* Avoid assertion in hmR0VmxLeave */
9138 int rc2 = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pDbgState->fProcCtlsInitial);
9139 AssertRCReturn(rc2, rc2);
9140 pVCpu->hm.s.vmx.u32ProcCtls = pDbgState->fProcCtlsInitial;
9141 }
9142
9143 /* We're currently the only ones messing with this one, so just restore the
9144 cached value and reload the field. */
9145 if ( pDbgState->fModifiedProcCtls2
9146 && pVCpu->hm.s.vmx.u32ProcCtls2 != pDbgState->fProcCtls2Initial)
9147 {
9148 int rc2 = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC2, pDbgState->fProcCtls2Initial);
9149 AssertRCReturn(rc2, rc2);
9150 pVCpu->hm.s.vmx.u32ProcCtls2 = pDbgState->fProcCtls2Initial;
9151 }
9152
9153 /* If we've modified the exception bitmap, we restore it and trigger
9154 reloading and partial recalculation the next time around. */
9155 if (pDbgState->fModifiedXcptBitmap)
9156 pVCpu->hm.s.vmx.u32XcptBitmap = pDbgState->bmXcptInitial;
9157
9158 return rcStrict;
9159}
9160
9161
9162/**
9163 * Configures VM-exit controls for current DBGF and DTrace settings.
9164 *
9165 * This updates @a pDbgState and the VMCS execution control fields to reflect
9166 * the necessary VM-exits demanded by DBGF and DTrace.
9167 *
9168 * @param pVCpu The cross context virtual CPU structure.
9169 * @param pDbgState The debug state.
9170 * @param pVmxTransient Pointer to the VMX transient structure. May update
9171 * fUpdateTscOffsettingAndPreemptTimer.
9172 */
9173static void hmR0VmxPreRunGuestDebugStateUpdate(PVMCPU pVCpu, PVMXRUNDBGSTATE pDbgState, PVMXTRANSIENT pVmxTransient)
9174{
9175 /*
9176 * Take down the dtrace serial number so we can spot changes.
9177 */
9178 pDbgState->uDtraceSettingsSeqNo = VBOXVMM_GET_SETTINGS_SEQ_NO();
9179 ASMCompilerBarrier();
9180
9181 /*
9182 * We'll rebuild most of the middle block of data members (holding the
9183 * current settings) as we go along here, so start by clearing it all.
9184 */
9185 pDbgState->bmXcptExtra = 0;
9186 pDbgState->fCpe1Extra = 0;
9187 pDbgState->fCpe1Unwanted = 0;
9188 pDbgState->fCpe2Extra = 0;
9189 for (unsigned i = 0; i < RT_ELEMENTS(pDbgState->bmExitsToCheck); i++)
9190 pDbgState->bmExitsToCheck[i] = 0;
9191
9192 /*
9193 * Software interrupts (INT XXh) - no idea how to trigger these...
9194 */
9195 PVM pVM = pVCpu->CTX_SUFF(pVM);
9196 if ( DBGF_IS_EVENT_ENABLED(pVM, DBGFEVENT_INTERRUPT_SOFTWARE)
9197 || VBOXVMM_INT_SOFTWARE_ENABLED())
9198 {
9199 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_XCPT_OR_NMI);
9200 }
9201
9202 /*
9203 * INT3 breakpoints - triggered by #BP exceptions.
9204 */
9205 if (pVM->dbgf.ro.cEnabledInt3Breakpoints > 0)
9206 pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_BP);
9207
9208 /*
9209 * Exception bitmap and XCPT events+probes.
9210 */
9211 for (int iXcpt = 0; iXcpt < (DBGFEVENT_XCPT_LAST - DBGFEVENT_XCPT_FIRST + 1); iXcpt++)
9212 if (DBGF_IS_EVENT_ENABLED(pVM, (DBGFEVENTTYPE)(DBGFEVENT_XCPT_FIRST + iXcpt)))
9213 pDbgState->bmXcptExtra |= RT_BIT_32(iXcpt);
9214
9215 if (VBOXVMM_XCPT_DE_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_DE);
9216 if (VBOXVMM_XCPT_DB_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_DB);
9217 if (VBOXVMM_XCPT_BP_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_BP);
9218 if (VBOXVMM_XCPT_OF_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_OF);
9219 if (VBOXVMM_XCPT_BR_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_BR);
9220 if (VBOXVMM_XCPT_UD_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_UD);
9221 if (VBOXVMM_XCPT_NM_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_NM);
9222 if (VBOXVMM_XCPT_DF_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_DF);
9223 if (VBOXVMM_XCPT_TS_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_TS);
9224 if (VBOXVMM_XCPT_NP_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_NP);
9225 if (VBOXVMM_XCPT_SS_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_SS);
9226 if (VBOXVMM_XCPT_GP_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_GP);
9227 if (VBOXVMM_XCPT_PF_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_PF);
9228 if (VBOXVMM_XCPT_MF_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_MF);
9229 if (VBOXVMM_XCPT_AC_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_AC);
9230 if (VBOXVMM_XCPT_XF_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_XF);
9231 if (VBOXVMM_XCPT_VE_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_VE);
9232 if (VBOXVMM_XCPT_SX_ENABLED()) pDbgState->bmXcptExtra |= RT_BIT_32(X86_XCPT_SX);
9233
9234 if (pDbgState->bmXcptExtra)
9235 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_XCPT_OR_NMI);
9236
9237 /*
9238 * Process events and probes for VM-exits, making sure we get the wanted VM-exits.
9239 *
9240 * Note! This is the reverse of what hmR0VmxHandleExitDtraceEvents does.
9241 * So, when adding/changing/removing please don't forget to update it.
9242 *
9243 * Some of the macros are picking up local variables to save horizontal space,
9244 * (being able to see it in a table is the lesser evil here).
9245 */
9246#define IS_EITHER_ENABLED(a_pVM, a_EventSubName) \
9247 ( DBGF_IS_EVENT_ENABLED(a_pVM, RT_CONCAT(DBGFEVENT_, a_EventSubName)) \
9248 || RT_CONCAT3(VBOXVMM_, a_EventSubName, _ENABLED)() )
9249#define SET_ONLY_XBM_IF_EITHER_EN(a_EventSubName, a_uExit) \
9250 if (IS_EITHER_ENABLED(pVM, a_EventSubName)) \
9251 { AssertCompile((unsigned)(a_uExit) < sizeof(pDbgState->bmExitsToCheck) * 8); \
9252 ASMBitSet((pDbgState)->bmExitsToCheck, a_uExit); \
9253 } else do { } while (0)
9254#define SET_CPE1_XBM_IF_EITHER_EN(a_EventSubName, a_uExit, a_fCtrlProcExec) \
9255 if (IS_EITHER_ENABLED(pVM, a_EventSubName)) \
9256 { \
9257 (pDbgState)->fCpe1Extra |= (a_fCtrlProcExec); \
9258 AssertCompile((unsigned)(a_uExit) < sizeof(pDbgState->bmExitsToCheck) * 8); \
9259 ASMBitSet((pDbgState)->bmExitsToCheck, a_uExit); \
9260 } else do { } while (0)
9261#define SET_CPEU_XBM_IF_EITHER_EN(a_EventSubName, a_uExit, a_fUnwantedCtrlProcExec) \
9262 if (IS_EITHER_ENABLED(pVM, a_EventSubName)) \
9263 { \
9264 (pDbgState)->fCpe1Unwanted |= (a_fUnwantedCtrlProcExec); \
9265 AssertCompile((unsigned)(a_uExit) < sizeof(pDbgState->bmExitsToCheck) * 8); \
9266 ASMBitSet((pDbgState)->bmExitsToCheck, a_uExit); \
9267 } else do { } while (0)
9268#define SET_CPE2_XBM_IF_EITHER_EN(a_EventSubName, a_uExit, a_fCtrlProcExec2) \
9269 if (IS_EITHER_ENABLED(pVM, a_EventSubName)) \
9270 { \
9271 (pDbgState)->fCpe2Extra |= (a_fCtrlProcExec2); \
9272 AssertCompile((unsigned)(a_uExit) < sizeof(pDbgState->bmExitsToCheck) * 8); \
9273 ASMBitSet((pDbgState)->bmExitsToCheck, a_uExit); \
9274 } else do { } while (0)
9275
9276 SET_ONLY_XBM_IF_EITHER_EN(EXIT_TASK_SWITCH, VMX_EXIT_TASK_SWITCH); /* unconditional */
9277 SET_ONLY_XBM_IF_EITHER_EN(EXIT_VMX_EPT_VIOLATION, VMX_EXIT_EPT_VIOLATION); /* unconditional */
9278 SET_ONLY_XBM_IF_EITHER_EN(EXIT_VMX_EPT_MISCONFIG, VMX_EXIT_EPT_MISCONFIG); /* unconditional (unless #VE) */
9279 SET_ONLY_XBM_IF_EITHER_EN(EXIT_VMX_VAPIC_ACCESS, VMX_EXIT_APIC_ACCESS); /* feature dependent, nothing to enable here */
9280 SET_ONLY_XBM_IF_EITHER_EN(EXIT_VMX_VAPIC_WRITE, VMX_EXIT_APIC_WRITE); /* feature dependent, nothing to enable here */
9281
9282 SET_ONLY_XBM_IF_EITHER_EN(INSTR_CPUID, VMX_EXIT_CPUID); /* unconditional */
9283 SET_ONLY_XBM_IF_EITHER_EN( EXIT_CPUID, VMX_EXIT_CPUID);
9284 SET_ONLY_XBM_IF_EITHER_EN(INSTR_GETSEC, VMX_EXIT_GETSEC); /* unconditional */
9285 SET_ONLY_XBM_IF_EITHER_EN( EXIT_GETSEC, VMX_EXIT_GETSEC);
9286 SET_CPE1_XBM_IF_EITHER_EN(INSTR_HALT, VMX_EXIT_HLT, VMX_PROC_CTLS_HLT_EXIT); /* paranoia */
9287 SET_ONLY_XBM_IF_EITHER_EN( EXIT_HALT, VMX_EXIT_HLT);
9288 SET_ONLY_XBM_IF_EITHER_EN(INSTR_INVD, VMX_EXIT_INVD); /* unconditional */
9289 SET_ONLY_XBM_IF_EITHER_EN( EXIT_INVD, VMX_EXIT_INVD);
9290 SET_CPE1_XBM_IF_EITHER_EN(INSTR_INVLPG, VMX_EXIT_INVLPG, VMX_PROC_CTLS_INVLPG_EXIT);
9291 SET_ONLY_XBM_IF_EITHER_EN( EXIT_INVLPG, VMX_EXIT_INVLPG);
9292 SET_CPE1_XBM_IF_EITHER_EN(INSTR_RDPMC, VMX_EXIT_RDPMC, VMX_PROC_CTLS_RDPMC_EXIT);
9293 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDPMC, VMX_EXIT_RDPMC);
9294 SET_CPE1_XBM_IF_EITHER_EN(INSTR_RDTSC, VMX_EXIT_RDTSC, VMX_PROC_CTLS_RDTSC_EXIT);
9295 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDTSC, VMX_EXIT_RDTSC);
9296 SET_ONLY_XBM_IF_EITHER_EN(INSTR_RSM, VMX_EXIT_RSM); /* unconditional */
9297 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RSM, VMX_EXIT_RSM);
9298 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMM_CALL, VMX_EXIT_VMCALL); /* unconditional */
9299 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMM_CALL, VMX_EXIT_VMCALL);
9300 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMCLEAR, VMX_EXIT_VMCLEAR); /* unconditional */
9301 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMCLEAR, VMX_EXIT_VMCLEAR);
9302 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMLAUNCH, VMX_EXIT_VMLAUNCH); /* unconditional */
9303 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMLAUNCH, VMX_EXIT_VMLAUNCH);
9304 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMPTRLD, VMX_EXIT_VMPTRLD); /* unconditional */
9305 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMPTRLD, VMX_EXIT_VMPTRLD);
9306 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMPTRST, VMX_EXIT_VMPTRST); /* unconditional */
9307 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMPTRST, VMX_EXIT_VMPTRST);
9308 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMREAD, VMX_EXIT_VMREAD); /* unconditional */
9309 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMREAD, VMX_EXIT_VMREAD);
9310 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMRESUME, VMX_EXIT_VMRESUME); /* unconditional */
9311 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMRESUME, VMX_EXIT_VMRESUME);
9312 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMWRITE, VMX_EXIT_VMWRITE); /* unconditional */
9313 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMWRITE, VMX_EXIT_VMWRITE);
9314 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMXOFF, VMX_EXIT_VMXOFF); /* unconditional */
9315 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMXOFF, VMX_EXIT_VMXOFF);
9316 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMXON, VMX_EXIT_VMXON); /* unconditional */
9317 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMXON, VMX_EXIT_VMXON);
9318
9319 if ( IS_EITHER_ENABLED(pVM, INSTR_CRX_READ)
9320 || IS_EITHER_ENABLED(pVM, INSTR_CRX_WRITE))
9321 {
9322 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_CR4 | CPUMCTX_EXTRN_APIC_TPR);
9323 AssertRC(rc);
9324
9325#if 0 /** @todo fix me */
9326 pDbgState->fClearCr0Mask = true;
9327 pDbgState->fClearCr4Mask = true;
9328#endif
9329 if (IS_EITHER_ENABLED(pVM, INSTR_CRX_READ))
9330 pDbgState->fCpe1Extra |= VMX_PROC_CTLS_CR3_STORE_EXIT | VMX_PROC_CTLS_CR8_STORE_EXIT;
9331 if (IS_EITHER_ENABLED(pVM, INSTR_CRX_WRITE))
9332 pDbgState->fCpe1Extra |= VMX_PROC_CTLS_CR3_LOAD_EXIT | VMX_PROC_CTLS_CR8_LOAD_EXIT;
9333 pDbgState->fCpe1Unwanted |= VMX_PROC_CTLS_USE_TPR_SHADOW; /* risky? */
9334 /* Note! We currently don't use VMX_VMCS32_CTRL_CR3_TARGET_COUNT. It would
9335 require clearing here and in the loop if we start using it. */
9336 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_MOV_CRX);
9337 }
9338 else
9339 {
9340 if (pDbgState->fClearCr0Mask)
9341 {
9342 pDbgState->fClearCr0Mask = false;
9343 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_CR0);
9344 }
9345 if (pDbgState->fClearCr4Mask)
9346 {
9347 pDbgState->fClearCr4Mask = false;
9348 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_CR4);
9349 }
9350 }
9351 SET_ONLY_XBM_IF_EITHER_EN( EXIT_CRX_READ, VMX_EXIT_MOV_CRX);
9352 SET_ONLY_XBM_IF_EITHER_EN( EXIT_CRX_WRITE, VMX_EXIT_MOV_CRX);
9353
9354 if ( IS_EITHER_ENABLED(pVM, INSTR_DRX_READ)
9355 || IS_EITHER_ENABLED(pVM, INSTR_DRX_WRITE))
9356 {
9357 /** @todo later, need to fix handler as it assumes this won't usually happen. */
9358 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_MOV_DRX);
9359 }
9360 SET_ONLY_XBM_IF_EITHER_EN( EXIT_DRX_READ, VMX_EXIT_MOV_DRX);
9361 SET_ONLY_XBM_IF_EITHER_EN( EXIT_DRX_WRITE, VMX_EXIT_MOV_DRX);
9362
9363 SET_CPEU_XBM_IF_EITHER_EN(INSTR_RDMSR, VMX_EXIT_RDMSR, VMX_PROC_CTLS_USE_MSR_BITMAPS); /* risky clearing this? */
9364 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDMSR, VMX_EXIT_RDMSR);
9365 SET_CPEU_XBM_IF_EITHER_EN(INSTR_WRMSR, VMX_EXIT_WRMSR, VMX_PROC_CTLS_USE_MSR_BITMAPS);
9366 SET_ONLY_XBM_IF_EITHER_EN( EXIT_WRMSR, VMX_EXIT_WRMSR);
9367 SET_CPE1_XBM_IF_EITHER_EN(INSTR_MWAIT, VMX_EXIT_MWAIT, VMX_PROC_CTLS_MWAIT_EXIT); /* paranoia */
9368 SET_ONLY_XBM_IF_EITHER_EN( EXIT_MWAIT, VMX_EXIT_MWAIT);
9369 SET_CPE1_XBM_IF_EITHER_EN(INSTR_MONITOR, VMX_EXIT_MONITOR, VMX_PROC_CTLS_MONITOR_EXIT); /* paranoia */
9370 SET_ONLY_XBM_IF_EITHER_EN( EXIT_MONITOR, VMX_EXIT_MONITOR);
9371#if 0 /** @todo too slow, fix handler. */
9372 SET_CPE1_XBM_IF_EITHER_EN(INSTR_PAUSE, VMX_EXIT_PAUSE, VMX_PROC_CTLS_PAUSE_EXIT);
9373#endif
9374 SET_ONLY_XBM_IF_EITHER_EN( EXIT_PAUSE, VMX_EXIT_PAUSE);
9375
9376 if ( IS_EITHER_ENABLED(pVM, INSTR_SGDT)
9377 || IS_EITHER_ENABLED(pVM, INSTR_SIDT)
9378 || IS_EITHER_ENABLED(pVM, INSTR_LGDT)
9379 || IS_EITHER_ENABLED(pVM, INSTR_LIDT))
9380 {
9381 pDbgState->fCpe2Extra |= VMX_PROC_CTLS2_DESC_TABLE_EXIT;
9382 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_GDTR_IDTR_ACCESS);
9383 }
9384 SET_ONLY_XBM_IF_EITHER_EN( EXIT_SGDT, VMX_EXIT_GDTR_IDTR_ACCESS);
9385 SET_ONLY_XBM_IF_EITHER_EN( EXIT_SIDT, VMX_EXIT_GDTR_IDTR_ACCESS);
9386 SET_ONLY_XBM_IF_EITHER_EN( EXIT_LGDT, VMX_EXIT_GDTR_IDTR_ACCESS);
9387 SET_ONLY_XBM_IF_EITHER_EN( EXIT_LIDT, VMX_EXIT_GDTR_IDTR_ACCESS);
9388
9389 if ( IS_EITHER_ENABLED(pVM, INSTR_SLDT)
9390 || IS_EITHER_ENABLED(pVM, INSTR_STR)
9391 || IS_EITHER_ENABLED(pVM, INSTR_LLDT)
9392 || IS_EITHER_ENABLED(pVM, INSTR_LTR))
9393 {
9394 pDbgState->fCpe2Extra |= VMX_PROC_CTLS2_DESC_TABLE_EXIT;
9395 ASMBitSet(pDbgState->bmExitsToCheck, VMX_EXIT_LDTR_TR_ACCESS);
9396 }
9397 SET_ONLY_XBM_IF_EITHER_EN( EXIT_SLDT, VMX_EXIT_LDTR_TR_ACCESS);
9398 SET_ONLY_XBM_IF_EITHER_EN( EXIT_STR, VMX_EXIT_LDTR_TR_ACCESS);
9399 SET_ONLY_XBM_IF_EITHER_EN( EXIT_LLDT, VMX_EXIT_LDTR_TR_ACCESS);
9400 SET_ONLY_XBM_IF_EITHER_EN( EXIT_LTR, VMX_EXIT_LDTR_TR_ACCESS);
9401
9402 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_INVEPT, VMX_EXIT_INVEPT); /* unconditional */
9403 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_INVEPT, VMX_EXIT_INVEPT);
9404 SET_CPE1_XBM_IF_EITHER_EN(INSTR_RDTSCP, VMX_EXIT_RDTSCP, VMX_PROC_CTLS_RDTSC_EXIT);
9405 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDTSCP, VMX_EXIT_RDTSCP);
9406 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_INVVPID, VMX_EXIT_INVVPID); /* unconditional */
9407 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_INVVPID, VMX_EXIT_INVVPID);
9408 SET_CPE2_XBM_IF_EITHER_EN(INSTR_WBINVD, VMX_EXIT_WBINVD, VMX_PROC_CTLS2_WBINVD_EXIT);
9409 SET_ONLY_XBM_IF_EITHER_EN( EXIT_WBINVD, VMX_EXIT_WBINVD);
9410 SET_ONLY_XBM_IF_EITHER_EN(INSTR_XSETBV, VMX_EXIT_XSETBV); /* unconditional */
9411 SET_ONLY_XBM_IF_EITHER_EN( EXIT_XSETBV, VMX_EXIT_XSETBV);
9412 SET_CPE2_XBM_IF_EITHER_EN(INSTR_RDRAND, VMX_EXIT_RDRAND, VMX_PROC_CTLS2_RDRAND_EXIT);
9413 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDRAND, VMX_EXIT_RDRAND);
9414 SET_CPE1_XBM_IF_EITHER_EN(INSTR_VMX_INVPCID, VMX_EXIT_INVPCID, VMX_PROC_CTLS_INVLPG_EXIT);
9415 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_INVPCID, VMX_EXIT_INVPCID);
9416 SET_ONLY_XBM_IF_EITHER_EN(INSTR_VMX_VMFUNC, VMX_EXIT_VMFUNC); /* unconditional for the current setup */
9417 SET_ONLY_XBM_IF_EITHER_EN( EXIT_VMX_VMFUNC, VMX_EXIT_VMFUNC);
9418 SET_CPE2_XBM_IF_EITHER_EN(INSTR_RDSEED, VMX_EXIT_RDSEED, VMX_PROC_CTLS2_RDSEED_EXIT);
9419 SET_ONLY_XBM_IF_EITHER_EN( EXIT_RDSEED, VMX_EXIT_RDSEED);
9420 SET_ONLY_XBM_IF_EITHER_EN(INSTR_XSAVES, VMX_EXIT_XSAVES); /* unconditional (enabled by host, guest cfg) */
9421 SET_ONLY_XBM_IF_EITHER_EN(EXIT_XSAVES, VMX_EXIT_XSAVES);
9422 SET_ONLY_XBM_IF_EITHER_EN(INSTR_XRSTORS, VMX_EXIT_XRSTORS); /* unconditional (enabled by host, guest cfg) */
9423 SET_ONLY_XBM_IF_EITHER_EN( EXIT_XRSTORS, VMX_EXIT_XRSTORS);
9424
9425#undef IS_EITHER_ENABLED
9426#undef SET_ONLY_XBM_IF_EITHER_EN
9427#undef SET_CPE1_XBM_IF_EITHER_EN
9428#undef SET_CPEU_XBM_IF_EITHER_EN
9429#undef SET_CPE2_XBM_IF_EITHER_EN
9430
9431 /*
9432 * Sanitize the control stuff.
9433 */
9434 pDbgState->fCpe2Extra &= pVM->hm.s.vmx.Msrs.ProcCtls2.n.allowed1;
9435 if (pDbgState->fCpe2Extra)
9436 pDbgState->fCpe1Extra |= VMX_PROC_CTLS_USE_SECONDARY_CTLS;
9437 pDbgState->fCpe1Extra &= pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed1;
9438 pDbgState->fCpe1Unwanted &= ~pVM->hm.s.vmx.Msrs.ProcCtls.n.allowed0;
9439 if (pVCpu->hm.s.fDebugWantRdTscExit != RT_BOOL(pDbgState->fCpe1Extra & VMX_PROC_CTLS_RDTSC_EXIT))
9440 {
9441 pVCpu->hm.s.fDebugWantRdTscExit ^= true;
9442 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = true;
9443 }
9444
9445 Log6(("HM: debug state: cpe1=%#RX32 cpeu=%#RX32 cpe2=%#RX32%s%s\n",
9446 pDbgState->fCpe1Extra, pDbgState->fCpe1Unwanted, pDbgState->fCpe2Extra,
9447 pDbgState->fClearCr0Mask ? " clr-cr0" : "",
9448 pDbgState->fClearCr4Mask ? " clr-cr4" : ""));
9449}
9450
9451
9452/**
9453 * Fires off DBGF events and dtrace probes for a VM-exit, when it's
9454 * appropriate.
9455 *
9456 * The caller has checked the VM-exit against the
9457 * VMXRUNDBGSTATE::bmExitsToCheck bitmap. The caller has checked for NMIs
9458 * already, so we don't have to do that either.
9459 *
9460 * @returns Strict VBox status code (i.e. informational status codes too).
9461 * @param pVCpu The cross context virtual CPU structure.
9462 * @param pVmxTransient Pointer to the VMX-transient structure.
9463 * @param uExitReason The VM-exit reason.
9464 *
9465 * @remarks The name of this function is displayed by dtrace, so keep it short
9466 * and to the point. No longer than 33 chars long, please.
9467 */
9468static VBOXSTRICTRC hmR0VmxHandleExitDtraceEvents(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, uint32_t uExitReason)
9469{
9470 /*
9471 * Translate the event into a DBGF event (enmEvent + uEventArg) and at the
9472 * same time check whether any corresponding Dtrace event is enabled (fDtrace).
9473 *
9474 * Note! This is the reverse operation of what hmR0VmxPreRunGuestDebugStateUpdate
9475 * does. Must add/change/remove both places. Same ordering, please.
9476 *
9477 * Added/removed events must also be reflected in the next section
9478 * where we dispatch dtrace events.
9479 */
9480 bool fDtrace1 = false;
9481 bool fDtrace2 = false;
9482 DBGFEVENTTYPE enmEvent1 = DBGFEVENT_END;
9483 DBGFEVENTTYPE enmEvent2 = DBGFEVENT_END;
9484 uint32_t uEventArg = 0;
9485#define SET_EXIT(a_EventSubName) \
9486 do { \
9487 enmEvent2 = RT_CONCAT(DBGFEVENT_EXIT_, a_EventSubName); \
9488 fDtrace2 = RT_CONCAT3(VBOXVMM_EXIT_, a_EventSubName, _ENABLED)(); \
9489 } while (0)
9490#define SET_BOTH(a_EventSubName) \
9491 do { \
9492 enmEvent1 = RT_CONCAT(DBGFEVENT_INSTR_, a_EventSubName); \
9493 enmEvent2 = RT_CONCAT(DBGFEVENT_EXIT_, a_EventSubName); \
9494 fDtrace1 = RT_CONCAT3(VBOXVMM_INSTR_, a_EventSubName, _ENABLED)(); \
9495 fDtrace2 = RT_CONCAT3(VBOXVMM_EXIT_, a_EventSubName, _ENABLED)(); \
9496 } while (0)
9497 switch (uExitReason)
9498 {
9499 case VMX_EXIT_MTF:
9500 return hmR0VmxExitMtf(pVCpu, pVmxTransient);
9501
9502 case VMX_EXIT_XCPT_OR_NMI:
9503 {
9504 uint8_t const idxVector = VMX_EXIT_INT_INFO_VECTOR(pVmxTransient->uExitIntInfo);
9505 switch (VMX_EXIT_INT_INFO_TYPE(pVmxTransient->uExitIntInfo))
9506 {
9507 case VMX_EXIT_INT_INFO_TYPE_HW_XCPT:
9508 case VMX_EXIT_INT_INFO_TYPE_SW_XCPT:
9509 case VMX_EXIT_INT_INFO_TYPE_PRIV_SW_XCPT:
9510 if (idxVector <= (unsigned)(DBGFEVENT_XCPT_LAST - DBGFEVENT_XCPT_FIRST))
9511 {
9512 if (VMX_EXIT_INT_INFO_IS_ERROR_CODE_VALID(pVmxTransient->uExitIntInfo))
9513 {
9514 hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
9515 uEventArg = pVmxTransient->uExitIntErrorCode;
9516 }
9517 enmEvent1 = (DBGFEVENTTYPE)(DBGFEVENT_XCPT_FIRST + idxVector);
9518 switch (enmEvent1)
9519 {
9520 case DBGFEVENT_XCPT_DE: fDtrace1 = VBOXVMM_XCPT_DE_ENABLED(); break;
9521 case DBGFEVENT_XCPT_DB: fDtrace1 = VBOXVMM_XCPT_DB_ENABLED(); break;
9522 case DBGFEVENT_XCPT_BP: fDtrace1 = VBOXVMM_XCPT_BP_ENABLED(); break;
9523 case DBGFEVENT_XCPT_OF: fDtrace1 = VBOXVMM_XCPT_OF_ENABLED(); break;
9524 case DBGFEVENT_XCPT_BR: fDtrace1 = VBOXVMM_XCPT_BR_ENABLED(); break;
9525 case DBGFEVENT_XCPT_UD: fDtrace1 = VBOXVMM_XCPT_UD_ENABLED(); break;
9526 case DBGFEVENT_XCPT_NM: fDtrace1 = VBOXVMM_XCPT_NM_ENABLED(); break;
9527 case DBGFEVENT_XCPT_DF: fDtrace1 = VBOXVMM_XCPT_DF_ENABLED(); break;
9528 case DBGFEVENT_XCPT_TS: fDtrace1 = VBOXVMM_XCPT_TS_ENABLED(); break;
9529 case DBGFEVENT_XCPT_NP: fDtrace1 = VBOXVMM_XCPT_NP_ENABLED(); break;
9530 case DBGFEVENT_XCPT_SS: fDtrace1 = VBOXVMM_XCPT_SS_ENABLED(); break;
9531 case DBGFEVENT_XCPT_GP: fDtrace1 = VBOXVMM_XCPT_GP_ENABLED(); break;
9532 case DBGFEVENT_XCPT_PF: fDtrace1 = VBOXVMM_XCPT_PF_ENABLED(); break;
9533 case DBGFEVENT_XCPT_MF: fDtrace1 = VBOXVMM_XCPT_MF_ENABLED(); break;
9534 case DBGFEVENT_XCPT_AC: fDtrace1 = VBOXVMM_XCPT_AC_ENABLED(); break;
9535 case DBGFEVENT_XCPT_XF: fDtrace1 = VBOXVMM_XCPT_XF_ENABLED(); break;
9536 case DBGFEVENT_XCPT_VE: fDtrace1 = VBOXVMM_XCPT_VE_ENABLED(); break;
9537 case DBGFEVENT_XCPT_SX: fDtrace1 = VBOXVMM_XCPT_SX_ENABLED(); break;
9538 default: break;
9539 }
9540 }
9541 else
9542 AssertFailed();
9543 break;
9544
9545 case VMX_EXIT_INT_INFO_TYPE_SW_INT:
9546 uEventArg = idxVector;
9547 enmEvent1 = DBGFEVENT_INTERRUPT_SOFTWARE;
9548 fDtrace1 = VBOXVMM_INT_SOFTWARE_ENABLED();
9549 break;
9550 }
9551 break;
9552 }
9553
9554 case VMX_EXIT_TRIPLE_FAULT:
9555 enmEvent1 = DBGFEVENT_TRIPLE_FAULT;
9556 //fDtrace1 = VBOXVMM_EXIT_TRIPLE_FAULT_ENABLED();
9557 break;
9558 case VMX_EXIT_TASK_SWITCH: SET_EXIT(TASK_SWITCH); break;
9559 case VMX_EXIT_EPT_VIOLATION: SET_EXIT(VMX_EPT_VIOLATION); break;
9560 case VMX_EXIT_EPT_MISCONFIG: SET_EXIT(VMX_EPT_MISCONFIG); break;
9561 case VMX_EXIT_APIC_ACCESS: SET_EXIT(VMX_VAPIC_ACCESS); break;
9562 case VMX_EXIT_APIC_WRITE: SET_EXIT(VMX_VAPIC_WRITE); break;
9563
9564 /* Instruction specific VM-exits: */
9565 case VMX_EXIT_CPUID: SET_BOTH(CPUID); break;
9566 case VMX_EXIT_GETSEC: SET_BOTH(GETSEC); break;
9567 case VMX_EXIT_HLT: SET_BOTH(HALT); break;
9568 case VMX_EXIT_INVD: SET_BOTH(INVD); break;
9569 case VMX_EXIT_INVLPG: SET_BOTH(INVLPG); break;
9570 case VMX_EXIT_RDPMC: SET_BOTH(RDPMC); break;
9571 case VMX_EXIT_RDTSC: SET_BOTH(RDTSC); break;
9572 case VMX_EXIT_RSM: SET_BOTH(RSM); break;
9573 case VMX_EXIT_VMCALL: SET_BOTH(VMM_CALL); break;
9574 case VMX_EXIT_VMCLEAR: SET_BOTH(VMX_VMCLEAR); break;
9575 case VMX_EXIT_VMLAUNCH: SET_BOTH(VMX_VMLAUNCH); break;
9576 case VMX_EXIT_VMPTRLD: SET_BOTH(VMX_VMPTRLD); break;
9577 case VMX_EXIT_VMPTRST: SET_BOTH(VMX_VMPTRST); break;
9578 case VMX_EXIT_VMREAD: SET_BOTH(VMX_VMREAD); break;
9579 case VMX_EXIT_VMRESUME: SET_BOTH(VMX_VMRESUME); break;
9580 case VMX_EXIT_VMWRITE: SET_BOTH(VMX_VMWRITE); break;
9581 case VMX_EXIT_VMXOFF: SET_BOTH(VMX_VMXOFF); break;
9582 case VMX_EXIT_VMXON: SET_BOTH(VMX_VMXON); break;
9583 case VMX_EXIT_MOV_CRX:
9584 hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
9585 if (VMX_EXIT_QUAL_CRX_ACCESS(pVmxTransient->uExitQual) == VMX_EXIT_QUAL_CRX_ACCESS_READ)
9586 SET_BOTH(CRX_READ);
9587 else
9588 SET_BOTH(CRX_WRITE);
9589 uEventArg = VMX_EXIT_QUAL_CRX_REGISTER(pVmxTransient->uExitQual);
9590 break;
9591 case VMX_EXIT_MOV_DRX:
9592 hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
9593 if ( VMX_EXIT_QUAL_DRX_DIRECTION(pVmxTransient->uExitQual)
9594 == VMX_EXIT_QUAL_DRX_DIRECTION_READ)
9595 SET_BOTH(DRX_READ);
9596 else
9597 SET_BOTH(DRX_WRITE);
9598 uEventArg = VMX_EXIT_QUAL_DRX_REGISTER(pVmxTransient->uExitQual);
9599 break;
9600 case VMX_EXIT_RDMSR: SET_BOTH(RDMSR); break;
9601 case VMX_EXIT_WRMSR: SET_BOTH(WRMSR); break;
9602 case VMX_EXIT_MWAIT: SET_BOTH(MWAIT); break;
9603 case VMX_EXIT_MONITOR: SET_BOTH(MONITOR); break;
9604 case VMX_EXIT_PAUSE: SET_BOTH(PAUSE); break;
9605 case VMX_EXIT_GDTR_IDTR_ACCESS:
9606 hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
9607 switch (RT_BF_GET(pVmxTransient->ExitInstrInfo.u, VMX_BF_XDTR_INSINFO_INSTR_ID))
9608 {
9609 case VMX_XDTR_INSINFO_II_SGDT: SET_BOTH(SGDT); break;
9610 case VMX_XDTR_INSINFO_II_SIDT: SET_BOTH(SIDT); break;
9611 case VMX_XDTR_INSINFO_II_LGDT: SET_BOTH(LGDT); break;
9612 case VMX_XDTR_INSINFO_II_LIDT: SET_BOTH(LIDT); break;
9613 }
9614 break;
9615
9616 case VMX_EXIT_LDTR_TR_ACCESS:
9617 hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
9618 switch (RT_BF_GET(pVmxTransient->ExitInstrInfo.u, VMX_BF_YYTR_INSINFO_INSTR_ID))
9619 {
9620 case VMX_YYTR_INSINFO_II_SLDT: SET_BOTH(SLDT); break;
9621 case VMX_YYTR_INSINFO_II_STR: SET_BOTH(STR); break;
9622 case VMX_YYTR_INSINFO_II_LLDT: SET_BOTH(LLDT); break;
9623 case VMX_YYTR_INSINFO_II_LTR: SET_BOTH(LTR); break;
9624 }
9625 break;
9626
9627 case VMX_EXIT_INVEPT: SET_BOTH(VMX_INVEPT); break;
9628 case VMX_EXIT_RDTSCP: SET_BOTH(RDTSCP); break;
9629 case VMX_EXIT_INVVPID: SET_BOTH(VMX_INVVPID); break;
9630 case VMX_EXIT_WBINVD: SET_BOTH(WBINVD); break;
9631 case VMX_EXIT_XSETBV: SET_BOTH(XSETBV); break;
9632 case VMX_EXIT_RDRAND: SET_BOTH(RDRAND); break;
9633 case VMX_EXIT_INVPCID: SET_BOTH(VMX_INVPCID); break;
9634 case VMX_EXIT_VMFUNC: SET_BOTH(VMX_VMFUNC); break;
9635 case VMX_EXIT_RDSEED: SET_BOTH(RDSEED); break;
9636 case VMX_EXIT_XSAVES: SET_BOTH(XSAVES); break;
9637 case VMX_EXIT_XRSTORS: SET_BOTH(XRSTORS); break;
9638
9639 /* Events that aren't relevant at this point. */
9640 case VMX_EXIT_EXT_INT:
9641 case VMX_EXIT_INT_WINDOW:
9642 case VMX_EXIT_NMI_WINDOW:
9643 case VMX_EXIT_TPR_BELOW_THRESHOLD:
9644 case VMX_EXIT_PREEMPT_TIMER:
9645 case VMX_EXIT_IO_INSTR:
9646 break;
9647
9648 /* Errors and unexpected events. */
9649 case VMX_EXIT_INIT_SIGNAL:
9650 case VMX_EXIT_SIPI:
9651 case VMX_EXIT_IO_SMI:
9652 case VMX_EXIT_SMI:
9653 case VMX_EXIT_ERR_INVALID_GUEST_STATE:
9654 case VMX_EXIT_ERR_MSR_LOAD:
9655 case VMX_EXIT_ERR_MACHINE_CHECK:
9656 break;
9657
9658 default:
9659 AssertMsgFailed(("Unexpected VM-exit=%#x\n", uExitReason));
9660 break;
9661 }
9662#undef SET_BOTH
9663#undef SET_EXIT
9664
9665 /*
9666 * Dtrace tracepoints go first. We do them here at once so we don't
9667 * have to copy the guest state saving and stuff a few dozen times.
9668 * Down side is that we've got to repeat the switch, though this time
9669 * we use enmEvent since the probes are a subset of what DBGF does.
9670 */
9671 if (fDtrace1 || fDtrace2)
9672 {
9673 hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
9674 hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
9675 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
9676 switch (enmEvent1)
9677 {
9678 /** @todo consider which extra parameters would be helpful for each probe. */
9679 case DBGFEVENT_END: break;
9680 case DBGFEVENT_XCPT_DE: VBOXVMM_XCPT_DE(pVCpu, pCtx); break;
9681 case DBGFEVENT_XCPT_DB: VBOXVMM_XCPT_DB(pVCpu, pCtx, pCtx->dr[6]); break;
9682 case DBGFEVENT_XCPT_BP: VBOXVMM_XCPT_BP(pVCpu, pCtx); break;
9683 case DBGFEVENT_XCPT_OF: VBOXVMM_XCPT_OF(pVCpu, pCtx); break;
9684 case DBGFEVENT_XCPT_BR: VBOXVMM_XCPT_BR(pVCpu, pCtx); break;
9685 case DBGFEVENT_XCPT_UD: VBOXVMM_XCPT_UD(pVCpu, pCtx); break;
9686 case DBGFEVENT_XCPT_NM: VBOXVMM_XCPT_NM(pVCpu, pCtx); break;
9687 case DBGFEVENT_XCPT_DF: VBOXVMM_XCPT_DF(pVCpu, pCtx); break;
9688 case DBGFEVENT_XCPT_TS: VBOXVMM_XCPT_TS(pVCpu, pCtx, uEventArg); break;
9689 case DBGFEVENT_XCPT_NP: VBOXVMM_XCPT_NP(pVCpu, pCtx, uEventArg); break;
9690 case DBGFEVENT_XCPT_SS: VBOXVMM_XCPT_SS(pVCpu, pCtx, uEventArg); break;
9691 case DBGFEVENT_XCPT_GP: VBOXVMM_XCPT_GP(pVCpu, pCtx, uEventArg); break;
9692 case DBGFEVENT_XCPT_PF: VBOXVMM_XCPT_PF(pVCpu, pCtx, uEventArg, pCtx->cr2); break;
9693 case DBGFEVENT_XCPT_MF: VBOXVMM_XCPT_MF(pVCpu, pCtx); break;
9694 case DBGFEVENT_XCPT_AC: VBOXVMM_XCPT_AC(pVCpu, pCtx); break;
9695 case DBGFEVENT_XCPT_XF: VBOXVMM_XCPT_XF(pVCpu, pCtx); break;
9696 case DBGFEVENT_XCPT_VE: VBOXVMM_XCPT_VE(pVCpu, pCtx); break;
9697 case DBGFEVENT_XCPT_SX: VBOXVMM_XCPT_SX(pVCpu, pCtx, uEventArg); break;
9698 case DBGFEVENT_INTERRUPT_SOFTWARE: VBOXVMM_INT_SOFTWARE(pVCpu, pCtx, (uint8_t)uEventArg); break;
9699 case DBGFEVENT_INSTR_CPUID: VBOXVMM_INSTR_CPUID(pVCpu, pCtx, pCtx->eax, pCtx->ecx); break;
9700 case DBGFEVENT_INSTR_GETSEC: VBOXVMM_INSTR_GETSEC(pVCpu, pCtx); break;
9701 case DBGFEVENT_INSTR_HALT: VBOXVMM_INSTR_HALT(pVCpu, pCtx); break;
9702 case DBGFEVENT_INSTR_INVD: VBOXVMM_INSTR_INVD(pVCpu, pCtx); break;
9703 case DBGFEVENT_INSTR_INVLPG: VBOXVMM_INSTR_INVLPG(pVCpu, pCtx); break;
9704 case DBGFEVENT_INSTR_RDPMC: VBOXVMM_INSTR_RDPMC(pVCpu, pCtx); break;
9705 case DBGFEVENT_INSTR_RDTSC: VBOXVMM_INSTR_RDTSC(pVCpu, pCtx); break;
9706 case DBGFEVENT_INSTR_RSM: VBOXVMM_INSTR_RSM(pVCpu, pCtx); break;
9707 case DBGFEVENT_INSTR_CRX_READ: VBOXVMM_INSTR_CRX_READ(pVCpu, pCtx, (uint8_t)uEventArg); break;
9708 case DBGFEVENT_INSTR_CRX_WRITE: VBOXVMM_INSTR_CRX_WRITE(pVCpu, pCtx, (uint8_t)uEventArg); break;
9709 case DBGFEVENT_INSTR_DRX_READ: VBOXVMM_INSTR_DRX_READ(pVCpu, pCtx, (uint8_t)uEventArg); break;
9710 case DBGFEVENT_INSTR_DRX_WRITE: VBOXVMM_INSTR_DRX_WRITE(pVCpu, pCtx, (uint8_t)uEventArg); break;
9711 case DBGFEVENT_INSTR_RDMSR: VBOXVMM_INSTR_RDMSR(pVCpu, pCtx, pCtx->ecx); break;
9712 case DBGFEVENT_INSTR_WRMSR: VBOXVMM_INSTR_WRMSR(pVCpu, pCtx, pCtx->ecx,
9713 RT_MAKE_U64(pCtx->eax, pCtx->edx)); break;
9714 case DBGFEVENT_INSTR_MWAIT: VBOXVMM_INSTR_MWAIT(pVCpu, pCtx); break;
9715 case DBGFEVENT_INSTR_MONITOR: VBOXVMM_INSTR_MONITOR(pVCpu, pCtx); break;
9716 case DBGFEVENT_INSTR_PAUSE: VBOXVMM_INSTR_PAUSE(pVCpu, pCtx); break;
9717 case DBGFEVENT_INSTR_SGDT: VBOXVMM_INSTR_SGDT(pVCpu, pCtx); break;
9718 case DBGFEVENT_INSTR_SIDT: VBOXVMM_INSTR_SIDT(pVCpu, pCtx); break;
9719 case DBGFEVENT_INSTR_LGDT: VBOXVMM_INSTR_LGDT(pVCpu, pCtx); break;
9720 case DBGFEVENT_INSTR_LIDT: VBOXVMM_INSTR_LIDT(pVCpu, pCtx); break;
9721 case DBGFEVENT_INSTR_SLDT: VBOXVMM_INSTR_SLDT(pVCpu, pCtx); break;
9722 case DBGFEVENT_INSTR_STR: VBOXVMM_INSTR_STR(pVCpu, pCtx); break;
9723 case DBGFEVENT_INSTR_LLDT: VBOXVMM_INSTR_LLDT(pVCpu, pCtx); break;
9724 case DBGFEVENT_INSTR_LTR: VBOXVMM_INSTR_LTR(pVCpu, pCtx); break;
9725 case DBGFEVENT_INSTR_RDTSCP: VBOXVMM_INSTR_RDTSCP(pVCpu, pCtx); break;
9726 case DBGFEVENT_INSTR_WBINVD: VBOXVMM_INSTR_WBINVD(pVCpu, pCtx); break;
9727 case DBGFEVENT_INSTR_XSETBV: VBOXVMM_INSTR_XSETBV(pVCpu, pCtx); break;
9728 case DBGFEVENT_INSTR_RDRAND: VBOXVMM_INSTR_RDRAND(pVCpu, pCtx); break;
9729 case DBGFEVENT_INSTR_RDSEED: VBOXVMM_INSTR_RDSEED(pVCpu, pCtx); break;
9730 case DBGFEVENT_INSTR_XSAVES: VBOXVMM_INSTR_XSAVES(pVCpu, pCtx); break;
9731 case DBGFEVENT_INSTR_XRSTORS: VBOXVMM_INSTR_XRSTORS(pVCpu, pCtx); break;
9732 case DBGFEVENT_INSTR_VMM_CALL: VBOXVMM_INSTR_VMM_CALL(pVCpu, pCtx); break;
9733 case DBGFEVENT_INSTR_VMX_VMCLEAR: VBOXVMM_INSTR_VMX_VMCLEAR(pVCpu, pCtx); break;
9734 case DBGFEVENT_INSTR_VMX_VMLAUNCH: VBOXVMM_INSTR_VMX_VMLAUNCH(pVCpu, pCtx); break;
9735 case DBGFEVENT_INSTR_VMX_VMPTRLD: VBOXVMM_INSTR_VMX_VMPTRLD(pVCpu, pCtx); break;
9736 case DBGFEVENT_INSTR_VMX_VMPTRST: VBOXVMM_INSTR_VMX_VMPTRST(pVCpu, pCtx); break;
9737 case DBGFEVENT_INSTR_VMX_VMREAD: VBOXVMM_INSTR_VMX_VMREAD(pVCpu, pCtx); break;
9738 case DBGFEVENT_INSTR_VMX_VMRESUME: VBOXVMM_INSTR_VMX_VMRESUME(pVCpu, pCtx); break;
9739 case DBGFEVENT_INSTR_VMX_VMWRITE: VBOXVMM_INSTR_VMX_VMWRITE(pVCpu, pCtx); break;
9740 case DBGFEVENT_INSTR_VMX_VMXOFF: VBOXVMM_INSTR_VMX_VMXOFF(pVCpu, pCtx); break;
9741 case DBGFEVENT_INSTR_VMX_VMXON: VBOXVMM_INSTR_VMX_VMXON(pVCpu, pCtx); break;
9742 case DBGFEVENT_INSTR_VMX_INVEPT: VBOXVMM_INSTR_VMX_INVEPT(pVCpu, pCtx); break;
9743 case DBGFEVENT_INSTR_VMX_INVVPID: VBOXVMM_INSTR_VMX_INVVPID(pVCpu, pCtx); break;
9744 case DBGFEVENT_INSTR_VMX_INVPCID: VBOXVMM_INSTR_VMX_INVPCID(pVCpu, pCtx); break;
9745 case DBGFEVENT_INSTR_VMX_VMFUNC: VBOXVMM_INSTR_VMX_VMFUNC(pVCpu, pCtx); break;
9746 default: AssertMsgFailed(("enmEvent1=%d uExitReason=%d\n", enmEvent1, uExitReason)); break;
9747 }
9748 switch (enmEvent2)
9749 {
9750 /** @todo consider which extra parameters would be helpful for each probe. */
9751 case DBGFEVENT_END: break;
9752 case DBGFEVENT_EXIT_TASK_SWITCH: VBOXVMM_EXIT_TASK_SWITCH(pVCpu, pCtx); break;
9753 case DBGFEVENT_EXIT_CPUID: VBOXVMM_EXIT_CPUID(pVCpu, pCtx, pCtx->eax, pCtx->ecx); break;
9754 case DBGFEVENT_EXIT_GETSEC: VBOXVMM_EXIT_GETSEC(pVCpu, pCtx); break;
9755 case DBGFEVENT_EXIT_HALT: VBOXVMM_EXIT_HALT(pVCpu, pCtx); break;
9756 case DBGFEVENT_EXIT_INVD: VBOXVMM_EXIT_INVD(pVCpu, pCtx); break;
9757 case DBGFEVENT_EXIT_INVLPG: VBOXVMM_EXIT_INVLPG(pVCpu, pCtx); break;
9758 case DBGFEVENT_EXIT_RDPMC: VBOXVMM_EXIT_RDPMC(pVCpu, pCtx); break;
9759 case DBGFEVENT_EXIT_RDTSC: VBOXVMM_EXIT_RDTSC(pVCpu, pCtx); break;
9760 case DBGFEVENT_EXIT_RSM: VBOXVMM_EXIT_RSM(pVCpu, pCtx); break;
9761 case DBGFEVENT_EXIT_CRX_READ: VBOXVMM_EXIT_CRX_READ(pVCpu, pCtx, (uint8_t)uEventArg); break;
9762 case DBGFEVENT_EXIT_CRX_WRITE: VBOXVMM_EXIT_CRX_WRITE(pVCpu, pCtx, (uint8_t)uEventArg); break;
9763 case DBGFEVENT_EXIT_DRX_READ: VBOXVMM_EXIT_DRX_READ(pVCpu, pCtx, (uint8_t)uEventArg); break;
9764 case DBGFEVENT_EXIT_DRX_WRITE: VBOXVMM_EXIT_DRX_WRITE(pVCpu, pCtx, (uint8_t)uEventArg); break;
9765 case DBGFEVENT_EXIT_RDMSR: VBOXVMM_EXIT_RDMSR(pVCpu, pCtx, pCtx->ecx); break;
9766 case DBGFEVENT_EXIT_WRMSR: VBOXVMM_EXIT_WRMSR(pVCpu, pCtx, pCtx->ecx,
9767 RT_MAKE_U64(pCtx->eax, pCtx->edx)); break;
9768 case DBGFEVENT_EXIT_MWAIT: VBOXVMM_EXIT_MWAIT(pVCpu, pCtx); break;
9769 case DBGFEVENT_EXIT_MONITOR: VBOXVMM_EXIT_MONITOR(pVCpu, pCtx); break;
9770 case DBGFEVENT_EXIT_PAUSE: VBOXVMM_EXIT_PAUSE(pVCpu, pCtx); break;
9771 case DBGFEVENT_EXIT_SGDT: VBOXVMM_EXIT_SGDT(pVCpu, pCtx); break;
9772 case DBGFEVENT_EXIT_SIDT: VBOXVMM_EXIT_SIDT(pVCpu, pCtx); break;
9773 case DBGFEVENT_EXIT_LGDT: VBOXVMM_EXIT_LGDT(pVCpu, pCtx); break;
9774 case DBGFEVENT_EXIT_LIDT: VBOXVMM_EXIT_LIDT(pVCpu, pCtx); break;
9775 case DBGFEVENT_EXIT_SLDT: VBOXVMM_EXIT_SLDT(pVCpu, pCtx); break;
9776 case DBGFEVENT_EXIT_STR: VBOXVMM_EXIT_STR(pVCpu, pCtx); break;
9777 case DBGFEVENT_EXIT_LLDT: VBOXVMM_EXIT_LLDT(pVCpu, pCtx); break;
9778 case DBGFEVENT_EXIT_LTR: VBOXVMM_EXIT_LTR(pVCpu, pCtx); break;
9779 case DBGFEVENT_EXIT_RDTSCP: VBOXVMM_EXIT_RDTSCP(pVCpu, pCtx); break;
9780 case DBGFEVENT_EXIT_WBINVD: VBOXVMM_EXIT_WBINVD(pVCpu, pCtx); break;
9781 case DBGFEVENT_EXIT_XSETBV: VBOXVMM_EXIT_XSETBV(pVCpu, pCtx); break;
9782 case DBGFEVENT_EXIT_RDRAND: VBOXVMM_EXIT_RDRAND(pVCpu, pCtx); break;
9783 case DBGFEVENT_EXIT_RDSEED: VBOXVMM_EXIT_RDSEED(pVCpu, pCtx); break;
9784 case DBGFEVENT_EXIT_XSAVES: VBOXVMM_EXIT_XSAVES(pVCpu, pCtx); break;
9785 case DBGFEVENT_EXIT_XRSTORS: VBOXVMM_EXIT_XRSTORS(pVCpu, pCtx); break;
9786 case DBGFEVENT_EXIT_VMM_CALL: VBOXVMM_EXIT_VMM_CALL(pVCpu, pCtx); break;
9787 case DBGFEVENT_EXIT_VMX_VMCLEAR: VBOXVMM_EXIT_VMX_VMCLEAR(pVCpu, pCtx); break;
9788 case DBGFEVENT_EXIT_VMX_VMLAUNCH: VBOXVMM_EXIT_VMX_VMLAUNCH(pVCpu, pCtx); break;
9789 case DBGFEVENT_EXIT_VMX_VMPTRLD: VBOXVMM_EXIT_VMX_VMPTRLD(pVCpu, pCtx); break;
9790 case DBGFEVENT_EXIT_VMX_VMPTRST: VBOXVMM_EXIT_VMX_VMPTRST(pVCpu, pCtx); break;
9791 case DBGFEVENT_EXIT_VMX_VMREAD: VBOXVMM_EXIT_VMX_VMREAD(pVCpu, pCtx); break;
9792 case DBGFEVENT_EXIT_VMX_VMRESUME: VBOXVMM_EXIT_VMX_VMRESUME(pVCpu, pCtx); break;
9793 case DBGFEVENT_EXIT_VMX_VMWRITE: VBOXVMM_EXIT_VMX_VMWRITE(pVCpu, pCtx); break;
9794 case DBGFEVENT_EXIT_VMX_VMXOFF: VBOXVMM_EXIT_VMX_VMXOFF(pVCpu, pCtx); break;
9795 case DBGFEVENT_EXIT_VMX_VMXON: VBOXVMM_EXIT_VMX_VMXON(pVCpu, pCtx); break;
9796 case DBGFEVENT_EXIT_VMX_INVEPT: VBOXVMM_EXIT_VMX_INVEPT(pVCpu, pCtx); break;
9797 case DBGFEVENT_EXIT_VMX_INVVPID: VBOXVMM_EXIT_VMX_INVVPID(pVCpu, pCtx); break;
9798 case DBGFEVENT_EXIT_VMX_INVPCID: VBOXVMM_EXIT_VMX_INVPCID(pVCpu, pCtx); break;
9799 case DBGFEVENT_EXIT_VMX_VMFUNC: VBOXVMM_EXIT_VMX_VMFUNC(pVCpu, pCtx); break;
9800 case DBGFEVENT_EXIT_VMX_EPT_MISCONFIG: VBOXVMM_EXIT_VMX_EPT_MISCONFIG(pVCpu, pCtx); break;
9801 case DBGFEVENT_EXIT_VMX_EPT_VIOLATION: VBOXVMM_EXIT_VMX_EPT_VIOLATION(pVCpu, pCtx); break;
9802 case DBGFEVENT_EXIT_VMX_VAPIC_ACCESS: VBOXVMM_EXIT_VMX_VAPIC_ACCESS(pVCpu, pCtx); break;
9803 case DBGFEVENT_EXIT_VMX_VAPIC_WRITE: VBOXVMM_EXIT_VMX_VAPIC_WRITE(pVCpu, pCtx); break;
9804 default: AssertMsgFailed(("enmEvent2=%d uExitReason=%d\n", enmEvent2, uExitReason)); break;
9805 }
9806 }
9807
9808 /*
9809 * Fire of the DBGF event, if enabled (our check here is just a quick one,
9810 * the DBGF call will do a full check).
9811 *
9812 * Note! DBGF sets DBGFEVENT_INTERRUPT_SOFTWARE in the bitmap.
9813 * Note! If we have to events, we prioritize the first, i.e. the instruction
9814 * one, in order to avoid event nesting.
9815 */
9816 PVM pVM = pVCpu->CTX_SUFF(pVM);
9817 if ( enmEvent1 != DBGFEVENT_END
9818 && DBGF_IS_EVENT_ENABLED(pVM, enmEvent1))
9819 {
9820 HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_RIP);
9821 VBOXSTRICTRC rcStrict = DBGFEventGenericWithArgs(pVM, pVCpu, enmEvent1, DBGFEVENTCTX_HM, 1, uEventArg);
9822 if (rcStrict != VINF_SUCCESS)
9823 return rcStrict;
9824 }
9825 else if ( enmEvent2 != DBGFEVENT_END
9826 && DBGF_IS_EVENT_ENABLED(pVM, enmEvent2))
9827 {
9828 HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_RIP);
9829 VBOXSTRICTRC rcStrict = DBGFEventGenericWithArgs(pVM, pVCpu, enmEvent2, DBGFEVENTCTX_HM, 1, uEventArg);
9830 if (rcStrict != VINF_SUCCESS)
9831 return rcStrict;
9832 }
9833
9834 return VINF_SUCCESS;
9835}
9836
9837
9838/**
9839 * Single-stepping VM-exit filtering.
9840 *
9841 * This is preprocessing the VM-exits and deciding whether we've gotten far
9842 * enough to return VINF_EM_DBG_STEPPED already. If not, normal VM-exit
9843 * handling is performed.
9844 *
9845 * @returns Strict VBox status code (i.e. informational status codes too).
9846 * @param pVCpu The cross context virtual CPU structure of the calling EMT.
9847 * @param pVmxTransient Pointer to the VMX-transient structure.
9848 * @param pDbgState The debug state.
9849 */
9850DECLINLINE(VBOXSTRICTRC) hmR0VmxRunDebugHandleExit(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, PVMXRUNDBGSTATE pDbgState)
9851{
9852 /*
9853 * Expensive (saves context) generic dtrace VM-exit probe.
9854 */
9855 uint32_t const uExitReason = pVmxTransient->uExitReason;
9856 if (!VBOXVMM_R0_HMVMX_VMEXIT_ENABLED())
9857 { /* more likely */ }
9858 else
9859 {
9860 hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
9861 int rc = hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
9862 AssertRC(rc);
9863 VBOXVMM_R0_HMVMX_VMEXIT(pVCpu, &pVCpu->cpum.GstCtx, pVmxTransient->uExitReason, pVmxTransient->uExitQual);
9864 }
9865
9866 /*
9867 * Check for host NMI, just to get that out of the way.
9868 */
9869 if (uExitReason != VMX_EXIT_XCPT_OR_NMI)
9870 { /* normally likely */ }
9871 else
9872 {
9873 int rc2 = hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
9874 AssertRCReturn(rc2, rc2);
9875 uint32_t uIntType = VMX_EXIT_INT_INFO_TYPE(pVmxTransient->uExitIntInfo);
9876 if (uIntType == VMX_EXIT_INT_INFO_TYPE_NMI)
9877 return hmR0VmxExitXcptOrNmi(pVCpu, pVmxTransient);
9878 }
9879
9880 /*
9881 * Check for single stepping event if we're stepping.
9882 */
9883 if (pVCpu->hm.s.fSingleInstruction)
9884 {
9885 switch (uExitReason)
9886 {
9887 case VMX_EXIT_MTF:
9888 return hmR0VmxExitMtf(pVCpu, pVmxTransient);
9889
9890 /* Various events: */
9891 case VMX_EXIT_XCPT_OR_NMI:
9892 case VMX_EXIT_EXT_INT:
9893 case VMX_EXIT_TRIPLE_FAULT:
9894 case VMX_EXIT_INT_WINDOW:
9895 case VMX_EXIT_NMI_WINDOW:
9896 case VMX_EXIT_TASK_SWITCH:
9897 case VMX_EXIT_TPR_BELOW_THRESHOLD:
9898 case VMX_EXIT_APIC_ACCESS:
9899 case VMX_EXIT_EPT_VIOLATION:
9900 case VMX_EXIT_EPT_MISCONFIG:
9901 case VMX_EXIT_PREEMPT_TIMER:
9902
9903 /* Instruction specific VM-exits: */
9904 case VMX_EXIT_CPUID:
9905 case VMX_EXIT_GETSEC:
9906 case VMX_EXIT_HLT:
9907 case VMX_EXIT_INVD:
9908 case VMX_EXIT_INVLPG:
9909 case VMX_EXIT_RDPMC:
9910 case VMX_EXIT_RDTSC:
9911 case VMX_EXIT_RSM:
9912 case VMX_EXIT_VMCALL:
9913 case VMX_EXIT_VMCLEAR:
9914 case VMX_EXIT_VMLAUNCH:
9915 case VMX_EXIT_VMPTRLD:
9916 case VMX_EXIT_VMPTRST:
9917 case VMX_EXIT_VMREAD:
9918 case VMX_EXIT_VMRESUME:
9919 case VMX_EXIT_VMWRITE:
9920 case VMX_EXIT_VMXOFF:
9921 case VMX_EXIT_VMXON:
9922 case VMX_EXIT_MOV_CRX:
9923 case VMX_EXIT_MOV_DRX:
9924 case VMX_EXIT_IO_INSTR:
9925 case VMX_EXIT_RDMSR:
9926 case VMX_EXIT_WRMSR:
9927 case VMX_EXIT_MWAIT:
9928 case VMX_EXIT_MONITOR:
9929 case VMX_EXIT_PAUSE:
9930 case VMX_EXIT_GDTR_IDTR_ACCESS:
9931 case VMX_EXIT_LDTR_TR_ACCESS:
9932 case VMX_EXIT_INVEPT:
9933 case VMX_EXIT_RDTSCP:
9934 case VMX_EXIT_INVVPID:
9935 case VMX_EXIT_WBINVD:
9936 case VMX_EXIT_XSETBV:
9937 case VMX_EXIT_RDRAND:
9938 case VMX_EXIT_INVPCID:
9939 case VMX_EXIT_VMFUNC:
9940 case VMX_EXIT_RDSEED:
9941 case VMX_EXIT_XSAVES:
9942 case VMX_EXIT_XRSTORS:
9943 {
9944 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_RIP);
9945 AssertRCReturn(rc, rc);
9946 if ( pVCpu->cpum.GstCtx.rip != pDbgState->uRipStart
9947 || pVCpu->cpum.GstCtx.cs.Sel != pDbgState->uCsStart)
9948 return VINF_EM_DBG_STEPPED;
9949 break;
9950 }
9951
9952 /* Errors and unexpected events: */
9953 case VMX_EXIT_INIT_SIGNAL:
9954 case VMX_EXIT_SIPI:
9955 case VMX_EXIT_IO_SMI:
9956 case VMX_EXIT_SMI:
9957 case VMX_EXIT_ERR_INVALID_GUEST_STATE:
9958 case VMX_EXIT_ERR_MSR_LOAD:
9959 case VMX_EXIT_ERR_MACHINE_CHECK:
9960 case VMX_EXIT_APIC_WRITE: /* Some talk about this being fault like, so I guess we must process it? */
9961 break;
9962
9963 default:
9964 AssertMsgFailed(("Unexpected VM-exit=%#x\n", uExitReason));
9965 break;
9966 }
9967 }
9968
9969 /*
9970 * Check for debugger event breakpoints and dtrace probes.
9971 */
9972 if ( uExitReason < RT_ELEMENTS(pDbgState->bmExitsToCheck) * 32U
9973 && ASMBitTest(pDbgState->bmExitsToCheck, uExitReason) )
9974 {
9975 VBOXSTRICTRC rcStrict = hmR0VmxHandleExitDtraceEvents(pVCpu, pVmxTransient, uExitReason);
9976 if (rcStrict != VINF_SUCCESS)
9977 return rcStrict;
9978 }
9979
9980 /*
9981 * Normal processing.
9982 */
9983#ifdef HMVMX_USE_FUNCTION_TABLE
9984 return g_apfnVMExitHandlers[uExitReason](pVCpu, pVmxTransient);
9985#else
9986 return hmR0VmxHandleExit(pVCpu, pVmxTransient, uExitReason);
9987#endif
9988}
9989
9990
9991/**
9992 * Single steps guest code using VT-x.
9993 *
9994 * @returns Strict VBox status code (i.e. informational status codes too).
9995 * @param pVCpu The cross context virtual CPU structure.
9996 *
9997 * @note Mostly the same as hmR0VmxRunGuestCodeNormal().
9998 */
9999static VBOXSTRICTRC hmR0VmxRunGuestCodeDebug(PVMCPU pVCpu)
10000{
10001 VMXTRANSIENT VmxTransient;
10002 VmxTransient.fUpdateTscOffsettingAndPreemptTimer = true;
10003
10004 /* Set HMCPU indicators. */
10005 bool const fSavedSingleInstruction = pVCpu->hm.s.fSingleInstruction;
10006 pVCpu->hm.s.fSingleInstruction = pVCpu->hm.s.fSingleInstruction || DBGFIsStepping(pVCpu);
10007 pVCpu->hm.s.fDebugWantRdTscExit = false;
10008 pVCpu->hm.s.fUsingDebugLoop = true;
10009
10010 /* State we keep to help modify and later restore the VMCS fields we alter, and for detecting steps. */
10011 VMXRUNDBGSTATE DbgState;
10012 hmR0VmxRunDebugStateInit(pVCpu, &DbgState);
10013 hmR0VmxPreRunGuestDebugStateUpdate(pVCpu, &DbgState, &VmxTransient);
10014
10015 /*
10016 * The loop.
10017 */
10018 VBOXSTRICTRC rcStrict = VERR_INTERNAL_ERROR_5;
10019 for (uint32_t cLoops = 0; ; cLoops++)
10020 {
10021 Assert(!HMR0SuspendPending());
10022 HMVMX_ASSERT_CPU_SAFE(pVCpu);
10023 bool fStepping = pVCpu->hm.s.fSingleInstruction;
10024
10025 /*
10026 * Preparatory work for running guest code, this may force us to return
10027 * to ring-3. This bugger disables interrupts on VINF_SUCCESS!
10028 */
10029 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatEntry, x);
10030 hmR0VmxPreRunGuestDebugStateApply(pVCpu, &DbgState); /* Set up execute controls the next to can respond to. */
10031 rcStrict = hmR0VmxPreRunGuest(pVCpu, &VmxTransient, fStepping);
10032 if (rcStrict != VINF_SUCCESS)
10033 break;
10034
10035 hmR0VmxPreRunGuestCommitted(pVCpu, &VmxTransient);
10036 hmR0VmxPreRunGuestDebugStateApply(pVCpu, &DbgState); /* Override any obnoxious code in the above two calls. */
10037
10038 /*
10039 * Now we can run the guest code.
10040 */
10041 int rcRun = hmR0VmxRunGuest(pVCpu);
10042
10043 /*
10044 * Restore any residual host-state and save any bits shared between host
10045 * and guest into the guest-CPU state. Re-enables interrupts!
10046 */
10047 hmR0VmxPostRunGuest(pVCpu, &VmxTransient, rcRun);
10048
10049 /* Check for errors with running the VM (VMLAUNCH/VMRESUME). */
10050 if (RT_SUCCESS(rcRun))
10051 { /* very likely */ }
10052 else
10053 {
10054 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatPreExit, x);
10055 hmR0VmxReportWorldSwitchError(pVCpu, rcRun, &VmxTransient);
10056 return rcRun;
10057 }
10058
10059 /* Profile the VM-exit. */
10060 AssertMsg(VmxTransient.uExitReason <= VMX_EXIT_MAX, ("%#x\n", VmxTransient.uExitReason));
10061 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitAll);
10062 STAM_COUNTER_INC(&pVCpu->hm.s.paStatExitReasonR0[VmxTransient.uExitReason & MASK_EXITREASON_STAT]);
10063 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatPreExit, &pVCpu->hm.s.StatExitHandling, x);
10064 HMVMX_START_EXIT_DISPATCH_PROF();
10065
10066 VBOXVMM_R0_HMVMX_VMEXIT_NOCTX(pVCpu, &pVCpu->cpum.GstCtx, VmxTransient.uExitReason);
10067
10068 /*
10069 * Handle the VM-exit - we quit earlier on certain VM-exits, see hmR0VmxHandleExitDebug().
10070 */
10071 rcStrict = hmR0VmxRunDebugHandleExit(pVCpu, &VmxTransient, &DbgState);
10072 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitHandling, x);
10073 if (rcStrict != VINF_SUCCESS)
10074 break;
10075 if (cLoops > pVCpu->CTX_SUFF(pVM)->hm.s.cMaxResumeLoops)
10076 {
10077 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchMaxResumeLoops);
10078 rcStrict = VINF_EM_RAW_INTERRUPT;
10079 break;
10080 }
10081
10082 /*
10083 * Stepping: Did the RIP change, if so, consider it a single step.
10084 * Otherwise, make sure one of the TFs gets set.
10085 */
10086 if (fStepping)
10087 {
10088 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_RIP);
10089 AssertRC(rc);
10090 if ( pVCpu->cpum.GstCtx.rip != DbgState.uRipStart
10091 || pVCpu->cpum.GstCtx.cs.Sel != DbgState.uCsStart)
10092 {
10093 rcStrict = VINF_EM_DBG_STEPPED;
10094 break;
10095 }
10096 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_DR7);
10097 }
10098
10099 /*
10100 * Update when dtrace settings changes (DBGF kicks us, so no need to check).
10101 */
10102 if (VBOXVMM_GET_SETTINGS_SEQ_NO() != DbgState.uDtraceSettingsSeqNo)
10103 hmR0VmxPreRunGuestDebugStateUpdate(pVCpu, &DbgState, &VmxTransient);
10104 }
10105
10106 /*
10107 * Clear the X86_EFL_TF if necessary.
10108 */
10109 if (pVCpu->hm.s.fClearTrapFlag)
10110 {
10111 int rc = hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_RFLAGS);
10112 AssertRC(rc);
10113 pVCpu->hm.s.fClearTrapFlag = false;
10114 pVCpu->cpum.GstCtx.eflags.Bits.u1TF = 0;
10115 }
10116 /** @todo there seems to be issues with the resume flag when the monitor trap
10117 * flag is pending without being used. Seen early in bios init when
10118 * accessing APIC page in protected mode. */
10119
10120 /*
10121 * Restore VM-exit control settings as we may not reenter this function the
10122 * next time around.
10123 */
10124 rcStrict = hmR0VmxRunDebugStateRevert(pVCpu, &DbgState, rcStrict);
10125
10126 /* Restore HMCPU indicators. */
10127 pVCpu->hm.s.fUsingDebugLoop = false;
10128 pVCpu->hm.s.fDebugWantRdTscExit = false;
10129 pVCpu->hm.s.fSingleInstruction = fSavedSingleInstruction;
10130
10131 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatEntry, x);
10132 return rcStrict;
10133}
10134
10135
10136/** @} */
10137
10138
10139/**
10140 * Checks if any expensive dtrace probes are enabled and we should go to the
10141 * debug loop.
10142 *
10143 * @returns true if we should use debug loop, false if not.
10144 */
10145static bool hmR0VmxAnyExpensiveProbesEnabled(void)
10146{
10147 /* It's probably faster to OR the raw 32-bit counter variables together.
10148 Since the variables are in an array and the probes are next to one
10149 another (more or less), we have good locality. So, better read
10150 eight-nine cache lines ever time and only have one conditional, than
10151 128+ conditionals, right? */
10152 return ( VBOXVMM_R0_HMVMX_VMEXIT_ENABLED_RAW() /* expensive too due to context */
10153 | VBOXVMM_XCPT_DE_ENABLED_RAW()
10154 | VBOXVMM_XCPT_DB_ENABLED_RAW()
10155 | VBOXVMM_XCPT_BP_ENABLED_RAW()
10156 | VBOXVMM_XCPT_OF_ENABLED_RAW()
10157 | VBOXVMM_XCPT_BR_ENABLED_RAW()
10158 | VBOXVMM_XCPT_UD_ENABLED_RAW()
10159 | VBOXVMM_XCPT_NM_ENABLED_RAW()
10160 | VBOXVMM_XCPT_DF_ENABLED_RAW()
10161 | VBOXVMM_XCPT_TS_ENABLED_RAW()
10162 | VBOXVMM_XCPT_NP_ENABLED_RAW()
10163 | VBOXVMM_XCPT_SS_ENABLED_RAW()
10164 | VBOXVMM_XCPT_GP_ENABLED_RAW()
10165 | VBOXVMM_XCPT_PF_ENABLED_RAW()
10166 | VBOXVMM_XCPT_MF_ENABLED_RAW()
10167 | VBOXVMM_XCPT_AC_ENABLED_RAW()
10168 | VBOXVMM_XCPT_XF_ENABLED_RAW()
10169 | VBOXVMM_XCPT_VE_ENABLED_RAW()
10170 | VBOXVMM_XCPT_SX_ENABLED_RAW()
10171 | VBOXVMM_INT_SOFTWARE_ENABLED_RAW()
10172 | VBOXVMM_INT_HARDWARE_ENABLED_RAW()
10173 ) != 0
10174 || ( VBOXVMM_INSTR_HALT_ENABLED_RAW()
10175 | VBOXVMM_INSTR_MWAIT_ENABLED_RAW()
10176 | VBOXVMM_INSTR_MONITOR_ENABLED_RAW()
10177 | VBOXVMM_INSTR_CPUID_ENABLED_RAW()
10178 | VBOXVMM_INSTR_INVD_ENABLED_RAW()
10179 | VBOXVMM_INSTR_WBINVD_ENABLED_RAW()
10180 | VBOXVMM_INSTR_INVLPG_ENABLED_RAW()
10181 | VBOXVMM_INSTR_RDTSC_ENABLED_RAW()
10182 | VBOXVMM_INSTR_RDTSCP_ENABLED_RAW()
10183 | VBOXVMM_INSTR_RDPMC_ENABLED_RAW()
10184 | VBOXVMM_INSTR_RDMSR_ENABLED_RAW()
10185 | VBOXVMM_INSTR_WRMSR_ENABLED_RAW()
10186 | VBOXVMM_INSTR_CRX_READ_ENABLED_RAW()
10187 | VBOXVMM_INSTR_CRX_WRITE_ENABLED_RAW()
10188 | VBOXVMM_INSTR_DRX_READ_ENABLED_RAW()
10189 | VBOXVMM_INSTR_DRX_WRITE_ENABLED_RAW()
10190 | VBOXVMM_INSTR_PAUSE_ENABLED_RAW()
10191 | VBOXVMM_INSTR_XSETBV_ENABLED_RAW()
10192 | VBOXVMM_INSTR_SIDT_ENABLED_RAW()
10193 | VBOXVMM_INSTR_LIDT_ENABLED_RAW()
10194 | VBOXVMM_INSTR_SGDT_ENABLED_RAW()
10195 | VBOXVMM_INSTR_LGDT_ENABLED_RAW()
10196 | VBOXVMM_INSTR_SLDT_ENABLED_RAW()
10197 | VBOXVMM_INSTR_LLDT_ENABLED_RAW()
10198 | VBOXVMM_INSTR_STR_ENABLED_RAW()
10199 | VBOXVMM_INSTR_LTR_ENABLED_RAW()
10200 | VBOXVMM_INSTR_GETSEC_ENABLED_RAW()
10201 | VBOXVMM_INSTR_RSM_ENABLED_RAW()
10202 | VBOXVMM_INSTR_RDRAND_ENABLED_RAW()
10203 | VBOXVMM_INSTR_RDSEED_ENABLED_RAW()
10204 | VBOXVMM_INSTR_XSAVES_ENABLED_RAW()
10205 | VBOXVMM_INSTR_XRSTORS_ENABLED_RAW()
10206 | VBOXVMM_INSTR_VMM_CALL_ENABLED_RAW()
10207 | VBOXVMM_INSTR_VMX_VMCLEAR_ENABLED_RAW()
10208 | VBOXVMM_INSTR_VMX_VMLAUNCH_ENABLED_RAW()
10209 | VBOXVMM_INSTR_VMX_VMPTRLD_ENABLED_RAW()
10210 | VBOXVMM_INSTR_VMX_VMPTRST_ENABLED_RAW()
10211 | VBOXVMM_INSTR_VMX_VMREAD_ENABLED_RAW()
10212 | VBOXVMM_INSTR_VMX_VMRESUME_ENABLED_RAW()
10213 | VBOXVMM_INSTR_VMX_VMWRITE_ENABLED_RAW()
10214 | VBOXVMM_INSTR_VMX_VMXOFF_ENABLED_RAW()
10215 | VBOXVMM_INSTR_VMX_VMXON_ENABLED_RAW()
10216 | VBOXVMM_INSTR_VMX_VMFUNC_ENABLED_RAW()
10217 | VBOXVMM_INSTR_VMX_INVEPT_ENABLED_RAW()
10218 | VBOXVMM_INSTR_VMX_INVVPID_ENABLED_RAW()
10219 | VBOXVMM_INSTR_VMX_INVPCID_ENABLED_RAW()
10220 ) != 0
10221 || ( VBOXVMM_EXIT_TASK_SWITCH_ENABLED_RAW()
10222 | VBOXVMM_EXIT_HALT_ENABLED_RAW()
10223 | VBOXVMM_EXIT_MWAIT_ENABLED_RAW()
10224 | VBOXVMM_EXIT_MONITOR_ENABLED_RAW()
10225 | VBOXVMM_EXIT_CPUID_ENABLED_RAW()
10226 | VBOXVMM_EXIT_INVD_ENABLED_RAW()
10227 | VBOXVMM_EXIT_WBINVD_ENABLED_RAW()
10228 | VBOXVMM_EXIT_INVLPG_ENABLED_RAW()
10229 | VBOXVMM_EXIT_RDTSC_ENABLED_RAW()
10230 | VBOXVMM_EXIT_RDTSCP_ENABLED_RAW()
10231 | VBOXVMM_EXIT_RDPMC_ENABLED_RAW()
10232 | VBOXVMM_EXIT_RDMSR_ENABLED_RAW()
10233 | VBOXVMM_EXIT_WRMSR_ENABLED_RAW()
10234 | VBOXVMM_EXIT_CRX_READ_ENABLED_RAW()
10235 | VBOXVMM_EXIT_CRX_WRITE_ENABLED_RAW()
10236 | VBOXVMM_EXIT_DRX_READ_ENABLED_RAW()
10237 | VBOXVMM_EXIT_DRX_WRITE_ENABLED_RAW()
10238 | VBOXVMM_EXIT_PAUSE_ENABLED_RAW()
10239 | VBOXVMM_EXIT_XSETBV_ENABLED_RAW()
10240 | VBOXVMM_EXIT_SIDT_ENABLED_RAW()
10241 | VBOXVMM_EXIT_LIDT_ENABLED_RAW()
10242 | VBOXVMM_EXIT_SGDT_ENABLED_RAW()
10243 | VBOXVMM_EXIT_LGDT_ENABLED_RAW()
10244 | VBOXVMM_EXIT_SLDT_ENABLED_RAW()
10245 | VBOXVMM_EXIT_LLDT_ENABLED_RAW()
10246 | VBOXVMM_EXIT_STR_ENABLED_RAW()
10247 | VBOXVMM_EXIT_LTR_ENABLED_RAW()
10248 | VBOXVMM_EXIT_GETSEC_ENABLED_RAW()
10249 | VBOXVMM_EXIT_RSM_ENABLED_RAW()
10250 | VBOXVMM_EXIT_RDRAND_ENABLED_RAW()
10251 | VBOXVMM_EXIT_RDSEED_ENABLED_RAW()
10252 | VBOXVMM_EXIT_XSAVES_ENABLED_RAW()
10253 | VBOXVMM_EXIT_XRSTORS_ENABLED_RAW()
10254 | VBOXVMM_EXIT_VMM_CALL_ENABLED_RAW()
10255 | VBOXVMM_EXIT_VMX_VMCLEAR_ENABLED_RAW()
10256 | VBOXVMM_EXIT_VMX_VMLAUNCH_ENABLED_RAW()
10257 | VBOXVMM_EXIT_VMX_VMPTRLD_ENABLED_RAW()
10258 | VBOXVMM_EXIT_VMX_VMPTRST_ENABLED_RAW()
10259 | VBOXVMM_EXIT_VMX_VMREAD_ENABLED_RAW()
10260 | VBOXVMM_EXIT_VMX_VMRESUME_ENABLED_RAW()
10261 | VBOXVMM_EXIT_VMX_VMWRITE_ENABLED_RAW()
10262 | VBOXVMM_EXIT_VMX_VMXOFF_ENABLED_RAW()
10263 | VBOXVMM_EXIT_VMX_VMXON_ENABLED_RAW()
10264 | VBOXVMM_EXIT_VMX_VMFUNC_ENABLED_RAW()
10265 | VBOXVMM_EXIT_VMX_INVEPT_ENABLED_RAW()
10266 | VBOXVMM_EXIT_VMX_INVVPID_ENABLED_RAW()
10267 | VBOXVMM_EXIT_VMX_INVPCID_ENABLED_RAW()
10268 | VBOXVMM_EXIT_VMX_EPT_VIOLATION_ENABLED_RAW()
10269 | VBOXVMM_EXIT_VMX_EPT_MISCONFIG_ENABLED_RAW()
10270 | VBOXVMM_EXIT_VMX_VAPIC_ACCESS_ENABLED_RAW()
10271 | VBOXVMM_EXIT_VMX_VAPIC_WRITE_ENABLED_RAW()
10272 ) != 0;
10273}
10274
10275
10276/**
10277 * Runs the guest code using VT-x.
10278 *
10279 * @returns Strict VBox status code (i.e. informational status codes too).
10280 * @param pVCpu The cross context virtual CPU structure.
10281 */
10282VMMR0DECL(VBOXSTRICTRC) VMXR0RunGuestCode(PVMCPU pVCpu)
10283{
10284 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
10285 Assert(VMMRZCallRing3IsEnabled(pVCpu));
10286 Assert(!ASMAtomicUoReadU64(&pCtx->fExtrn));
10287 HMVMX_ASSERT_PREEMPT_SAFE(pVCpu);
10288
10289 VMMRZCallRing3SetNotification(pVCpu, hmR0VmxCallRing3Callback, pCtx);
10290
10291 VBOXSTRICTRC rcStrict;
10292 if ( !pVCpu->hm.s.fUseDebugLoop
10293 && (!VBOXVMM_ANY_PROBES_ENABLED() || !hmR0VmxAnyExpensiveProbesEnabled())
10294 && !DBGFIsStepping(pVCpu)
10295 && !pVCpu->CTX_SUFF(pVM)->dbgf.ro.cEnabledInt3Breakpoints)
10296 rcStrict = hmR0VmxRunGuestCodeNormal(pVCpu);
10297 else
10298 rcStrict = hmR0VmxRunGuestCodeDebug(pVCpu);
10299
10300 if (rcStrict == VERR_EM_INTERPRETER)
10301 rcStrict = VINF_EM_RAW_EMULATE_INSTR;
10302 else if (rcStrict == VINF_EM_RESET)
10303 rcStrict = VINF_EM_TRIPLE_FAULT;
10304
10305 int rc2 = hmR0VmxExitToRing3(pVCpu, rcStrict);
10306 if (RT_FAILURE(rc2))
10307 {
10308 pVCpu->hm.s.u32HMError = (uint32_t)VBOXSTRICTRC_VAL(rcStrict);
10309 rcStrict = rc2;
10310 }
10311 Assert(!ASMAtomicUoReadU64(&pCtx->fExtrn));
10312 Assert(!VMMRZCallRing3IsNotificationSet(pVCpu));
10313 return rcStrict;
10314}
10315
10316
10317#ifndef HMVMX_USE_FUNCTION_TABLE
10318DECLINLINE(VBOXSTRICTRC) hmR0VmxHandleExit(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, uint32_t rcReason)
10319{
10320#ifdef DEBUG_ramshankar
10321#define VMEXIT_CALL_RET(a_fSave, a_CallExpr) \
10322 do { \
10323 if (a_fSave != 0) \
10324 hmR0VmxImportGuestState(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL); \
10325 VBOXSTRICTRC rcStrict = a_CallExpr; \
10326 if (a_fSave != 0) \
10327 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST); \
10328 return rcStrict; \
10329 } while (0)
10330#else
10331# define VMEXIT_CALL_RET(a_fSave, a_CallExpr) return a_CallExpr
10332#endif
10333 switch (rcReason)
10334 {
10335 case VMX_EXIT_EPT_MISCONFIG: VMEXIT_CALL_RET(0, hmR0VmxExitEptMisconfig(pVCpu, pVmxTransient));
10336 case VMX_EXIT_EPT_VIOLATION: VMEXIT_CALL_RET(0, hmR0VmxExitEptViolation(pVCpu, pVmxTransient));
10337 case VMX_EXIT_IO_INSTR: VMEXIT_CALL_RET(0, hmR0VmxExitIoInstr(pVCpu, pVmxTransient));
10338 case VMX_EXIT_CPUID: VMEXIT_CALL_RET(0, hmR0VmxExitCpuid(pVCpu, pVmxTransient));
10339 case VMX_EXIT_RDTSC: VMEXIT_CALL_RET(0, hmR0VmxExitRdtsc(pVCpu, pVmxTransient));
10340 case VMX_EXIT_RDTSCP: VMEXIT_CALL_RET(0, hmR0VmxExitRdtscp(pVCpu, pVmxTransient));
10341 case VMX_EXIT_APIC_ACCESS: VMEXIT_CALL_RET(0, hmR0VmxExitApicAccess(pVCpu, pVmxTransient));
10342 case VMX_EXIT_XCPT_OR_NMI: VMEXIT_CALL_RET(0, hmR0VmxExitXcptOrNmi(pVCpu, pVmxTransient));
10343 case VMX_EXIT_MOV_CRX: VMEXIT_CALL_RET(0, hmR0VmxExitMovCRx(pVCpu, pVmxTransient));
10344 case VMX_EXIT_EXT_INT: VMEXIT_CALL_RET(0, hmR0VmxExitExtInt(pVCpu, pVmxTransient));
10345 case VMX_EXIT_INT_WINDOW: VMEXIT_CALL_RET(0, hmR0VmxExitIntWindow(pVCpu, pVmxTransient));
10346 case VMX_EXIT_TPR_BELOW_THRESHOLD: VMEXIT_CALL_RET(0, hmR0VmxExitTprBelowThreshold(pVCpu, pVmxTransient));
10347 case VMX_EXIT_MWAIT: VMEXIT_CALL_RET(0, hmR0VmxExitMwait(pVCpu, pVmxTransient));
10348 case VMX_EXIT_MONITOR: VMEXIT_CALL_RET(0, hmR0VmxExitMonitor(pVCpu, pVmxTransient));
10349 case VMX_EXIT_TASK_SWITCH: VMEXIT_CALL_RET(0, hmR0VmxExitTaskSwitch(pVCpu, pVmxTransient));
10350 case VMX_EXIT_PREEMPT_TIMER: VMEXIT_CALL_RET(0, hmR0VmxExitPreemptTimer(pVCpu, pVmxTransient));
10351 case VMX_EXIT_RDMSR: VMEXIT_CALL_RET(0, hmR0VmxExitRdmsr(pVCpu, pVmxTransient));
10352 case VMX_EXIT_WRMSR: VMEXIT_CALL_RET(0, hmR0VmxExitWrmsr(pVCpu, pVmxTransient));
10353 case VMX_EXIT_VMCALL: VMEXIT_CALL_RET(0, hmR0VmxExitVmcall(pVCpu, pVmxTransient));
10354 case VMX_EXIT_MOV_DRX: VMEXIT_CALL_RET(0, hmR0VmxExitMovDRx(pVCpu, pVmxTransient));
10355 case VMX_EXIT_HLT: VMEXIT_CALL_RET(0, hmR0VmxExitHlt(pVCpu, pVmxTransient));
10356 case VMX_EXIT_INVD: VMEXIT_CALL_RET(0, hmR0VmxExitInvd(pVCpu, pVmxTransient));
10357 case VMX_EXIT_INVLPG: VMEXIT_CALL_RET(0, hmR0VmxExitInvlpg(pVCpu, pVmxTransient));
10358 case VMX_EXIT_RSM: VMEXIT_CALL_RET(0, hmR0VmxExitRsm(pVCpu, pVmxTransient));
10359 case VMX_EXIT_MTF: VMEXIT_CALL_RET(0, hmR0VmxExitMtf(pVCpu, pVmxTransient));
10360 case VMX_EXIT_PAUSE: VMEXIT_CALL_RET(0, hmR0VmxExitPause(pVCpu, pVmxTransient));
10361 case VMX_EXIT_GDTR_IDTR_ACCESS: VMEXIT_CALL_RET(0, hmR0VmxExitXdtrAccess(pVCpu, pVmxTransient));
10362 case VMX_EXIT_LDTR_TR_ACCESS: VMEXIT_CALL_RET(0, hmR0VmxExitXdtrAccess(pVCpu, pVmxTransient));
10363 case VMX_EXIT_WBINVD: VMEXIT_CALL_RET(0, hmR0VmxExitWbinvd(pVCpu, pVmxTransient));
10364 case VMX_EXIT_XSETBV: VMEXIT_CALL_RET(0, hmR0VmxExitXsetbv(pVCpu, pVmxTransient));
10365 case VMX_EXIT_RDRAND: VMEXIT_CALL_RET(0, hmR0VmxExitRdrand(pVCpu, pVmxTransient));
10366 case VMX_EXIT_INVPCID: VMEXIT_CALL_RET(0, hmR0VmxExitInvpcid(pVCpu, pVmxTransient));
10367 case VMX_EXIT_GETSEC: VMEXIT_CALL_RET(0, hmR0VmxExitGetsec(pVCpu, pVmxTransient));
10368 case VMX_EXIT_RDPMC: VMEXIT_CALL_RET(0, hmR0VmxExitRdpmc(pVCpu, pVmxTransient));
10369
10370 case VMX_EXIT_TRIPLE_FAULT: return hmR0VmxExitTripleFault(pVCpu, pVmxTransient);
10371 case VMX_EXIT_NMI_WINDOW: return hmR0VmxExitNmiWindow(pVCpu, pVmxTransient);
10372 case VMX_EXIT_INIT_SIGNAL: return hmR0VmxExitInitSignal(pVCpu, pVmxTransient);
10373 case VMX_EXIT_SIPI: return hmR0VmxExitSipi(pVCpu, pVmxTransient);
10374 case VMX_EXIT_IO_SMI: return hmR0VmxExitIoSmi(pVCpu, pVmxTransient);
10375 case VMX_EXIT_SMI: return hmR0VmxExitSmi(pVCpu, pVmxTransient);
10376 case VMX_EXIT_ERR_MSR_LOAD: return hmR0VmxExitErrMsrLoad(pVCpu, pVmxTransient);
10377 case VMX_EXIT_ERR_INVALID_GUEST_STATE: return hmR0VmxExitErrInvalidGuestState(pVCpu, pVmxTransient);
10378 case VMX_EXIT_ERR_MACHINE_CHECK: return hmR0VmxExitErrMachineCheck(pVCpu, pVmxTransient);
10379
10380 case VMX_EXIT_VMCLEAR:
10381 case VMX_EXIT_VMLAUNCH:
10382 case VMX_EXIT_VMPTRLD:
10383 case VMX_EXIT_VMPTRST:
10384 case VMX_EXIT_VMREAD:
10385 case VMX_EXIT_VMRESUME:
10386 case VMX_EXIT_VMWRITE:
10387 case VMX_EXIT_VMXOFF:
10388 case VMX_EXIT_VMXON:
10389 case VMX_EXIT_INVEPT:
10390 case VMX_EXIT_INVVPID:
10391 case VMX_EXIT_VMFUNC:
10392 case VMX_EXIT_XSAVES:
10393 case VMX_EXIT_XRSTORS:
10394 return hmR0VmxExitSetPendingXcptUD(pVCpu, pVmxTransient);
10395
10396 case VMX_EXIT_ENCLS:
10397 case VMX_EXIT_RDSEED: /* only spurious VM-exits, so undefined */
10398 case VMX_EXIT_PML_FULL:
10399 default:
10400 return hmR0VmxExitErrUndefined(pVCpu, pVmxTransient);
10401 }
10402#undef VMEXIT_CALL_RET
10403}
10404#endif /* !HMVMX_USE_FUNCTION_TABLE */
10405
10406
10407#ifdef VBOX_STRICT
10408/* Is there some generic IPRT define for this that are not in Runtime/internal/\* ?? */
10409# define HMVMX_ASSERT_PREEMPT_CPUID_VAR() \
10410 RTCPUID const idAssertCpu = RTThreadPreemptIsEnabled(NIL_RTTHREAD) ? NIL_RTCPUID : RTMpCpuId()
10411
10412# define HMVMX_ASSERT_PREEMPT_CPUID() \
10413 do { \
10414 RTCPUID const idAssertCpuNow = RTThreadPreemptIsEnabled(NIL_RTTHREAD) ? NIL_RTCPUID : RTMpCpuId(); \
10415 AssertMsg(idAssertCpu == idAssertCpuNow, ("VMX %#x, %#x\n", idAssertCpu, idAssertCpuNow)); \
10416 } while (0)
10417
10418# define HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(a_pVCpu, a_pVmxTransient) \
10419 do { \
10420 AssertPtr((a_pVCpu)); \
10421 AssertPtr((a_pVmxTransient)); \
10422 Assert((a_pVmxTransient)->fVMEntryFailed == false); \
10423 Assert(ASMIntAreEnabled()); \
10424 HMVMX_ASSERT_PREEMPT_SAFE(a_pVCpu); \
10425 HMVMX_ASSERT_PREEMPT_CPUID_VAR(); \
10426 Log4Func(("vcpu[%RU32] -v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v\n", (a_pVCpu)->idCpu)); \
10427 HMVMX_ASSERT_PREEMPT_SAFE(a_pVCpu); \
10428 if (VMMR0IsLogFlushDisabled((a_pVCpu))) \
10429 HMVMX_ASSERT_PREEMPT_CPUID(); \
10430 HMVMX_STOP_EXIT_DISPATCH_PROF(); \
10431 } while (0)
10432
10433# define HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(a_pVCpu, a_pVmxTransient) \
10434 do { \
10435 Log4Func(("\n")); \
10436 } while (0)
10437#else
10438# define HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(a_pVCpu, a_pVmxTransient) \
10439 do { \
10440 HMVMX_STOP_EXIT_DISPATCH_PROF(); \
10441 NOREF((a_pVCpu)); NOREF((a_pVmxTransient)); \
10442 } while (0)
10443# define HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(a_pVCpu, a_pVmxTransient) do { } while (0)
10444#endif
10445
10446
10447/**
10448 * Advances the guest RIP by the specified number of bytes.
10449 *
10450 * @param pVCpu The cross context virtual CPU structure.
10451 * @param cbInstr Number of bytes to advance the RIP by.
10452 *
10453 * @remarks No-long-jump zone!!!
10454 */
10455DECLINLINE(void) hmR0VmxAdvanceGuestRipBy(PVMCPU pVCpu, uint32_t cbInstr)
10456{
10457 /* Advance the RIP. */
10458 pVCpu->cpum.GstCtx.rip += cbInstr;
10459 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP);
10460
10461 /* Update interrupt inhibition. */
10462 if ( VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS)
10463 && pVCpu->cpum.GstCtx.rip != EMGetInhibitInterruptsPC(pVCpu))
10464 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
10465}
10466
10467
10468/**
10469 * Advances the guest RIP after reading it from the VMCS.
10470 *
10471 * @returns VBox status code, no informational status codes.
10472 * @param pVCpu The cross context virtual CPU structure.
10473 * @param pVmxTransient Pointer to the VMX transient structure.
10474 *
10475 * @remarks No-long-jump zone!!!
10476 */
10477static int hmR0VmxAdvanceGuestRip(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
10478{
10479 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
10480 rc |= hmR0VmxImportGuestState(pVCpu, CPUMCTX_EXTRN_RIP | CPUMCTX_EXTRN_RFLAGS);
10481 AssertRCReturn(rc, rc);
10482
10483 hmR0VmxAdvanceGuestRipBy(pVCpu, pVmxTransient->cbInstr);
10484 return VINF_SUCCESS;
10485}
10486
10487
10488/**
10489 * Tries to determine what part of the guest-state VT-x has deemed as invalid
10490 * and update error record fields accordingly.
10491 *
10492 * @return VMX_IGS_* return codes.
10493 * @retval VMX_IGS_REASON_NOT_FOUND if this function could not find anything
10494 * wrong with the guest state.
10495 *
10496 * @param pVCpu The cross context virtual CPU structure.
10497 *
10498 * @remarks This function assumes our cache of the VMCS controls
10499 * are valid, i.e. hmR0VmxCheckVmcsCtls() succeeded.
10500 */
10501static uint32_t hmR0VmxCheckGuestState(PVMCPU pVCpu)
10502{
10503#define HMVMX_ERROR_BREAK(err) { uError = (err); break; }
10504#define HMVMX_CHECK_BREAK(expr, err) if (!(expr)) { \
10505 uError = (err); \
10506 break; \
10507 } else do { } while (0)
10508
10509 int rc;
10510 PVM pVM = pVCpu->CTX_SUFF(pVM);
10511 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
10512 uint32_t uError = VMX_IGS_ERROR;
10513 uint32_t u32Val;
10514 bool const fUnrestrictedGuest = pVM->hm.s.vmx.fUnrestrictedGuest;
10515
10516 do
10517 {
10518 /*
10519 * CR0.
10520 */
10521 uint32_t fSetCr0 = (uint32_t)(pVM->hm.s.vmx.Msrs.u64Cr0Fixed0 & pVM->hm.s.vmx.Msrs.u64Cr0Fixed1);
10522 uint32_t const fZapCr0 = (uint32_t)(pVM->hm.s.vmx.Msrs.u64Cr0Fixed0 | pVM->hm.s.vmx.Msrs.u64Cr0Fixed1);
10523 /* Exceptions for unrestricted-guests for fixed CR0 bits (PE, PG).
10524 See Intel spec. 26.3.1 "Checks on Guest Control Registers, Debug Registers and MSRs." */
10525 if (fUnrestrictedGuest)
10526 fSetCr0 &= ~(X86_CR0_PE | X86_CR0_PG);
10527
10528 uint32_t u32GuestCr0;
10529 rc = VMXReadVmcs32(VMX_VMCS_GUEST_CR0, &u32GuestCr0);
10530 AssertRCBreak(rc);
10531 HMVMX_CHECK_BREAK((u32GuestCr0 & fSetCr0) == fSetCr0, VMX_IGS_CR0_FIXED1);
10532 HMVMX_CHECK_BREAK(!(u32GuestCr0 & ~fZapCr0), VMX_IGS_CR0_FIXED0);
10533 if ( !fUnrestrictedGuest
10534 && (u32GuestCr0 & X86_CR0_PG)
10535 && !(u32GuestCr0 & X86_CR0_PE))
10536 {
10537 HMVMX_ERROR_BREAK(VMX_IGS_CR0_PG_PE_COMBO);
10538 }
10539
10540 /*
10541 * CR4.
10542 */
10543 uint64_t const fSetCr4 = (pVM->hm.s.vmx.Msrs.u64Cr4Fixed0 & pVM->hm.s.vmx.Msrs.u64Cr4Fixed1);
10544 uint64_t const fZapCr4 = (pVM->hm.s.vmx.Msrs.u64Cr4Fixed0 | pVM->hm.s.vmx.Msrs.u64Cr4Fixed1);
10545
10546 uint32_t u32GuestCr4;
10547 rc = VMXReadVmcs32(VMX_VMCS_GUEST_CR4, &u32GuestCr4);
10548 AssertRCBreak(rc);
10549 HMVMX_CHECK_BREAK((u32GuestCr4 & fSetCr4) == fSetCr4, VMX_IGS_CR4_FIXED1);
10550 HMVMX_CHECK_BREAK(!(u32GuestCr4 & ~fZapCr4), VMX_IGS_CR4_FIXED0);
10551
10552 /*
10553 * IA32_DEBUGCTL MSR.
10554 */
10555 uint64_t u64Val;
10556 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_DEBUGCTL_FULL, &u64Val);
10557 AssertRCBreak(rc);
10558 if ( (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_DEBUG)
10559 && (u64Val & 0xfffffe3c)) /* Bits 31:9, bits 5:2 MBZ. */
10560 {
10561 HMVMX_ERROR_BREAK(VMX_IGS_DEBUGCTL_MSR_RESERVED);
10562 }
10563 uint64_t u64DebugCtlMsr = u64Val;
10564
10565#ifdef VBOX_STRICT
10566 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY, &u32Val);
10567 AssertRCBreak(rc);
10568 Assert(u32Val == pVCpu->hm.s.vmx.u32EntryCtls);
10569#endif
10570 bool const fLongModeGuest = RT_BOOL(pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_IA32E_MODE_GUEST);
10571
10572 /*
10573 * RIP and RFLAGS.
10574 */
10575 uint32_t u32Eflags;
10576#if HC_ARCH_BITS == 64
10577 rc = VMXReadVmcs64(VMX_VMCS_GUEST_RIP, &u64Val);
10578 AssertRCBreak(rc);
10579 /* pCtx->rip can be different than the one in the VMCS (e.g. run guest code and VM-exits that don't update it). */
10580 if ( !fLongModeGuest
10581 || !pCtx->cs.Attr.n.u1Long)
10582 {
10583 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0xffffffff00000000)), VMX_IGS_LONGMODE_RIP_INVALID);
10584 }
10585 /** @todo If the processor supports N < 64 linear-address bits, bits 63:N
10586 * must be identical if the "IA-32e mode guest" VM-entry
10587 * control is 1 and CS.L is 1. No check applies if the
10588 * CPU supports 64 linear-address bits. */
10589
10590 /* Flags in pCtx can be different (real-on-v86 for instance). We are only concerned about the VMCS contents here. */
10591 rc = VMXReadVmcs64(VMX_VMCS_GUEST_RFLAGS, &u64Val);
10592 AssertRCBreak(rc);
10593 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0xffffffffffc08028)), /* Bit 63:22, Bit 15, 5, 3 MBZ. */
10594 VMX_IGS_RFLAGS_RESERVED);
10595 HMVMX_CHECK_BREAK((u64Val & X86_EFL_RA1_MASK), VMX_IGS_RFLAGS_RESERVED1); /* Bit 1 MB1. */
10596 u32Eflags = u64Val;
10597#else
10598 rc = VMXReadVmcs32(VMX_VMCS_GUEST_RFLAGS, &u32Eflags);
10599 AssertRCBreak(rc);
10600 HMVMX_CHECK_BREAK(!(u32Eflags & 0xffc08028), VMX_IGS_RFLAGS_RESERVED); /* Bit 31:22, Bit 15, 5, 3 MBZ. */
10601 HMVMX_CHECK_BREAK((u32Eflags & X86_EFL_RA1_MASK), VMX_IGS_RFLAGS_RESERVED1); /* Bit 1 MB1. */
10602#endif
10603
10604 if ( fLongModeGuest
10605 || ( fUnrestrictedGuest
10606 && !(u32GuestCr0 & X86_CR0_PE)))
10607 {
10608 HMVMX_CHECK_BREAK(!(u32Eflags & X86_EFL_VM), VMX_IGS_RFLAGS_VM_INVALID);
10609 }
10610
10611 uint32_t u32EntryInfo;
10612 rc = VMXReadVmcs32(VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO, &u32EntryInfo);
10613 AssertRCBreak(rc);
10614 if ( VMX_ENTRY_INT_INFO_IS_VALID(u32EntryInfo)
10615 && VMX_ENTRY_INT_INFO_TYPE(u32EntryInfo) == VMX_EXIT_INT_INFO_TYPE_EXT_INT)
10616 {
10617 HMVMX_CHECK_BREAK(u32Eflags & X86_EFL_IF, VMX_IGS_RFLAGS_IF_INVALID);
10618 }
10619
10620 /*
10621 * 64-bit checks.
10622 */
10623#if HC_ARCH_BITS == 64
10624 if (fLongModeGuest)
10625 {
10626 HMVMX_CHECK_BREAK(u32GuestCr0 & X86_CR0_PG, VMX_IGS_CR0_PG_LONGMODE);
10627 HMVMX_CHECK_BREAK(u32GuestCr4 & X86_CR4_PAE, VMX_IGS_CR4_PAE_LONGMODE);
10628 }
10629
10630 if ( !fLongModeGuest
10631 && (u32GuestCr4 & X86_CR4_PCIDE))
10632 {
10633 HMVMX_ERROR_BREAK(VMX_IGS_CR4_PCIDE);
10634 }
10635
10636 /** @todo CR3 field must be such that bits 63:52 and bits in the range
10637 * 51:32 beyond the processor's physical-address width are 0. */
10638
10639 if ( (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_DEBUG)
10640 && (pCtx->dr[7] & X86_DR7_MBZ_MASK))
10641 {
10642 HMVMX_ERROR_BREAK(VMX_IGS_DR7_RESERVED);
10643 }
10644
10645 rc = VMXReadVmcs64(VMX_VMCS_HOST_SYSENTER_ESP, &u64Val);
10646 AssertRCBreak(rc);
10647 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(u64Val), VMX_IGS_SYSENTER_ESP_NOT_CANONICAL);
10648
10649 rc = VMXReadVmcs64(VMX_VMCS_HOST_SYSENTER_EIP, &u64Val);
10650 AssertRCBreak(rc);
10651 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(u64Val), VMX_IGS_SYSENTER_EIP_NOT_CANONICAL);
10652#endif
10653
10654 /*
10655 * PERF_GLOBAL MSR.
10656 */
10657 if (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_PERF_MSR)
10658 {
10659 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PERF_GLOBAL_CTRL_FULL, &u64Val);
10660 AssertRCBreak(rc);
10661 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0xfffffff8fffffffc)),
10662 VMX_IGS_PERF_GLOBAL_MSR_RESERVED); /* Bits 63:35, bits 31:2 MBZ. */
10663 }
10664
10665 /*
10666 * PAT MSR.
10667 */
10668 if (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_PAT_MSR)
10669 {
10670 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PAT_FULL, &u64Val);
10671 AssertRCBreak(rc);
10672 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0x707070707070707)), VMX_IGS_PAT_MSR_RESERVED);
10673 for (unsigned i = 0; i < 8; i++)
10674 {
10675 uint8_t u8Val = (u64Val & 0xff);
10676 if ( u8Val != 0 /* UC */
10677 && u8Val != 1 /* WC */
10678 && u8Val != 4 /* WT */
10679 && u8Val != 5 /* WP */
10680 && u8Val != 6 /* WB */
10681 && u8Val != 7 /* UC- */)
10682 {
10683 HMVMX_ERROR_BREAK(VMX_IGS_PAT_MSR_INVALID);
10684 }
10685 u64Val >>= 8;
10686 }
10687 }
10688
10689 /*
10690 * EFER MSR.
10691 */
10692 if (pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_LOAD_EFER_MSR)
10693 {
10694 Assert(pVM->hm.s.vmx.fSupportsVmcsEfer);
10695 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_EFER_FULL, &u64Val);
10696 AssertRCBreak(rc);
10697 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0xfffffffffffff2fe)),
10698 VMX_IGS_EFER_MSR_RESERVED); /* Bits 63:12, bit 9, bits 7:1 MBZ. */
10699 HMVMX_CHECK_BREAK(RT_BOOL(u64Val & MSR_K6_EFER_LMA) == RT_BOOL( pVCpu->hm.s.vmx.u32EntryCtls
10700 & VMX_ENTRY_CTLS_IA32E_MODE_GUEST),
10701 VMX_IGS_EFER_LMA_GUEST_MODE_MISMATCH);
10702 /** @todo r=ramshankar: Unrestricted check here is probably wrong, see
10703 * iemVmxVmentryCheckGuestState(). */
10704 HMVMX_CHECK_BREAK( fUnrestrictedGuest
10705 || !(u32GuestCr0 & X86_CR0_PG)
10706 || RT_BOOL(u64Val & MSR_K6_EFER_LMA) == RT_BOOL(u64Val & MSR_K6_EFER_LME),
10707 VMX_IGS_EFER_LMA_LME_MISMATCH);
10708 }
10709
10710 /*
10711 * Segment registers.
10712 */
10713 HMVMX_CHECK_BREAK( (pCtx->ldtr.Attr.u & X86DESCATTR_UNUSABLE)
10714 || !(pCtx->ldtr.Sel & X86_SEL_LDT), VMX_IGS_LDTR_TI_INVALID);
10715 if (!(u32Eflags & X86_EFL_VM))
10716 {
10717 /* CS */
10718 HMVMX_CHECK_BREAK(pCtx->cs.Attr.n.u1Present, VMX_IGS_CS_ATTR_P_INVALID);
10719 HMVMX_CHECK_BREAK(!(pCtx->cs.Attr.u & 0xf00), VMX_IGS_CS_ATTR_RESERVED);
10720 HMVMX_CHECK_BREAK(!(pCtx->cs.Attr.u & 0xfffe0000), VMX_IGS_CS_ATTR_RESERVED);
10721 HMVMX_CHECK_BREAK( (pCtx->cs.u32Limit & 0xfff) == 0xfff
10722 || !(pCtx->cs.Attr.n.u1Granularity), VMX_IGS_CS_ATTR_G_INVALID);
10723 HMVMX_CHECK_BREAK( !(pCtx->cs.u32Limit & 0xfff00000)
10724 || (pCtx->cs.Attr.n.u1Granularity), VMX_IGS_CS_ATTR_G_INVALID);
10725 /* CS cannot be loaded with NULL in protected mode. */
10726 HMVMX_CHECK_BREAK(pCtx->cs.Attr.u && !(pCtx->cs.Attr.u & X86DESCATTR_UNUSABLE), VMX_IGS_CS_ATTR_UNUSABLE);
10727 HMVMX_CHECK_BREAK(pCtx->cs.Attr.n.u1DescType, VMX_IGS_CS_ATTR_S_INVALID);
10728 if (pCtx->cs.Attr.n.u4Type == 9 || pCtx->cs.Attr.n.u4Type == 11)
10729 HMVMX_CHECK_BREAK(pCtx->cs.Attr.n.u2Dpl == pCtx->ss.Attr.n.u2Dpl, VMX_IGS_CS_SS_ATTR_DPL_UNEQUAL);
10730 else if (pCtx->cs.Attr.n.u4Type == 13 || pCtx->cs.Attr.n.u4Type == 15)
10731 HMVMX_CHECK_BREAK(pCtx->cs.Attr.n.u2Dpl <= pCtx->ss.Attr.n.u2Dpl, VMX_IGS_CS_SS_ATTR_DPL_MISMATCH);
10732 else if (pVM->hm.s.vmx.fUnrestrictedGuest && pCtx->cs.Attr.n.u4Type == 3)
10733 HMVMX_CHECK_BREAK(pCtx->cs.Attr.n.u2Dpl == 0, VMX_IGS_CS_ATTR_DPL_INVALID);
10734 else
10735 HMVMX_ERROR_BREAK(VMX_IGS_CS_ATTR_TYPE_INVALID);
10736
10737 /* SS */
10738 HMVMX_CHECK_BREAK( pVM->hm.s.vmx.fUnrestrictedGuest
10739 || (pCtx->ss.Sel & X86_SEL_RPL) == (pCtx->cs.Sel & X86_SEL_RPL), VMX_IGS_SS_CS_RPL_UNEQUAL);
10740 HMVMX_CHECK_BREAK(pCtx->ss.Attr.n.u2Dpl == (pCtx->ss.Sel & X86_SEL_RPL), VMX_IGS_SS_ATTR_DPL_RPL_UNEQUAL);
10741 if ( !(pCtx->cr0 & X86_CR0_PE)
10742 || pCtx->cs.Attr.n.u4Type == 3)
10743 {
10744 HMVMX_CHECK_BREAK(!pCtx->ss.Attr.n.u2Dpl, VMX_IGS_SS_ATTR_DPL_INVALID);
10745 }
10746 if (!(pCtx->ss.Attr.u & X86DESCATTR_UNUSABLE))
10747 {
10748 HMVMX_CHECK_BREAK(pCtx->ss.Attr.n.u4Type == 3 || pCtx->ss.Attr.n.u4Type == 7, VMX_IGS_SS_ATTR_TYPE_INVALID);
10749 HMVMX_CHECK_BREAK(pCtx->ss.Attr.n.u1Present, VMX_IGS_SS_ATTR_P_INVALID);
10750 HMVMX_CHECK_BREAK(!(pCtx->ss.Attr.u & 0xf00), VMX_IGS_SS_ATTR_RESERVED);
10751 HMVMX_CHECK_BREAK(!(pCtx->ss.Attr.u & 0xfffe0000), VMX_IGS_SS_ATTR_RESERVED);
10752 HMVMX_CHECK_BREAK( (pCtx->ss.u32Limit & 0xfff) == 0xfff
10753 || !(pCtx->ss.Attr.n.u1Granularity), VMX_IGS_SS_ATTR_G_INVALID);
10754 HMVMX_CHECK_BREAK( !(pCtx->ss.u32Limit & 0xfff00000)
10755 || (pCtx->ss.Attr.n.u1Granularity), VMX_IGS_SS_ATTR_G_INVALID);
10756 }
10757
10758 /* DS, ES, FS, GS - only check for usable selectors, see hmR0VmxExportGuestSegmenReg(). */
10759 if (!(pCtx->ds.Attr.u & X86DESCATTR_UNUSABLE))
10760 {
10761 HMVMX_CHECK_BREAK(pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED, VMX_IGS_DS_ATTR_A_INVALID);
10762 HMVMX_CHECK_BREAK(pCtx->ds.Attr.n.u1Present, VMX_IGS_DS_ATTR_P_INVALID);
10763 HMVMX_CHECK_BREAK( pVM->hm.s.vmx.fUnrestrictedGuest
10764 || pCtx->ds.Attr.n.u4Type > 11
10765 || pCtx->ds.Attr.n.u2Dpl >= (pCtx->ds.Sel & X86_SEL_RPL), VMX_IGS_DS_ATTR_DPL_RPL_UNEQUAL);
10766 HMVMX_CHECK_BREAK(!(pCtx->ds.Attr.u & 0xf00), VMX_IGS_DS_ATTR_RESERVED);
10767 HMVMX_CHECK_BREAK(!(pCtx->ds.Attr.u & 0xfffe0000), VMX_IGS_DS_ATTR_RESERVED);
10768 HMVMX_CHECK_BREAK( (pCtx->ds.u32Limit & 0xfff) == 0xfff
10769 || !(pCtx->ds.Attr.n.u1Granularity), VMX_IGS_DS_ATTR_G_INVALID);
10770 HMVMX_CHECK_BREAK( !(pCtx->ds.u32Limit & 0xfff00000)
10771 || (pCtx->ds.Attr.n.u1Granularity), VMX_IGS_DS_ATTR_G_INVALID);
10772 HMVMX_CHECK_BREAK( !(pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_CODE)
10773 || (pCtx->ds.Attr.n.u4Type & X86_SEL_TYPE_READ), VMX_IGS_DS_ATTR_TYPE_INVALID);
10774 }
10775 if (!(pCtx->es.Attr.u & X86DESCATTR_UNUSABLE))
10776 {
10777 HMVMX_CHECK_BREAK(pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED, VMX_IGS_ES_ATTR_A_INVALID);
10778 HMVMX_CHECK_BREAK(pCtx->es.Attr.n.u1Present, VMX_IGS_ES_ATTR_P_INVALID);
10779 HMVMX_CHECK_BREAK( pVM->hm.s.vmx.fUnrestrictedGuest
10780 || pCtx->es.Attr.n.u4Type > 11
10781 || pCtx->es.Attr.n.u2Dpl >= (pCtx->es.Sel & X86_SEL_RPL), VMX_IGS_DS_ATTR_DPL_RPL_UNEQUAL);
10782 HMVMX_CHECK_BREAK(!(pCtx->es.Attr.u & 0xf00), VMX_IGS_ES_ATTR_RESERVED);
10783 HMVMX_CHECK_BREAK(!(pCtx->es.Attr.u & 0xfffe0000), VMX_IGS_ES_ATTR_RESERVED);
10784 HMVMX_CHECK_BREAK( (pCtx->es.u32Limit & 0xfff) == 0xfff
10785 || !(pCtx->es.Attr.n.u1Granularity), VMX_IGS_ES_ATTR_G_INVALID);
10786 HMVMX_CHECK_BREAK( !(pCtx->es.u32Limit & 0xfff00000)
10787 || (pCtx->es.Attr.n.u1Granularity), VMX_IGS_ES_ATTR_G_INVALID);
10788 HMVMX_CHECK_BREAK( !(pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_CODE)
10789 || (pCtx->es.Attr.n.u4Type & X86_SEL_TYPE_READ), VMX_IGS_ES_ATTR_TYPE_INVALID);
10790 }
10791 if (!(pCtx->fs.Attr.u & X86DESCATTR_UNUSABLE))
10792 {
10793 HMVMX_CHECK_BREAK(pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED, VMX_IGS_FS_ATTR_A_INVALID);
10794 HMVMX_CHECK_BREAK(pCtx->fs.Attr.n.u1Present, VMX_IGS_FS_ATTR_P_INVALID);
10795 HMVMX_CHECK_BREAK( pVM->hm.s.vmx.fUnrestrictedGuest
10796 || pCtx->fs.Attr.n.u4Type > 11
10797 || pCtx->fs.Attr.n.u2Dpl >= (pCtx->fs.Sel & X86_SEL_RPL), VMX_IGS_FS_ATTR_DPL_RPL_UNEQUAL);
10798 HMVMX_CHECK_BREAK(!(pCtx->fs.Attr.u & 0xf00), VMX_IGS_FS_ATTR_RESERVED);
10799 HMVMX_CHECK_BREAK(!(pCtx->fs.Attr.u & 0xfffe0000), VMX_IGS_FS_ATTR_RESERVED);
10800 HMVMX_CHECK_BREAK( (pCtx->fs.u32Limit & 0xfff) == 0xfff
10801 || !(pCtx->fs.Attr.n.u1Granularity), VMX_IGS_FS_ATTR_G_INVALID);
10802 HMVMX_CHECK_BREAK( !(pCtx->fs.u32Limit & 0xfff00000)
10803 || (pCtx->fs.Attr.n.u1Granularity), VMX_IGS_FS_ATTR_G_INVALID);
10804 HMVMX_CHECK_BREAK( !(pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_CODE)
10805 || (pCtx->fs.Attr.n.u4Type & X86_SEL_TYPE_READ), VMX_IGS_FS_ATTR_TYPE_INVALID);
10806 }
10807 if (!(pCtx->gs.Attr.u & X86DESCATTR_UNUSABLE))
10808 {
10809 HMVMX_CHECK_BREAK(pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_ACCESSED, VMX_IGS_GS_ATTR_A_INVALID);
10810 HMVMX_CHECK_BREAK(pCtx->gs.Attr.n.u1Present, VMX_IGS_GS_ATTR_P_INVALID);
10811 HMVMX_CHECK_BREAK( pVM->hm.s.vmx.fUnrestrictedGuest
10812 || pCtx->gs.Attr.n.u4Type > 11
10813 || pCtx->gs.Attr.n.u2Dpl >= (pCtx->gs.Sel & X86_SEL_RPL), VMX_IGS_GS_ATTR_DPL_RPL_UNEQUAL);
10814 HMVMX_CHECK_BREAK(!(pCtx->gs.Attr.u & 0xf00), VMX_IGS_GS_ATTR_RESERVED);
10815 HMVMX_CHECK_BREAK(!(pCtx->gs.Attr.u & 0xfffe0000), VMX_IGS_GS_ATTR_RESERVED);
10816 HMVMX_CHECK_BREAK( (pCtx->gs.u32Limit & 0xfff) == 0xfff
10817 || !(pCtx->gs.Attr.n.u1Granularity), VMX_IGS_GS_ATTR_G_INVALID);
10818 HMVMX_CHECK_BREAK( !(pCtx->gs.u32Limit & 0xfff00000)
10819 || (pCtx->gs.Attr.n.u1Granularity), VMX_IGS_GS_ATTR_G_INVALID);
10820 HMVMX_CHECK_BREAK( !(pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_CODE)
10821 || (pCtx->gs.Attr.n.u4Type & X86_SEL_TYPE_READ), VMX_IGS_GS_ATTR_TYPE_INVALID);
10822 }
10823 /* 64-bit capable CPUs. */
10824#if HC_ARCH_BITS == 64
10825 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(pCtx->fs.u64Base), VMX_IGS_FS_BASE_NOT_CANONICAL);
10826 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(pCtx->gs.u64Base), VMX_IGS_GS_BASE_NOT_CANONICAL);
10827 HMVMX_CHECK_BREAK( (pCtx->ldtr.Attr.u & X86DESCATTR_UNUSABLE)
10828 || X86_IS_CANONICAL(pCtx->ldtr.u64Base), VMX_IGS_LDTR_BASE_NOT_CANONICAL);
10829 HMVMX_CHECK_BREAK(!RT_HI_U32(pCtx->cs.u64Base), VMX_IGS_LONGMODE_CS_BASE_INVALID);
10830 HMVMX_CHECK_BREAK((pCtx->ss.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->ss.u64Base),
10831 VMX_IGS_LONGMODE_SS_BASE_INVALID);
10832 HMVMX_CHECK_BREAK((pCtx->ds.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->ds.u64Base),
10833 VMX_IGS_LONGMODE_DS_BASE_INVALID);
10834 HMVMX_CHECK_BREAK((pCtx->es.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->es.u64Base),
10835 VMX_IGS_LONGMODE_ES_BASE_INVALID);
10836#endif
10837 }
10838 else
10839 {
10840 /* V86 mode checks. */
10841 uint32_t u32CSAttr, u32SSAttr, u32DSAttr, u32ESAttr, u32FSAttr, u32GSAttr;
10842 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
10843 {
10844 u32CSAttr = 0xf3; u32SSAttr = 0xf3;
10845 u32DSAttr = 0xf3; u32ESAttr = 0xf3;
10846 u32FSAttr = 0xf3; u32GSAttr = 0xf3;
10847 }
10848 else
10849 {
10850 u32CSAttr = pCtx->cs.Attr.u; u32SSAttr = pCtx->ss.Attr.u;
10851 u32DSAttr = pCtx->ds.Attr.u; u32ESAttr = pCtx->es.Attr.u;
10852 u32FSAttr = pCtx->fs.Attr.u; u32GSAttr = pCtx->gs.Attr.u;
10853 }
10854
10855 /* CS */
10856 HMVMX_CHECK_BREAK((pCtx->cs.u64Base == (uint64_t)pCtx->cs.Sel << 4), VMX_IGS_V86_CS_BASE_INVALID);
10857 HMVMX_CHECK_BREAK(pCtx->cs.u32Limit == 0xffff, VMX_IGS_V86_CS_LIMIT_INVALID);
10858 HMVMX_CHECK_BREAK(u32CSAttr == 0xf3, VMX_IGS_V86_CS_ATTR_INVALID);
10859 /* SS */
10860 HMVMX_CHECK_BREAK((pCtx->ss.u64Base == (uint64_t)pCtx->ss.Sel << 4), VMX_IGS_V86_SS_BASE_INVALID);
10861 HMVMX_CHECK_BREAK(pCtx->ss.u32Limit == 0xffff, VMX_IGS_V86_SS_LIMIT_INVALID);
10862 HMVMX_CHECK_BREAK(u32SSAttr == 0xf3, VMX_IGS_V86_SS_ATTR_INVALID);
10863 /* DS */
10864 HMVMX_CHECK_BREAK((pCtx->ds.u64Base == (uint64_t)pCtx->ds.Sel << 4), VMX_IGS_V86_DS_BASE_INVALID);
10865 HMVMX_CHECK_BREAK(pCtx->ds.u32Limit == 0xffff, VMX_IGS_V86_DS_LIMIT_INVALID);
10866 HMVMX_CHECK_BREAK(u32DSAttr == 0xf3, VMX_IGS_V86_DS_ATTR_INVALID);
10867 /* ES */
10868 HMVMX_CHECK_BREAK((pCtx->es.u64Base == (uint64_t)pCtx->es.Sel << 4), VMX_IGS_V86_ES_BASE_INVALID);
10869 HMVMX_CHECK_BREAK(pCtx->es.u32Limit == 0xffff, VMX_IGS_V86_ES_LIMIT_INVALID);
10870 HMVMX_CHECK_BREAK(u32ESAttr == 0xf3, VMX_IGS_V86_ES_ATTR_INVALID);
10871 /* FS */
10872 HMVMX_CHECK_BREAK((pCtx->fs.u64Base == (uint64_t)pCtx->fs.Sel << 4), VMX_IGS_V86_FS_BASE_INVALID);
10873 HMVMX_CHECK_BREAK(pCtx->fs.u32Limit == 0xffff, VMX_IGS_V86_FS_LIMIT_INVALID);
10874 HMVMX_CHECK_BREAK(u32FSAttr == 0xf3, VMX_IGS_V86_FS_ATTR_INVALID);
10875 /* GS */
10876 HMVMX_CHECK_BREAK((pCtx->gs.u64Base == (uint64_t)pCtx->gs.Sel << 4), VMX_IGS_V86_GS_BASE_INVALID);
10877 HMVMX_CHECK_BREAK(pCtx->gs.u32Limit == 0xffff, VMX_IGS_V86_GS_LIMIT_INVALID);
10878 HMVMX_CHECK_BREAK(u32GSAttr == 0xf3, VMX_IGS_V86_GS_ATTR_INVALID);
10879 /* 64-bit capable CPUs. */
10880#if HC_ARCH_BITS == 64
10881 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(pCtx->fs.u64Base), VMX_IGS_FS_BASE_NOT_CANONICAL);
10882 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(pCtx->gs.u64Base), VMX_IGS_GS_BASE_NOT_CANONICAL);
10883 HMVMX_CHECK_BREAK( (pCtx->ldtr.Attr.u & X86DESCATTR_UNUSABLE)
10884 || X86_IS_CANONICAL(pCtx->ldtr.u64Base), VMX_IGS_LDTR_BASE_NOT_CANONICAL);
10885 HMVMX_CHECK_BREAK(!RT_HI_U32(pCtx->cs.u64Base), VMX_IGS_LONGMODE_CS_BASE_INVALID);
10886 HMVMX_CHECK_BREAK((pCtx->ss.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->ss.u64Base),
10887 VMX_IGS_LONGMODE_SS_BASE_INVALID);
10888 HMVMX_CHECK_BREAK((pCtx->ds.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->ds.u64Base),
10889 VMX_IGS_LONGMODE_DS_BASE_INVALID);
10890 HMVMX_CHECK_BREAK((pCtx->es.Attr.u & X86DESCATTR_UNUSABLE) || !RT_HI_U32(pCtx->es.u64Base),
10891 VMX_IGS_LONGMODE_ES_BASE_INVALID);
10892#endif
10893 }
10894
10895 /*
10896 * TR.
10897 */
10898 HMVMX_CHECK_BREAK(!(pCtx->tr.Sel & X86_SEL_LDT), VMX_IGS_TR_TI_INVALID);
10899 /* 64-bit capable CPUs. */
10900#if HC_ARCH_BITS == 64
10901 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(pCtx->tr.u64Base), VMX_IGS_TR_BASE_NOT_CANONICAL);
10902#endif
10903 if (fLongModeGuest)
10904 {
10905 HMVMX_CHECK_BREAK(pCtx->tr.Attr.n.u4Type == 11, /* 64-bit busy TSS. */
10906 VMX_IGS_LONGMODE_TR_ATTR_TYPE_INVALID);
10907 }
10908 else
10909 {
10910 HMVMX_CHECK_BREAK( pCtx->tr.Attr.n.u4Type == 3 /* 16-bit busy TSS. */
10911 || pCtx->tr.Attr.n.u4Type == 11, /* 32-bit busy TSS.*/
10912 VMX_IGS_TR_ATTR_TYPE_INVALID);
10913 }
10914 HMVMX_CHECK_BREAK(!pCtx->tr.Attr.n.u1DescType, VMX_IGS_TR_ATTR_S_INVALID);
10915 HMVMX_CHECK_BREAK(pCtx->tr.Attr.n.u1Present, VMX_IGS_TR_ATTR_P_INVALID);
10916 HMVMX_CHECK_BREAK(!(pCtx->tr.Attr.u & 0xf00), VMX_IGS_TR_ATTR_RESERVED); /* Bits 11:8 MBZ. */
10917 HMVMX_CHECK_BREAK( (pCtx->tr.u32Limit & 0xfff) == 0xfff
10918 || !(pCtx->tr.Attr.n.u1Granularity), VMX_IGS_TR_ATTR_G_INVALID);
10919 HMVMX_CHECK_BREAK( !(pCtx->tr.u32Limit & 0xfff00000)
10920 || (pCtx->tr.Attr.n.u1Granularity), VMX_IGS_TR_ATTR_G_INVALID);
10921 HMVMX_CHECK_BREAK(!(pCtx->tr.Attr.u & X86DESCATTR_UNUSABLE), VMX_IGS_TR_ATTR_UNUSABLE);
10922
10923 /*
10924 * GDTR and IDTR.
10925 */
10926#if HC_ARCH_BITS == 64
10927 rc = VMXReadVmcs64(VMX_VMCS_GUEST_GDTR_BASE, &u64Val);
10928 AssertRCBreak(rc);
10929 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(u64Val), VMX_IGS_GDTR_BASE_NOT_CANONICAL);
10930
10931 rc = VMXReadVmcs64(VMX_VMCS_GUEST_IDTR_BASE, &u64Val);
10932 AssertRCBreak(rc);
10933 HMVMX_CHECK_BREAK(X86_IS_CANONICAL(u64Val), VMX_IGS_IDTR_BASE_NOT_CANONICAL);
10934#endif
10935
10936 rc = VMXReadVmcs32(VMX_VMCS32_GUEST_GDTR_LIMIT, &u32Val);
10937 AssertRCBreak(rc);
10938 HMVMX_CHECK_BREAK(!(u32Val & 0xffff0000), VMX_IGS_GDTR_LIMIT_INVALID); /* Bits 31:16 MBZ. */
10939
10940 rc = VMXReadVmcs32(VMX_VMCS32_GUEST_IDTR_LIMIT, &u32Val);
10941 AssertRCBreak(rc);
10942 HMVMX_CHECK_BREAK(!(u32Val & 0xffff0000), VMX_IGS_IDTR_LIMIT_INVALID); /* Bits 31:16 MBZ. */
10943
10944 /*
10945 * Guest Non-Register State.
10946 */
10947 /* Activity State. */
10948 uint32_t u32ActivityState;
10949 rc = VMXReadVmcs32(VMX_VMCS32_GUEST_ACTIVITY_STATE, &u32ActivityState);
10950 AssertRCBreak(rc);
10951 HMVMX_CHECK_BREAK( !u32ActivityState
10952 || (u32ActivityState & RT_BF_GET(pVM->hm.s.vmx.Msrs.u64Misc, VMX_BF_MISC_ACTIVITY_STATES)),
10953 VMX_IGS_ACTIVITY_STATE_INVALID);
10954 HMVMX_CHECK_BREAK( !(pCtx->ss.Attr.n.u2Dpl)
10955 || u32ActivityState != VMX_VMCS_GUEST_ACTIVITY_HLT, VMX_IGS_ACTIVITY_STATE_HLT_INVALID);
10956 uint32_t u32IntrState;
10957 rc = VMXReadVmcs32(VMX_VMCS32_GUEST_INT_STATE, &u32IntrState);
10958 AssertRCBreak(rc);
10959 if ( u32IntrState == VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS
10960 || u32IntrState == VMX_VMCS_GUEST_INT_STATE_BLOCK_STI)
10961 {
10962 HMVMX_CHECK_BREAK(u32ActivityState == VMX_VMCS_GUEST_ACTIVITY_ACTIVE, VMX_IGS_ACTIVITY_STATE_ACTIVE_INVALID);
10963 }
10964
10965 /** @todo Activity state and injecting interrupts. Left as a todo since we
10966 * currently don't use activity states but ACTIVE. */
10967
10968 HMVMX_CHECK_BREAK( !(pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_ENTRY_TO_SMM)
10969 || u32ActivityState != VMX_VMCS_GUEST_ACTIVITY_SIPI_WAIT, VMX_IGS_ACTIVITY_STATE_SIPI_WAIT_INVALID);
10970
10971 /* Guest interruptibility-state. */
10972 HMVMX_CHECK_BREAK(!(u32IntrState & 0xffffffe0), VMX_IGS_INTERRUPTIBILITY_STATE_RESERVED);
10973 HMVMX_CHECK_BREAK((u32IntrState & (VMX_VMCS_GUEST_INT_STATE_BLOCK_STI | VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS))
10974 != (VMX_VMCS_GUEST_INT_STATE_BLOCK_STI | VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS),
10975 VMX_IGS_INTERRUPTIBILITY_STATE_STI_MOVSS_INVALID);
10976 HMVMX_CHECK_BREAK( (u32Eflags & X86_EFL_IF)
10977 || !(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI),
10978 VMX_IGS_INTERRUPTIBILITY_STATE_STI_EFL_INVALID);
10979 if (VMX_ENTRY_INT_INFO_IS_VALID(u32EntryInfo))
10980 {
10981 if (VMX_ENTRY_INT_INFO_TYPE(u32EntryInfo) == VMX_EXIT_INT_INFO_TYPE_EXT_INT)
10982 {
10983 HMVMX_CHECK_BREAK( !(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI)
10984 && !(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS),
10985 VMX_IGS_INTERRUPTIBILITY_STATE_EXT_INT_INVALID);
10986 }
10987 else if (VMX_ENTRY_INT_INFO_TYPE(u32EntryInfo) == VMX_EXIT_INT_INFO_TYPE_NMI)
10988 {
10989 HMVMX_CHECK_BREAK(!(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS),
10990 VMX_IGS_INTERRUPTIBILITY_STATE_MOVSS_INVALID);
10991 HMVMX_CHECK_BREAK(!(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI),
10992 VMX_IGS_INTERRUPTIBILITY_STATE_STI_INVALID);
10993 }
10994 }
10995 /** @todo Assumes the processor is not in SMM. */
10996 HMVMX_CHECK_BREAK(!(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_SMI),
10997 VMX_IGS_INTERRUPTIBILITY_STATE_SMI_INVALID);
10998 HMVMX_CHECK_BREAK( !(pVCpu->hm.s.vmx.u32EntryCtls & VMX_ENTRY_CTLS_ENTRY_TO_SMM)
10999 || (u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_SMI),
11000 VMX_IGS_INTERRUPTIBILITY_STATE_SMI_SMM_INVALID);
11001 if ( (pVCpu->hm.s.vmx.u32PinCtls & VMX_PIN_CTLS_VIRT_NMI)
11002 && VMX_ENTRY_INT_INFO_IS_VALID(u32EntryInfo)
11003 && VMX_ENTRY_INT_INFO_TYPE(u32EntryInfo) == VMX_EXIT_INT_INFO_TYPE_NMI)
11004 {
11005 HMVMX_CHECK_BREAK(!(u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_NMI),
11006 VMX_IGS_INTERRUPTIBILITY_STATE_NMI_INVALID);
11007 }
11008
11009 /* Pending debug exceptions. */
11010#if HC_ARCH_BITS == 64
11011 rc = VMXReadVmcs64(VMX_VMCS_GUEST_PENDING_DEBUG_XCPTS, &u64Val);
11012 AssertRCBreak(rc);
11013 /* Bits 63:15, Bit 13, Bits 11:4 MBZ. */
11014 HMVMX_CHECK_BREAK(!(u64Val & UINT64_C(0xffffffffffffaff0)), VMX_IGS_LONGMODE_PENDING_DEBUG_RESERVED);
11015 u32Val = u64Val; /* For pending debug exceptions checks below. */
11016#else
11017 rc = VMXReadVmcs32(VMX_VMCS_GUEST_PENDING_DEBUG_XCPTS, &u32Val);
11018 AssertRCBreak(rc);
11019 /* Bits 31:15, Bit 13, Bits 11:4 MBZ. */
11020 HMVMX_CHECK_BREAK(!(u32Val & 0xffffaff0), VMX_IGS_PENDING_DEBUG_RESERVED);
11021#endif
11022
11023 if ( (u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI)
11024 || (u32IntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS)
11025 || u32ActivityState == VMX_VMCS_GUEST_ACTIVITY_HLT)
11026 {
11027 if ( (u32Eflags & X86_EFL_TF)
11028 && !(u64DebugCtlMsr & RT_BIT_64(1))) /* Bit 1 is IA32_DEBUGCTL.BTF. */
11029 {
11030 /* Bit 14 is PendingDebug.BS. */
11031 HMVMX_CHECK_BREAK(u32Val & RT_BIT(14), VMX_IGS_PENDING_DEBUG_XCPT_BS_NOT_SET);
11032 }
11033 if ( !(u32Eflags & X86_EFL_TF)
11034 || (u64DebugCtlMsr & RT_BIT_64(1))) /* Bit 1 is IA32_DEBUGCTL.BTF. */
11035 {
11036 /* Bit 14 is PendingDebug.BS. */
11037 HMVMX_CHECK_BREAK(!(u32Val & RT_BIT(14)), VMX_IGS_PENDING_DEBUG_XCPT_BS_NOT_CLEAR);
11038 }
11039 }
11040
11041 /* VMCS link pointer. */
11042 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_VMCS_LINK_PTR_FULL, &u64Val);
11043 AssertRCBreak(rc);
11044 if (u64Val != UINT64_C(0xffffffffffffffff))
11045 {
11046 HMVMX_CHECK_BREAK(!(u64Val & 0xfff), VMX_IGS_VMCS_LINK_PTR_RESERVED);
11047 /** @todo Bits beyond the processor's physical-address width MBZ. */
11048 /** @todo 32-bit located in memory referenced by value of this field (as a
11049 * physical address) must contain the processor's VMCS revision ID. */
11050 /** @todo SMM checks. */
11051 }
11052
11053 /** @todo Checks on Guest Page-Directory-Pointer-Table Entries when guest is
11054 * not using Nested Paging? */
11055 if ( pVM->hm.s.fNestedPaging
11056 && !fLongModeGuest
11057 && CPUMIsGuestInPAEModeEx(pCtx))
11058 {
11059 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE0_FULL, &u64Val);
11060 AssertRCBreak(rc);
11061 HMVMX_CHECK_BREAK(!(u64Val & X86_PDPE_PAE_MBZ_MASK), VMX_IGS_PAE_PDPTE_RESERVED);
11062
11063 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE1_FULL, &u64Val);
11064 AssertRCBreak(rc);
11065 HMVMX_CHECK_BREAK(!(u64Val & X86_PDPE_PAE_MBZ_MASK), VMX_IGS_PAE_PDPTE_RESERVED);
11066
11067 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE2_FULL, &u64Val);
11068 AssertRCBreak(rc);
11069 HMVMX_CHECK_BREAK(!(u64Val & X86_PDPE_PAE_MBZ_MASK), VMX_IGS_PAE_PDPTE_RESERVED);
11070
11071 rc = VMXReadVmcs64(VMX_VMCS64_GUEST_PDPTE3_FULL, &u64Val);
11072 AssertRCBreak(rc);
11073 HMVMX_CHECK_BREAK(!(u64Val & X86_PDPE_PAE_MBZ_MASK), VMX_IGS_PAE_PDPTE_RESERVED);
11074 }
11075
11076 /* Shouldn't happen but distinguish it from AssertRCBreak() errors. */
11077 if (uError == VMX_IGS_ERROR)
11078 uError = VMX_IGS_REASON_NOT_FOUND;
11079 } while (0);
11080
11081 pVCpu->hm.s.u32HMError = uError;
11082 return uError;
11083
11084#undef HMVMX_ERROR_BREAK
11085#undef HMVMX_CHECK_BREAK
11086}
11087
11088
11089/** @name VM-exit handlers.
11090 * @{
11091 */
11092/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
11093/* -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=- VM-exit handlers -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=- */
11094/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
11095
11096/**
11097 * VM-exit handler for external interrupts (VMX_EXIT_EXT_INT).
11098 */
11099HMVMX_EXIT_DECL hmR0VmxExitExtInt(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11100{
11101 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11102 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitExtInt);
11103 /* Windows hosts (32-bit and 64-bit) have DPC latency issues. See @bugref{6853}. */
11104 if (VMMR0ThreadCtxHookIsEnabled(pVCpu))
11105 return VINF_SUCCESS;
11106 return VINF_EM_RAW_INTERRUPT;
11107}
11108
11109
11110/**
11111 * VM-exit handler for exceptions or NMIs (VMX_EXIT_XCPT_OR_NMI).
11112 */
11113HMVMX_EXIT_DECL hmR0VmxExitXcptOrNmi(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11114{
11115 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11116 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatExitXcptNmi, y3);
11117
11118 int rc = hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
11119 AssertRCReturn(rc, rc);
11120
11121 uint32_t uIntType = VMX_EXIT_INT_INFO_TYPE(pVmxTransient->uExitIntInfo);
11122 Assert( !(pVCpu->hm.s.vmx.u32ExitCtls & VMX_EXIT_CTLS_ACK_EXT_INT)
11123 && uIntType != VMX_EXIT_INT_INFO_TYPE_EXT_INT);
11124 Assert(VMX_EXIT_INT_INFO_IS_VALID(pVmxTransient->uExitIntInfo));
11125
11126 if (uIntType == VMX_EXIT_INT_INFO_TYPE_NMI)
11127 {
11128 /*
11129 * This cannot be a guest NMI as the only way for the guest to receive an NMI is if we
11130 * injected it ourselves and anything we inject is not going to cause a VM-exit directly
11131 * for the event being injected[1]. Go ahead and dispatch the NMI to the host[2].
11132 *
11133 * [1] -- See Intel spec. 27.2.3 "Information for VM Exits During Event Delivery".
11134 * [2] -- See Intel spec. 27.5.5 "Updating Non-Register State".
11135 */
11136 VMXDispatchHostNmi();
11137 STAM_REL_COUNTER_INC(&pVCpu->hm.s.StatExitHostNmiInGC);
11138 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitXcptNmi, y3);
11139 return VINF_SUCCESS;
11140 }
11141
11142 /* If this VM-exit occurred while delivering an event through the guest IDT, handle it accordingly. */
11143 VBOXSTRICTRC rcStrictRc1 = hmR0VmxCheckExitDueToEventDelivery(pVCpu, pVmxTransient);
11144 if (RT_UNLIKELY(rcStrictRc1 == VINF_SUCCESS))
11145 { /* likely */ }
11146 else
11147 {
11148 if (rcStrictRc1 == VINF_HM_DOUBLE_FAULT)
11149 rcStrictRc1 = VINF_SUCCESS;
11150 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitXcptNmi, y3);
11151 return rcStrictRc1;
11152 }
11153
11154 uint32_t uExitIntInfo = pVmxTransient->uExitIntInfo;
11155 uint32_t uVector = VMX_EXIT_INT_INFO_VECTOR(uExitIntInfo);
11156 switch (uIntType)
11157 {
11158 case VMX_EXIT_INT_INFO_TYPE_PRIV_SW_XCPT: /* Privileged software exception. (#DB from ICEBP) */
11159 Assert(uVector == X86_XCPT_DB);
11160 RT_FALL_THRU();
11161 case VMX_EXIT_INT_INFO_TYPE_SW_XCPT: /* Software exception. (#BP or #OF) */
11162 Assert(uVector == X86_XCPT_BP || uVector == X86_XCPT_OF || uIntType == VMX_EXIT_INT_INFO_TYPE_PRIV_SW_XCPT);
11163 RT_FALL_THRU();
11164 case VMX_EXIT_INT_INFO_TYPE_HW_XCPT:
11165 {
11166 /*
11167 * If there's any exception caused as a result of event injection, the resulting
11168 * secondary/final execption will be pending, we shall continue guest execution
11169 * after injecting the event. The page-fault case is complicated and we manually
11170 * handle any currently pending event in hmR0VmxExitXcptPF.
11171 */
11172 if (!pVCpu->hm.s.Event.fPending)
11173 { /* likely */ }
11174 else if (uVector != X86_XCPT_PF)
11175 {
11176 rc = VINF_SUCCESS;
11177 break;
11178 }
11179
11180 switch (uVector)
11181 {
11182 case X86_XCPT_PF: rc = hmR0VmxExitXcptPF(pVCpu, pVmxTransient); break;
11183 case X86_XCPT_GP: rc = hmR0VmxExitXcptGP(pVCpu, pVmxTransient); break;
11184 case X86_XCPT_MF: rc = hmR0VmxExitXcptMF(pVCpu, pVmxTransient); break;
11185 case X86_XCPT_DB: rc = hmR0VmxExitXcptDB(pVCpu, pVmxTransient); break;
11186 case X86_XCPT_BP: rc = hmR0VmxExitXcptBP(pVCpu, pVmxTransient); break;
11187 case X86_XCPT_AC: rc = hmR0VmxExitXcptAC(pVCpu, pVmxTransient); break;
11188
11189 case X86_XCPT_NM: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestNM);
11190 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11191 case X86_XCPT_XF: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestXF);
11192 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11193 case X86_XCPT_DE: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestDE);
11194 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11195 case X86_XCPT_UD: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestUD);
11196 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11197 case X86_XCPT_SS: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestSS);
11198 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11199 case X86_XCPT_NP: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestNP);
11200 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11201 case X86_XCPT_TS: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestTS);
11202 rc = hmR0VmxExitXcptGeneric(pVCpu, pVmxTransient); break;
11203 default:
11204 {
11205 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestXcpUnk);
11206 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
11207 {
11208 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.vmx.pRealModeTSS);
11209 Assert(PDMVmmDevHeapIsEnabled(pVCpu->CTX_SUFF(pVM)));
11210 Assert(CPUMIsGuestInRealModeEx(&pVCpu->cpum.GstCtx));
11211
11212 rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR0);
11213 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11214 rc |= hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
11215 AssertRCReturn(rc, rc);
11216 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(uExitIntInfo),
11217 pVmxTransient->cbInstr, pVmxTransient->uExitIntErrorCode,
11218 0 /* GCPtrFaultAddress */);
11219 }
11220 else
11221 {
11222 AssertMsgFailed(("Unexpected VM-exit caused by exception %#x\n", uVector));
11223 pVCpu->hm.s.u32HMError = uVector;
11224 rc = VERR_VMX_UNEXPECTED_EXCEPTION;
11225 }
11226 break;
11227 }
11228 }
11229 break;
11230 }
11231
11232 default:
11233 {
11234 pVCpu->hm.s.u32HMError = uExitIntInfo;
11235 rc = VERR_VMX_UNEXPECTED_INTERRUPTION_EXIT_TYPE;
11236 AssertMsgFailed(("Unexpected interruption info %#x\n", VMX_EXIT_INT_INFO_TYPE(uExitIntInfo)));
11237 break;
11238 }
11239 }
11240 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitXcptNmi, y3);
11241 return rc;
11242}
11243
11244
11245/**
11246 * VM-exit handler for interrupt-window exiting (VMX_EXIT_INT_WINDOW).
11247 */
11248HMVMX_EXIT_NSRC_DECL hmR0VmxExitIntWindow(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11249{
11250 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11251
11252 /* Indicate that we no longer need to VM-exit when the guest is ready to receive interrupts, it is now ready. */
11253 hmR0VmxClearIntWindowExitVmcs(pVCpu);
11254
11255 /* Deliver the pending interrupts via hmR0VmxEvaluatePendingEvent() and resume guest execution. */
11256 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIntWindow);
11257 return VINF_SUCCESS;
11258}
11259
11260
11261/**
11262 * VM-exit handler for NMI-window exiting (VMX_EXIT_NMI_WINDOW).
11263 */
11264HMVMX_EXIT_NSRC_DECL hmR0VmxExitNmiWindow(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11265{
11266 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11267 if (RT_UNLIKELY(!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_NMI_WINDOW_EXIT)))
11268 {
11269 AssertMsgFailed(("Unexpected NMI-window exit.\n"));
11270 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11271 }
11272
11273 Assert(!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_BLOCK_NMIS));
11274
11275 /*
11276 * If block-by-STI is set when we get this VM-exit, it means the CPU doesn't block NMIs following STI.
11277 * It is therefore safe to unblock STI and deliver the NMI ourselves. See @bugref{7445}.
11278 */
11279 uint32_t fIntrState = 0;
11280 int rc = VMXReadVmcs32(VMX_VMCS32_GUEST_INT_STATE, &fIntrState);
11281 AssertRCReturn(rc, rc);
11282 Assert(!(fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_MOVSS));
11283 if (fIntrState & VMX_VMCS_GUEST_INT_STATE_BLOCK_STI)
11284 {
11285 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
11286 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
11287
11288 fIntrState &= ~VMX_VMCS_GUEST_INT_STATE_BLOCK_STI;
11289 rc = VMXWriteVmcs32(VMX_VMCS32_GUEST_INT_STATE, fIntrState);
11290 AssertRCReturn(rc, rc);
11291 }
11292
11293 /* Indicate that we no longer need to VM-exit when the guest is ready to receive NMIs, it is now ready */
11294 hmR0VmxClearNmiWindowExitVmcs(pVCpu);
11295
11296 /* Deliver the pending NMI via hmR0VmxEvaluatePendingEvent() and resume guest execution. */
11297 return VINF_SUCCESS;
11298}
11299
11300
11301/**
11302 * VM-exit handler for WBINVD (VMX_EXIT_WBINVD). Conditional VM-exit.
11303 */
11304HMVMX_EXIT_NSRC_DECL hmR0VmxExitWbinvd(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11305{
11306 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11307 return hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11308}
11309
11310
11311/**
11312 * VM-exit handler for INVD (VMX_EXIT_INVD). Unconditional VM-exit.
11313 */
11314HMVMX_EXIT_NSRC_DECL hmR0VmxExitInvd(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11315{
11316 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11317 return hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11318}
11319
11320
11321/**
11322 * VM-exit handler for CPUID (VMX_EXIT_CPUID). Unconditional VM-exit.
11323 */
11324HMVMX_EXIT_DECL hmR0VmxExitCpuid(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11325{
11326 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11327
11328 /*
11329 * Get the state we need and update the exit history entry.
11330 */
11331 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11332 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_EXEC_DECODED_NO_MEM_MASK);
11333 AssertRCReturn(rc, rc);
11334
11335 VBOXSTRICTRC rcStrict;
11336 PCEMEXITREC pExitRec = EMHistoryUpdateFlagsAndTypeAndPC(pVCpu,
11337 EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_CPUID),
11338 pVCpu->cpum.GstCtx.rip + pVCpu->cpum.GstCtx.cs.u64Base);
11339 if (!pExitRec)
11340 {
11341 /*
11342 * Regular CPUID instruction execution.
11343 */
11344 rcStrict = IEMExecDecodedCpuid(pVCpu, pVmxTransient->cbInstr);
11345 if (rcStrict == VINF_SUCCESS)
11346 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
11347 else if (rcStrict == VINF_IEM_RAISED_XCPT)
11348 {
11349 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
11350 rcStrict = VINF_SUCCESS;
11351 }
11352 }
11353 else
11354 {
11355 /*
11356 * Frequent exit or something needing probing. Get state and call EMHistoryExec.
11357 */
11358 int rc2 = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
11359 AssertRCReturn(rc2, rc2);
11360
11361 Log4(("CpuIdExit/%u: %04x:%08RX64: %#x/%#x -> EMHistoryExec\n",
11362 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip, pVCpu->cpum.GstCtx.eax, pVCpu->cpum.GstCtx.ecx));
11363
11364 rcStrict = EMHistoryExec(pVCpu, pExitRec, 0);
11365 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
11366
11367 Log4(("CpuIdExit/%u: %04x:%08RX64: EMHistoryExec -> %Rrc + %04x:%08RX64\n",
11368 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip,
11369 VBOXSTRICTRC_VAL(rcStrict), pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip));
11370 }
11371 return rcStrict;
11372}
11373
11374
11375/**
11376 * VM-exit handler for GETSEC (VMX_EXIT_GETSEC). Unconditional VM-exit.
11377 */
11378HMVMX_EXIT_DECL hmR0VmxExitGetsec(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11379{
11380 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11381 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR4);
11382 AssertRCReturn(rc, rc);
11383
11384 if (pVCpu->cpum.GstCtx.cr4 & X86_CR4_SMXE)
11385 return VINF_EM_RAW_EMULATE_INSTR;
11386
11387 AssertMsgFailed(("hmR0VmxExitGetsec: unexpected VM-exit when CR4.SMXE is 0.\n"));
11388 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11389}
11390
11391
11392/**
11393 * VM-exit handler for RDTSC (VMX_EXIT_RDTSC). Conditional VM-exit.
11394 */
11395HMVMX_EXIT_DECL hmR0VmxExitRdtsc(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11396{
11397 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11398 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
11399 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11400 AssertRCReturn(rc, rc);
11401
11402 VBOXSTRICTRC rcStrict = IEMExecDecodedRdtsc(pVCpu, pVmxTransient->cbInstr);
11403 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
11404 {
11405 /* If we get a spurious VM-exit when offsetting is enabled,
11406 we must reset offsetting on VM-reentry. See @bugref{6634}. */
11407 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TSC_OFFSETTING)
11408 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = true;
11409 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
11410 }
11411 else if (rcStrict == VINF_IEM_RAISED_XCPT)
11412 {
11413 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
11414 rcStrict = VINF_SUCCESS;
11415 }
11416 return rcStrict;
11417}
11418
11419
11420/**
11421 * VM-exit handler for RDTSCP (VMX_EXIT_RDTSCP). Conditional VM-exit.
11422 */
11423HMVMX_EXIT_DECL hmR0VmxExitRdtscp(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11424{
11425 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11426 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK | CPUMCTX_EXTRN_TSC_AUX);
11427 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11428 AssertRCReturn(rc, rc);
11429
11430 VBOXSTRICTRC rcStrict = IEMExecDecodedRdtscp(pVCpu, pVmxTransient->cbInstr);
11431 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
11432 {
11433 /* If we get a spurious VM-exit when offsetting is enabled,
11434 we must reset offsetting on VM-reentry. See @bugref{6634}. */
11435 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TSC_OFFSETTING)
11436 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = true;
11437 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
11438 }
11439 else if (rcStrict == VINF_IEM_RAISED_XCPT)
11440 {
11441 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
11442 rcStrict = VINF_SUCCESS;
11443 }
11444 return rcStrict;
11445}
11446
11447
11448/**
11449 * VM-exit handler for RDPMC (VMX_EXIT_RDPMC). Conditional VM-exit.
11450 */
11451HMVMX_EXIT_DECL hmR0VmxExitRdpmc(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11452{
11453 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11454 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR4 | CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_RFLAGS | CPUMCTX_EXTRN_SS);
11455 AssertRCReturn(rc, rc);
11456
11457 PVM pVM = pVCpu->CTX_SUFF(pVM);
11458 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
11459 rc = EMInterpretRdpmc(pVM, pVCpu, CPUMCTX2CORE(pCtx));
11460 if (RT_LIKELY(rc == VINF_SUCCESS))
11461 {
11462 rc = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11463 Assert(pVmxTransient->cbInstr == 2);
11464 }
11465 else
11466 {
11467 AssertMsgFailed(("hmR0VmxExitRdpmc: EMInterpretRdpmc failed with %Rrc\n", rc));
11468 rc = VERR_EM_INTERPRETER;
11469 }
11470 return rc;
11471}
11472
11473
11474/**
11475 * VM-exit handler for VMCALL (VMX_EXIT_VMCALL). Unconditional VM-exit.
11476 */
11477HMVMX_EXIT_DECL hmR0VmxExitVmcall(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11478{
11479 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11480
11481 VBOXSTRICTRC rcStrict = VERR_VMX_IPE_3;
11482 if (EMAreHypercallInstructionsEnabled(pVCpu))
11483 {
11484 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RIP | CPUMCTX_EXTRN_RFLAGS | CPUMCTX_EXTRN_CR0
11485 | CPUMCTX_EXTRN_SS | CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_EFER);
11486 AssertRCReturn(rc, rc);
11487
11488 /* Perform the hypercall. */
11489 rcStrict = GIMHypercall(pVCpu, &pVCpu->cpum.GstCtx);
11490 if (rcStrict == VINF_SUCCESS)
11491 {
11492 rc = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11493 AssertRCReturn(rc, rc);
11494 }
11495 else
11496 Assert( rcStrict == VINF_GIM_R3_HYPERCALL
11497 || rcStrict == VINF_GIM_HYPERCALL_CONTINUING
11498 || RT_FAILURE(rcStrict));
11499
11500 /* If the hypercall changes anything other than guest's general-purpose registers,
11501 we would need to reload the guest changed bits here before VM-entry. */
11502 }
11503 else
11504 Log4Func(("Hypercalls not enabled\n"));
11505
11506 /* If hypercalls are disabled or the hypercall failed for some reason, raise #UD and continue. */
11507 if (RT_FAILURE(rcStrict))
11508 {
11509 hmR0VmxSetPendingXcptUD(pVCpu);
11510 rcStrict = VINF_SUCCESS;
11511 }
11512
11513 return rcStrict;
11514}
11515
11516
11517/**
11518 * VM-exit handler for INVLPG (VMX_EXIT_INVLPG). Conditional VM-exit.
11519 */
11520HMVMX_EXIT_DECL hmR0VmxExitInvlpg(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11521{
11522 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11523 Assert(!pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging || pVCpu->hm.s.fUsingDebugLoop);
11524
11525 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
11526 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11527 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
11528 AssertRCReturn(rc, rc);
11529
11530 VBOXSTRICTRC rcStrict = IEMExecDecodedInvlpg(pVCpu, pVmxTransient->cbInstr, pVmxTransient->uExitQual);
11531
11532 if (rcStrict == VINF_SUCCESS || rcStrict == VINF_PGM_SYNC_CR3)
11533 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
11534 else if (rcStrict == VINF_IEM_RAISED_XCPT)
11535 {
11536 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
11537 rcStrict = VINF_SUCCESS;
11538 }
11539 else
11540 AssertMsgFailed(("Unexpected IEMExecDecodedInvlpg(%#RX64) sttus: %Rrc\n", pVmxTransient->uExitQual,
11541 VBOXSTRICTRC_VAL(rcStrict)));
11542 return rcStrict;
11543}
11544
11545
11546/**
11547 * VM-exit handler for MONITOR (VMX_EXIT_MONITOR). Conditional VM-exit.
11548 */
11549HMVMX_EXIT_DECL hmR0VmxExitMonitor(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11550{
11551 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11552 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_RFLAGS | CPUMCTX_EXTRN_SS);
11553 AssertRCReturn(rc, rc);
11554
11555 PVM pVM = pVCpu->CTX_SUFF(pVM);
11556 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
11557 rc = EMInterpretMonitor(pVM, pVCpu, CPUMCTX2CORE(pCtx));
11558 if (RT_LIKELY(rc == VINF_SUCCESS))
11559 rc = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11560 else
11561 {
11562 AssertMsg(rc == VERR_EM_INTERPRETER, ("hmR0VmxExitMonitor: EMInterpretMonitor failed with %Rrc\n", rc));
11563 rc = VERR_EM_INTERPRETER;
11564 }
11565 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitMonitor);
11566 return rc;
11567}
11568
11569
11570/**
11571 * VM-exit handler for MWAIT (VMX_EXIT_MWAIT). Conditional VM-exit.
11572 */
11573HMVMX_EXIT_DECL hmR0VmxExitMwait(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11574{
11575 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11576 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR0 | CPUMCTX_EXTRN_RFLAGS | CPUMCTX_EXTRN_SS);
11577 AssertRCReturn(rc, rc);
11578
11579 PVM pVM = pVCpu->CTX_SUFF(pVM);
11580 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
11581 VBOXSTRICTRC rc2 = EMInterpretMWait(pVM, pVCpu, CPUMCTX2CORE(pCtx));
11582 rc = VBOXSTRICTRC_VAL(rc2);
11583 if (RT_LIKELY( rc == VINF_SUCCESS
11584 || rc == VINF_EM_HALT))
11585 {
11586 int rc3 = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11587 AssertRCReturn(rc3, rc3);
11588
11589 if ( rc == VINF_EM_HALT
11590 && EMMonitorWaitShouldContinue(pVCpu, pCtx))
11591 rc = VINF_SUCCESS;
11592 }
11593 else
11594 {
11595 AssertMsg(rc == VERR_EM_INTERPRETER, ("hmR0VmxExitMwait: EMInterpretMWait failed with %Rrc\n", rc));
11596 rc = VERR_EM_INTERPRETER;
11597 }
11598 AssertMsg(rc == VINF_SUCCESS || rc == VINF_EM_HALT || rc == VERR_EM_INTERPRETER,
11599 ("hmR0VmxExitMwait: failed, invalid error code %Rrc\n", rc));
11600 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitMwait);
11601 return rc;
11602}
11603
11604
11605/**
11606 * VM-exit handler for RSM (VMX_EXIT_RSM). Unconditional VM-exit.
11607 */
11608HMVMX_EXIT_NSRC_DECL hmR0VmxExitRsm(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11609{
11610 /*
11611 * Execution of RSM outside of SMM mode causes #UD regardless of VMX root or VMX non-root
11612 * mode. In theory, we should never get this VM-exit. This can happen only if dual-monitor
11613 * treatment of SMI and VMX is enabled, which can (only?) be done by executing VMCALL in
11614 * VMX root operation. If we get here, something funny is going on.
11615 *
11616 * See Intel spec. 33.15.5 "Enabling the Dual-Monitor Treatment".
11617 */
11618 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11619 AssertMsgFailed(("Unexpected RSM VM-exit\n"));
11620 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11621}
11622
11623
11624/**
11625 * VM-exit handler for SMI (VMX_EXIT_SMI). Unconditional VM-exit.
11626 */
11627HMVMX_EXIT_NSRC_DECL hmR0VmxExitSmi(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11628{
11629 /*
11630 * This can only happen if we support dual-monitor treatment of SMI, which can be activated
11631 * by executing VMCALL in VMX root operation. Only an STM (SMM transfer monitor) would get
11632 * this VM-exit when we (the executive monitor) execute a VMCALL in VMX root mode or receive
11633 * an SMI. If we get here, something funny is going on.
11634 *
11635 * See Intel spec. 33.15.6 "Activating the Dual-Monitor Treatment"
11636 * See Intel spec. 25.3 "Other Causes of VM-Exits"
11637 */
11638 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11639 AssertMsgFailed(("Unexpected SMI VM-exit\n"));
11640 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11641}
11642
11643
11644/**
11645 * VM-exit handler for IO SMI (VMX_EXIT_IO_SMI). Unconditional VM-exit.
11646 */
11647HMVMX_EXIT_NSRC_DECL hmR0VmxExitIoSmi(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11648{
11649 /* Same treatment as VMX_EXIT_SMI. See comment in hmR0VmxExitSmi(). */
11650 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11651 AssertMsgFailed(("Unexpected IO SMI VM-exit\n"));
11652 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11653}
11654
11655
11656/**
11657 * VM-exit handler for SIPI (VMX_EXIT_SIPI). Conditional VM-exit.
11658 */
11659HMVMX_EXIT_NSRC_DECL hmR0VmxExitSipi(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11660{
11661 /*
11662 * SIPI exits can only occur in VMX non-root operation when the "wait-for-SIPI" guest activity state is used.
11663 * We don't make use of it as our guests don't have direct access to the host LAPIC.
11664 * See Intel spec. 25.3 "Other Causes of VM-exits".
11665 */
11666 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11667 AssertMsgFailed(("Unexpected SIPI VM-exit\n"));
11668 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11669}
11670
11671
11672/**
11673 * VM-exit handler for INIT signal (VMX_EXIT_INIT_SIGNAL). Unconditional
11674 * VM-exit.
11675 */
11676HMVMX_EXIT_NSRC_DECL hmR0VmxExitInitSignal(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11677{
11678 /*
11679 * INIT signals are blocked in VMX root operation by VMXON and by SMI in SMM.
11680 * See Intel spec. 33.14.1 Default Treatment of SMI Delivery" and Intel spec. 29.3 "VMX Instructions" for "VMXON".
11681 *
11682 * It is -NOT- blocked in VMX non-root operation so we can, in theory, still get these VM-exits.
11683 * See Intel spec. "23.8 Restrictions on VMX operation".
11684 */
11685 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11686 return VINF_SUCCESS;
11687}
11688
11689
11690/**
11691 * VM-exit handler for triple faults (VMX_EXIT_TRIPLE_FAULT). Unconditional
11692 * VM-exit.
11693 */
11694HMVMX_EXIT_DECL hmR0VmxExitTripleFault(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11695{
11696 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11697 return VINF_EM_RESET;
11698}
11699
11700
11701/**
11702 * VM-exit handler for HLT (VMX_EXIT_HLT). Conditional VM-exit.
11703 */
11704HMVMX_EXIT_DECL hmR0VmxExitHlt(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11705{
11706 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11707 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_HLT_EXIT);
11708
11709 int rc = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
11710 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RFLAGS);
11711 AssertRCReturn(rc, rc);
11712
11713 if (EMShouldContinueAfterHalt(pVCpu, &pVCpu->cpum.GstCtx)) /* Requires eflags. */
11714 rc = VINF_SUCCESS;
11715 else
11716 rc = VINF_EM_HALT;
11717
11718 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitHlt);
11719 if (rc != VINF_SUCCESS)
11720 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHltToR3);
11721 return rc;
11722}
11723
11724
11725/**
11726 * VM-exit handler for instructions that result in a \#UD exception delivered to
11727 * the guest.
11728 */
11729HMVMX_EXIT_NSRC_DECL hmR0VmxExitSetPendingXcptUD(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11730{
11731 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11732 hmR0VmxSetPendingXcptUD(pVCpu);
11733 return VINF_SUCCESS;
11734}
11735
11736
11737/**
11738 * VM-exit handler for expiry of the VMX preemption timer.
11739 */
11740HMVMX_EXIT_DECL hmR0VmxExitPreemptTimer(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11741{
11742 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11743
11744 /* If the preemption-timer has expired, reinitialize the preemption timer on next VM-entry. */
11745 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = true;
11746
11747 /* If there are any timer events pending, fall back to ring-3, otherwise resume guest execution. */
11748 PVM pVM = pVCpu->CTX_SUFF(pVM);
11749 bool fTimersPending = TMTimerPollBool(pVM, pVCpu);
11750 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitPreemptTimer);
11751 return fTimersPending ? VINF_EM_RAW_TIMER_PENDING : VINF_SUCCESS;
11752}
11753
11754
11755/**
11756 * VM-exit handler for XSETBV (VMX_EXIT_XSETBV). Unconditional VM-exit.
11757 */
11758HMVMX_EXIT_DECL hmR0VmxExitXsetbv(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11759{
11760 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11761
11762 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11763 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK | CPUMCTX_EXTRN_CR4);
11764 AssertRCReturn(rc, rc);
11765
11766 VBOXSTRICTRC rcStrict = IEMExecDecodedXsetbv(pVCpu, pVmxTransient->cbInstr);
11767 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, rcStrict != VINF_IEM_RAISED_XCPT ? HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS
11768 : HM_CHANGED_RAISED_XCPT_MASK);
11769
11770 PCCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
11771 pVCpu->hm.s.fLoadSaveGuestXcr0 = (pCtx->cr4 & X86_CR4_OSXSAVE) && pCtx->aXcr[0] != ASMGetXcr0();
11772
11773 return rcStrict;
11774}
11775
11776
11777/**
11778 * VM-exit handler for INVPCID (VMX_EXIT_INVPCID). Conditional VM-exit.
11779 */
11780HMVMX_EXIT_DECL hmR0VmxExitInvpcid(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11781{
11782 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11783 /** @todo Use VM-exit instruction information. */
11784 return VERR_EM_INTERPRETER;
11785}
11786
11787
11788/**
11789 * VM-exit handler for invalid-guest-state (VMX_EXIT_ERR_INVALID_GUEST_STATE).
11790 * Error VM-exit.
11791 */
11792HMVMX_EXIT_NSRC_DECL hmR0VmxExitErrInvalidGuestState(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11793{
11794 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
11795 AssertRCReturn(rc, rc);
11796 rc = hmR0VmxCheckVmcsCtls(pVCpu);
11797 if (RT_FAILURE(rc))
11798 return rc;
11799
11800 uint32_t uInvalidReason = hmR0VmxCheckGuestState(pVCpu);
11801 NOREF(uInvalidReason);
11802
11803#ifdef VBOX_STRICT
11804 uint32_t fIntrState;
11805 RTHCUINTREG uHCReg;
11806 uint64_t u64Val;
11807 uint32_t u32Val;
11808
11809 rc = hmR0VmxReadEntryIntInfoVmcs(pVmxTransient);
11810 rc |= hmR0VmxReadEntryXcptErrorCodeVmcs(pVmxTransient);
11811 rc |= hmR0VmxReadEntryInstrLenVmcs(pVmxTransient);
11812 rc |= VMXReadVmcs32(VMX_VMCS32_GUEST_INT_STATE, &fIntrState);
11813 AssertRCReturn(rc, rc);
11814
11815 Log4(("uInvalidReason %u\n", uInvalidReason));
11816 Log4(("VMX_VMCS32_CTRL_ENTRY_INTERRUPTION_INFO %#RX32\n", pVmxTransient->uEntryIntInfo));
11817 Log4(("VMX_VMCS32_CTRL_ENTRY_EXCEPTION_ERRCODE %#RX32\n", pVmxTransient->uEntryXcptErrorCode));
11818 Log4(("VMX_VMCS32_CTRL_ENTRY_INSTR_LENGTH %#RX32\n", pVmxTransient->cbEntryInstr));
11819 Log4(("VMX_VMCS32_GUEST_INT_STATE %#RX32\n", fIntrState));
11820
11821 rc = VMXReadVmcs32(VMX_VMCS_GUEST_CR0, &u32Val); AssertRC(rc);
11822 Log4(("VMX_VMCS_GUEST_CR0 %#RX32\n", u32Val));
11823 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR0_MASK, &uHCReg); AssertRC(rc);
11824 Log4(("VMX_VMCS_CTRL_CR0_MASK %#RHr\n", uHCReg));
11825 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR0_READ_SHADOW, &uHCReg); AssertRC(rc);
11826 Log4(("VMX_VMCS_CTRL_CR4_READ_SHADOW %#RHr\n", uHCReg));
11827 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR4_MASK, &uHCReg); AssertRC(rc);
11828 Log4(("VMX_VMCS_CTRL_CR4_MASK %#RHr\n", uHCReg));
11829 rc = VMXReadVmcsHstN(VMX_VMCS_CTRL_CR4_READ_SHADOW, &uHCReg); AssertRC(rc);
11830 Log4(("VMX_VMCS_CTRL_CR4_READ_SHADOW %#RHr\n", uHCReg));
11831 rc = VMXReadVmcs64(VMX_VMCS64_CTRL_EPTP_FULL, &u64Val); AssertRC(rc);
11832 Log4(("VMX_VMCS64_CTRL_EPTP_FULL %#RX64\n", u64Val));
11833
11834 hmR0DumpRegs(pVCpu);
11835#else
11836 NOREF(pVmxTransient);
11837#endif
11838
11839 return VERR_VMX_INVALID_GUEST_STATE;
11840}
11841
11842
11843/**
11844 * VM-exit handler for VM-entry failure due to an MSR-load
11845 * (VMX_EXIT_ERR_MSR_LOAD). Error VM-exit.
11846 */
11847HMVMX_EXIT_NSRC_DECL hmR0VmxExitErrMsrLoad(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11848{
11849 AssertMsgFailed(("Unexpected MSR-load exit\n"));
11850 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11851}
11852
11853
11854/**
11855 * VM-exit handler for VM-entry failure due to a machine-check event
11856 * (VMX_EXIT_ERR_MACHINE_CHECK). Error VM-exit.
11857 */
11858HMVMX_EXIT_NSRC_DECL hmR0VmxExitErrMachineCheck(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11859{
11860 AssertMsgFailed(("Unexpected machine-check event exit\n"));
11861 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11862}
11863
11864
11865/**
11866 * VM-exit handler for all undefined reasons. Should never ever happen.. in
11867 * theory.
11868 */
11869HMVMX_EXIT_NSRC_DECL hmR0VmxExitErrUndefined(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11870{
11871 RT_NOREF2(pVCpu, pVmxTransient);
11872 AssertMsgFailed(("Huh!? Undefined VM-exit reason %d\n", pVmxTransient->uExitReason));
11873 return VERR_VMX_UNDEFINED_EXIT_CODE;
11874}
11875
11876
11877/**
11878 * VM-exit handler for XDTR (LGDT, SGDT, LIDT, SIDT) accesses
11879 * (VMX_EXIT_GDTR_IDTR_ACCESS) and LDT and TR access (LLDT, LTR, SLDT, STR).
11880 * Conditional VM-exit.
11881 */
11882HMVMX_EXIT_DECL hmR0VmxExitXdtrAccess(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11883{
11884 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11885
11886 /* By default, we don't enable VMX_PROC_CTLS2_DESCRIPTOR_TABLE_EXIT. */
11887 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitXdtrAccess);
11888 if (pVCpu->hm.s.vmx.u32ProcCtls2 & VMX_PROC_CTLS2_DESC_TABLE_EXIT)
11889 return VERR_EM_INTERPRETER;
11890 AssertMsgFailed(("Unexpected XDTR access\n"));
11891 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11892}
11893
11894
11895/**
11896 * VM-exit handler for RDRAND (VMX_EXIT_RDRAND). Conditional VM-exit.
11897 */
11898HMVMX_EXIT_DECL hmR0VmxExitRdrand(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11899{
11900 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11901
11902 /* By default, we don't enable VMX_PROC_CTLS2_RDRAND_EXIT. */
11903 if (pVCpu->hm.s.vmx.u32ProcCtls2 & VMX_PROC_CTLS2_RDRAND_EXIT)
11904 return VERR_EM_INTERPRETER;
11905 AssertMsgFailed(("Unexpected RDRAND exit\n"));
11906 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11907}
11908
11909
11910/**
11911 * VM-exit handler for RDMSR (VMX_EXIT_RDMSR).
11912 */
11913HMVMX_EXIT_DECL hmR0VmxExitRdmsr(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11914{
11915 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11916
11917 /** @todo Optimize this: We currently drag in in the whole MSR state
11918 * (CPUMCTX_EXTRN_ALL_MSRS) here. We should optimize this to only get
11919 * MSRs required. That would require changes to IEM and possibly CPUM too.
11920 * (Should probably do it lazy fashion from CPUMAllMsrs.cpp). */
11921 uint32_t const idMsr = pVCpu->cpum.GstCtx.ecx;
11922 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11923 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_EXEC_DECODED_NO_MEM_MASK | CPUMCTX_EXTRN_ALL_MSRS);
11924 switch (idMsr)
11925 {
11926 /* The FS and GS base MSRs are not part of the above all-MSRs mask. */
11927 case MSR_K8_FS_BASE: rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_FS); break;
11928 case MSR_K8_GS_BASE: rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_GS); break;
11929 }
11930 AssertRCReturn(rc, rc);
11931
11932 Log4Func(("ecx=%#RX32\n", idMsr));
11933
11934#ifdef VBOX_STRICT
11935 if (pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS)
11936 {
11937 if ( hmR0VmxIsAutoLoadStoreGuestMsr(pVCpu, idMsr)
11938 && idMsr != MSR_K6_EFER)
11939 {
11940 AssertMsgFailed(("Unexpected RDMSR for an MSR in the auto-load/store area in the VMCS. ecx=%#RX32\n", idMsr));
11941 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11942 }
11943 if (hmR0VmxIsLazyGuestMsr(pVCpu, idMsr))
11944 {
11945 VMXMSREXITREAD enmRead;
11946 VMXMSREXITWRITE enmWrite;
11947 int rc2 = HMVmxGetMsrPermission(pVCpu->hm.s.vmx.pvMsrBitmap, idMsr, &enmRead, &enmWrite);
11948 AssertRCReturn(rc2, rc2);
11949 if (enmRead == VMXMSREXIT_PASSTHRU_READ)
11950 {
11951 AssertMsgFailed(("Unexpected RDMSR for a passthru lazy-restore MSR. ecx=%#RX32\n", idMsr));
11952 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
11953 }
11954 }
11955 }
11956#endif
11957
11958 VBOXSTRICTRC rcStrict = IEMExecDecodedRdmsr(pVCpu, pVmxTransient->cbInstr);
11959 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitRdmsr);
11960 if (rcStrict == VINF_SUCCESS)
11961 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS
11962 | HM_CHANGED_GUEST_RAX | HM_CHANGED_GUEST_RDX);
11963 else if (rcStrict == VINF_IEM_RAISED_XCPT)
11964 {
11965 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
11966 rcStrict = VINF_SUCCESS;
11967 }
11968 else
11969 AssertMsg(rcStrict == VINF_CPUM_R3_MSR_READ, ("Unexpected IEMExecDecodedRdmsr status: %Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
11970
11971 return rcStrict;
11972}
11973
11974
11975/**
11976 * VM-exit handler for WRMSR (VMX_EXIT_WRMSR).
11977 */
11978HMVMX_EXIT_DECL hmR0VmxExitWrmsr(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
11979{
11980 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
11981
11982 /** @todo Optimize this: We currently drag in in the whole MSR state
11983 * (CPUMCTX_EXTRN_ALL_MSRS) here. We should optimize this to only get
11984 * MSRs required. That would require changes to IEM and possibly CPUM too.
11985 * (Should probably do it lazy fashion from CPUMAllMsrs.cpp). */
11986 uint32_t const idMsr = pVCpu->cpum.GstCtx.ecx;
11987 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
11988 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_EXEC_DECODED_NO_MEM_MASK
11989 | CPUMCTX_EXTRN_ALL_MSRS);
11990 switch (idMsr)
11991 {
11992 /*
11993 * The FS and GS base MSRs are not part of the above all-MSRs mask.
11994 *
11995 * Although we don't need to fetch the base as it will be overwritten shortly, while
11996 * loading guest-state we would also load the entire segment register including limit
11997 * and attributes and thus we need to load them here.
11998 */
11999 case MSR_K8_FS_BASE: rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_FS); break;
12000 case MSR_K8_GS_BASE: rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_GS); break;
12001 }
12002 AssertRCReturn(rc, rc);
12003
12004 Log4Func(("ecx=%#RX32 edx:eax=%#RX32:%#RX32\n", idMsr, pVCpu->cpum.GstCtx.edx, pVCpu->cpum.GstCtx.eax));
12005
12006 VBOXSTRICTRC rcStrict = IEMExecDecodedWrmsr(pVCpu, pVmxTransient->cbInstr);
12007 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitWrmsr);
12008
12009 if (rcStrict == VINF_SUCCESS)
12010 {
12011 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
12012
12013 /* If this is an X2APIC WRMSR access, update the APIC state as well. */
12014 if ( idMsr == MSR_IA32_APICBASE
12015 || ( idMsr >= MSR_IA32_X2APIC_START
12016 && idMsr <= MSR_IA32_X2APIC_END))
12017 {
12018 /*
12019 * We've already saved the APIC related guest-state (TPR) in hmR0VmxPostRunGuest(). When full APIC register
12020 * virtualization is implemented we'll have to make sure APIC state is saved from the VMCS before IEM changes it.
12021 */
12022 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_APIC_TPR);
12023 }
12024 else if (idMsr == MSR_IA32_TSC) /* Windows 7 does this during bootup. See @bugref{6398}. */
12025 pVmxTransient->fUpdateTscOffsettingAndPreemptTimer = true;
12026 else if (idMsr == MSR_K6_EFER)
12027 {
12028 /*
12029 * If the guest touches EFER we need to update the VM-Entry and VM-Exit controls as well,
12030 * even if it is -not- touching bits that cause paging mode changes (LMA/LME). We care about
12031 * the other bits as well, SCE and NXE. See @bugref{7368}.
12032 */
12033 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_EFER_MSR | HM_CHANGED_VMX_ENTRY_CTLS
12034 | HM_CHANGED_VMX_EXIT_CTLS);
12035 }
12036
12037 /* Update MSRs that are part of the VMCS and auto-load/store area when MSR-bitmaps are not supported. */
12038 if (!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_MSR_BITMAPS))
12039 {
12040 switch (idMsr)
12041 {
12042 case MSR_IA32_SYSENTER_CS: ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_SYSENTER_CS_MSR); break;
12043 case MSR_IA32_SYSENTER_EIP: ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_SYSENTER_EIP_MSR); break;
12044 case MSR_IA32_SYSENTER_ESP: ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_SYSENTER_ESP_MSR); break;
12045 case MSR_K8_FS_BASE: ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_FS); break;
12046 case MSR_K8_GS_BASE: ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_GS); break;
12047 case MSR_K6_EFER: /* Nothing to do, already handled above. */ break;
12048 default:
12049 {
12050 if (hmR0VmxIsAutoLoadStoreGuestMsr(pVCpu, idMsr))
12051 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_VMX_GUEST_AUTO_MSRS);
12052 else if (hmR0VmxIsLazyGuestMsr(pVCpu, idMsr))
12053 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_VMX_GUEST_LAZY_MSRS);
12054 break;
12055 }
12056 }
12057 }
12058#ifdef VBOX_STRICT
12059 else
12060 {
12061 /* Paranoia. Validate that MSRs in the MSR-bitmaps with write-passthru are not intercepted. */
12062 switch (idMsr)
12063 {
12064 case MSR_IA32_SYSENTER_CS:
12065 case MSR_IA32_SYSENTER_EIP:
12066 case MSR_IA32_SYSENTER_ESP:
12067 case MSR_K8_FS_BASE:
12068 case MSR_K8_GS_BASE:
12069 {
12070 AssertMsgFailed(("Unexpected WRMSR for an MSR in the VMCS. ecx=%#RX32\n", idMsr));
12071 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
12072 }
12073
12074 /* Writes to MSRs in auto-load/store area/swapped MSRs, shouldn't cause VM-exits with MSR-bitmaps. */
12075 default:
12076 {
12077 if (hmR0VmxIsAutoLoadStoreGuestMsr(pVCpu, idMsr))
12078 {
12079 /* EFER writes are always intercepted, see hmR0VmxExportGuestMsrs(). */
12080 if (idMsr != MSR_K6_EFER)
12081 {
12082 AssertMsgFailed(("Unexpected WRMSR for an MSR in the auto-load/store area in the VMCS. ecx=%#RX32\n",
12083 idMsr));
12084 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
12085 }
12086 }
12087
12088 if (hmR0VmxIsLazyGuestMsr(pVCpu, idMsr))
12089 {
12090 VMXMSREXITREAD enmRead;
12091 VMXMSREXITWRITE enmWrite;
12092 int rc2 = HMVmxGetMsrPermission(pVCpu->hm.s.vmx.pvMsrBitmap, idMsr, &enmRead, &enmWrite);
12093 AssertRCReturn(rc2, rc2);
12094 if (enmWrite == VMXMSREXIT_PASSTHRU_WRITE)
12095 {
12096 AssertMsgFailed(("Unexpected WRMSR for passthru, lazy-restore MSR. ecx=%#RX32\n", idMsr));
12097 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
12098 }
12099 }
12100 break;
12101 }
12102 }
12103 }
12104#endif /* VBOX_STRICT */
12105 }
12106 else if (rcStrict == VINF_IEM_RAISED_XCPT)
12107 {
12108 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
12109 rcStrict = VINF_SUCCESS;
12110 }
12111 else
12112 AssertMsg(rcStrict == VINF_CPUM_R3_MSR_WRITE, ("Unexpected IEMExecDecodedWrmsr status: %Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12113
12114 return rcStrict;
12115}
12116
12117
12118/**
12119 * VM-exit handler for PAUSE (VMX_EXIT_PAUSE). Conditional VM-exit.
12120 */
12121HMVMX_EXIT_DECL hmR0VmxExitPause(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12122{
12123 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12124 /** @todo The guest has likely hit a contended spinlock. We might want to
12125 * poke a schedule different guest VCPU. */
12126 return VINF_EM_RAW_INTERRUPT;
12127}
12128
12129
12130/**
12131 * VM-exit handler for when the TPR value is lowered below the specified
12132 * threshold (VMX_EXIT_TPR_BELOW_THRESHOLD). Conditional VM-exit.
12133 */
12134HMVMX_EXIT_NSRC_DECL hmR0VmxExitTprBelowThreshold(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12135{
12136 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12137 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW);
12138
12139 /*
12140 * The TPR shadow would've been synced with the APIC TPR in hmR0VmxPostRunGuest(). We'll re-evaluate
12141 * pending interrupts and inject them before the next VM-entry so we can just continue execution here.
12142 */
12143 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitTprBelowThreshold);
12144 return VINF_SUCCESS;
12145}
12146
12147
12148/**
12149 * VM-exit handler for control-register accesses (VMX_EXIT_MOV_CRX). Conditional
12150 * VM-exit.
12151 *
12152 * @retval VINF_SUCCESS when guest execution can continue.
12153 * @retval VINF_PGM_SYNC_CR3 CR3 sync is required, back to ring-3.
12154 * @retval VERR_EM_INTERPRETER when something unexpected happened, fallback to
12155 * interpreter.
12156 */
12157HMVMX_EXIT_DECL hmR0VmxExitMovCRx(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12158{
12159 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12160 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatExitMovCRx, y2);
12161
12162 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12163 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
12164 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
12165 AssertRCReturn(rc, rc);
12166
12167 VBOXSTRICTRC rcStrict;
12168 PVM pVM = pVCpu->CTX_SUFF(pVM);
12169 RTGCUINTPTR const uExitQual = pVmxTransient->uExitQual;
12170 uint32_t const uAccessType = VMX_EXIT_QUAL_CRX_ACCESS(uExitQual);
12171 switch (uAccessType)
12172 {
12173 case VMX_EXIT_QUAL_CRX_ACCESS_WRITE: /* MOV to CRx */
12174 {
12175 uint32_t const uOldCr0 = pVCpu->cpum.GstCtx.cr0;
12176 rcStrict = IEMExecDecodedMovCRxWrite(pVCpu, pVmxTransient->cbInstr, VMX_EXIT_QUAL_CRX_REGISTER(uExitQual),
12177 VMX_EXIT_QUAL_CRX_GENREG(uExitQual));
12178 AssertMsg( rcStrict == VINF_SUCCESS
12179 || rcStrict == VINF_IEM_RAISED_XCPT
12180 || rcStrict == VINF_PGM_SYNC_CR3, ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12181
12182 switch (VMX_EXIT_QUAL_CRX_REGISTER(uExitQual))
12183 {
12184 case 0:
12185 {
12186 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged,
12187 HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_CR0);
12188 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR0Write);
12189 Log4Func(("CR0 write rcStrict=%Rrc CR0=%#RX64\n", VBOXSTRICTRC_VAL(rcStrict), pVCpu->cpum.GstCtx.cr0));
12190
12191 /*
12192 * This is a kludge for handling switches back to real mode when we try to use
12193 * V86 mode to run real mode code directly. Problem is that V86 mode cannot
12194 * deal with special selector values, so we have to return to ring-3 and run
12195 * there till the selector values are V86 mode compatible.
12196 *
12197 * Note! Using VINF_EM_RESCHEDULE_REM here rather than VINF_EM_RESCHEDULE since the
12198 * latter is an alias for VINF_IEM_RAISED_XCPT which is converted to VINF_SUCCESs
12199 * at the end of this function.
12200 */
12201 if ( rc == VINF_SUCCESS
12202 && !pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fUnrestrictedGuest
12203 && CPUMIsGuestInRealModeEx(&pVCpu->cpum.GstCtx)
12204 && (uOldCr0 & X86_CR0_PE)
12205 && !(pVCpu->cpum.GstCtx.cr0 & X86_CR0_PE) )
12206 {
12207 /** @todo check selectors rather than returning all the time. */
12208 Log4Func(("CR0 write, back to real mode -> VINF_EM_RESCHEDULE_REM\n"));
12209 rcStrict = VINF_EM_RESCHEDULE_REM;
12210 }
12211 break;
12212 }
12213
12214 case 2:
12215 {
12216 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR2Write);
12217 /* Nothing to do here, CR2 it's not part of the VMCS. */
12218 break;
12219 }
12220
12221 case 3:
12222 {
12223 Assert( !pVM->hm.s.fNestedPaging
12224 || !CPUMIsGuestPagingEnabledEx(&pVCpu->cpum.GstCtx)
12225 || pVCpu->hm.s.fUsingDebugLoop);
12226 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR3Write);
12227 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged,
12228 HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_CR3);
12229 Log4Func(("CR3 write rcStrict=%Rrc CR3=%#RX64\n", VBOXSTRICTRC_VAL(rcStrict), pVCpu->cpum.GstCtx.cr3));
12230 break;
12231 }
12232
12233 case 4:
12234 {
12235 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR4Write);
12236 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged,
12237 HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_CR4);
12238 Log4Func(("CR4 write rc=%Rrc CR4=%#RX64 fLoadSaveGuestXcr0=%u\n", VBOXSTRICTRC_VAL(rcStrict),
12239 pVCpu->cpum.GstCtx.cr4, pVCpu->hm.s.fLoadSaveGuestXcr0));
12240 break;
12241 }
12242
12243 case 8:
12244 {
12245 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR8Write);
12246 Assert(!(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW));
12247 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged,
12248 HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_APIC_TPR);
12249 break;
12250 }
12251 default:
12252 AssertMsgFailed(("Invalid CRx register %#x\n", VMX_EXIT_QUAL_CRX_REGISTER(uExitQual)));
12253 break;
12254 }
12255 break;
12256 }
12257
12258 case VMX_EXIT_QUAL_CRX_ACCESS_READ: /* MOV from CRx */
12259 {
12260 Assert( !pVM->hm.s.fNestedPaging
12261 || !CPUMIsGuestPagingEnabledEx(&pVCpu->cpum.GstCtx)
12262 || pVCpu->hm.s.fUsingDebugLoop
12263 || VMX_EXIT_QUAL_CRX_REGISTER(uExitQual) != 3);
12264 /* CR8 reads only cause a VM-exit when the TPR shadow feature isn't enabled. */
12265 Assert( VMX_EXIT_QUAL_CRX_REGISTER(uExitQual) != 8
12266 || !(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW));
12267
12268 rcStrict = IEMExecDecodedMovCRxRead(pVCpu, pVmxTransient->cbInstr, VMX_EXIT_QUAL_CRX_GENREG(uExitQual),
12269 VMX_EXIT_QUAL_CRX_REGISTER(uExitQual));
12270 AssertMsg( rcStrict == VINF_SUCCESS
12271 || rcStrict == VINF_IEM_RAISED_XCPT, ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12272#ifdef VBOX_WITH_STATISTICS
12273 switch (VMX_EXIT_QUAL_CRX_REGISTER(uExitQual))
12274 {
12275 case 0: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR0Read); break;
12276 case 2: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR2Read); break;
12277 case 3: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR3Read); break;
12278 case 4: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR4Read); break;
12279 case 8: STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCR8Read); break;
12280 }
12281#endif
12282 Log4Func(("CR%d Read access rcStrict=%Rrc\n", VMX_EXIT_QUAL_CRX_REGISTER(uExitQual),
12283 VBOXSTRICTRC_VAL(rcStrict)));
12284 if (VMX_EXIT_QUAL_CRX_GENREG(uExitQual) == X86_GREG_xSP)
12285 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_RSP);
12286 else
12287 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS);
12288 break;
12289 }
12290
12291 case VMX_EXIT_QUAL_CRX_ACCESS_CLTS: /* CLTS (Clear Task-Switch Flag in CR0) */
12292 {
12293 rcStrict = IEMExecDecodedClts(pVCpu, pVmxTransient->cbInstr);
12294 AssertMsg( rcStrict == VINF_SUCCESS
12295 || rcStrict == VINF_IEM_RAISED_XCPT, ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12296
12297 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_CR0);
12298 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitClts);
12299 Log4Func(("CLTS rcStrict=%d\n", VBOXSTRICTRC_VAL(rcStrict)));
12300 break;
12301 }
12302
12303 case VMX_EXIT_QUAL_CRX_ACCESS_LMSW: /* LMSW (Load Machine-Status Word into CR0) */
12304 {
12305 /* Note! LMSW cannot clear CR0.PE, so no fRealOnV86Active kludge needed here. */
12306 rc = hmR0VmxReadGuestLinearAddrVmcs(pVCpu, pVmxTransient);
12307 AssertRCReturn(rc, rc);
12308 rcStrict = IEMExecDecodedLmsw(pVCpu, pVmxTransient->cbInstr, VMX_EXIT_QUAL_CRX_LMSW_DATA(uExitQual),
12309 pVmxTransient->uGuestLinearAddr);
12310 AssertMsg( rcStrict == VINF_SUCCESS
12311 || rcStrict == VINF_IEM_RAISED_XCPT
12312 , ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12313
12314 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_CR0);
12315 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitLmsw);
12316 Log4Func(("LMSW rcStrict=%d\n", VBOXSTRICTRC_VAL(rcStrict)));
12317 break;
12318 }
12319
12320 default:
12321 AssertMsgFailedReturn(("Invalid access-type in Mov CRx VM-exit qualification %#x\n", uAccessType),
12322 VERR_VMX_UNEXPECTED_EXCEPTION);
12323 }
12324
12325 Assert( (pVCpu->hm.s.fCtxChanged & (HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS))
12326 == (HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS));
12327 if (rcStrict == VINF_IEM_RAISED_XCPT)
12328 {
12329 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
12330 rcStrict = VINF_SUCCESS;
12331 }
12332
12333 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitMovCRx, y2);
12334 NOREF(pVM);
12335 return rcStrict;
12336}
12337
12338
12339/**
12340 * VM-exit handler for I/O instructions (VMX_EXIT_IO_INSTR). Conditional
12341 * VM-exit.
12342 */
12343HMVMX_EXIT_DECL hmR0VmxExitIoInstr(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12344{
12345 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12346 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatExitIO, y1);
12347
12348 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
12349 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12350 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
12351 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK | CPUMCTX_EXTRN_SREG_MASK | CPUMCTX_EXTRN_EFER);
12352 /* EFER also required for longmode checks in EMInterpretDisasCurrent(), but it's always up-to-date. */
12353 AssertRCReturn(rc, rc);
12354
12355 /* Refer Intel spec. 27-5. "Exit Qualifications for I/O Instructions" for the format. */
12356 uint32_t uIOPort = VMX_EXIT_QUAL_IO_PORT(pVmxTransient->uExitQual);
12357 uint8_t uIOWidth = VMX_EXIT_QUAL_IO_WIDTH(pVmxTransient->uExitQual);
12358 bool fIOWrite = (VMX_EXIT_QUAL_IO_DIRECTION(pVmxTransient->uExitQual) == VMX_EXIT_QUAL_IO_DIRECTION_OUT);
12359 bool fIOString = VMX_EXIT_QUAL_IO_IS_STRING(pVmxTransient->uExitQual);
12360 bool fGstStepping = RT_BOOL(pCtx->eflags.Bits.u1TF);
12361 bool fDbgStepping = pVCpu->hm.s.fSingleInstruction;
12362 AssertReturn(uIOWidth <= 3 && uIOWidth != 2, VERR_VMX_IPE_1);
12363
12364 /*
12365 * Update exit history to see if this exit can be optimized.
12366 */
12367 VBOXSTRICTRC rcStrict;
12368 PCEMEXITREC pExitRec = NULL;
12369 if ( !fGstStepping
12370 && !fDbgStepping)
12371 pExitRec = EMHistoryUpdateFlagsAndTypeAndPC(pVCpu,
12372 !fIOString
12373 ? !fIOWrite
12374 ? EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_IO_PORT_READ)
12375 : EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_IO_PORT_WRITE)
12376 : !fIOWrite
12377 ? EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_IO_PORT_STR_READ)
12378 : EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_IO_PORT_STR_WRITE),
12379 pVCpu->cpum.GstCtx.rip + pVCpu->cpum.GstCtx.cs.u64Base);
12380 if (!pExitRec)
12381 {
12382 /* I/O operation lookup arrays. */
12383 static uint32_t const s_aIOSizes[4] = { 1, 2, 0, 4 }; /* Size of the I/O accesses. */
12384 static uint32_t const s_aIOOpAnd[4] = { 0xff, 0xffff, 0, 0xffffffff }; /* AND masks for saving result in AL/AX/EAX. */
12385 uint32_t const cbValue = s_aIOSizes[uIOWidth];
12386 uint32_t const cbInstr = pVmxTransient->cbInstr;
12387 bool fUpdateRipAlready = false; /* ugly hack, should be temporary. */
12388 PVM pVM = pVCpu->CTX_SUFF(pVM);
12389 if (fIOString)
12390 {
12391 /*
12392 * INS/OUTS - I/O String instruction.
12393 *
12394 * Use instruction-information if available, otherwise fall back on
12395 * interpreting the instruction.
12396 */
12397 Log4Func(("CS:RIP=%04x:%08RX64 %#06x/%u %c str\n", pCtx->cs.Sel, pCtx->rip, uIOPort, cbValue, fIOWrite ? 'w' : 'r'));
12398 AssertReturn(pCtx->dx == uIOPort, VERR_VMX_IPE_2);
12399 bool const fInsOutsInfo = RT_BF_GET(pVM->hm.s.vmx.Msrs.u64Basic, VMX_BF_BASIC_VMCS_INS_OUTS);
12400 if (fInsOutsInfo)
12401 {
12402 int rc2 = hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
12403 AssertRCReturn(rc2, rc2);
12404 AssertReturn(pVmxTransient->ExitInstrInfo.StrIo.u3AddrSize <= 2, VERR_VMX_IPE_3);
12405 AssertCompile(IEMMODE_16BIT == 0 && IEMMODE_32BIT == 1 && IEMMODE_64BIT == 2);
12406 IEMMODE const enmAddrMode = (IEMMODE)pVmxTransient->ExitInstrInfo.StrIo.u3AddrSize;
12407 bool const fRep = VMX_EXIT_QUAL_IO_IS_REP(pVmxTransient->uExitQual);
12408 if (fIOWrite)
12409 rcStrict = IEMExecStringIoWrite(pVCpu, cbValue, enmAddrMode, fRep, cbInstr,
12410 pVmxTransient->ExitInstrInfo.StrIo.iSegReg, true /*fIoChecked*/);
12411 else
12412 {
12413 /*
12414 * The segment prefix for INS cannot be overridden and is always ES. We can safely assume X86_SREG_ES.
12415 * Hence "iSegReg" field is undefined in the instruction-information field in VT-x for INS.
12416 * See Intel Instruction spec. for "INS".
12417 * See Intel spec. Table 27-8 "Format of the VM-Exit Instruction-Information Field as Used for INS and OUTS".
12418 */
12419 rcStrict = IEMExecStringIoRead(pVCpu, cbValue, enmAddrMode, fRep, cbInstr, true /*fIoChecked*/);
12420 }
12421 }
12422 else
12423 rcStrict = IEMExecOne(pVCpu);
12424
12425 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP);
12426 fUpdateRipAlready = true;
12427 }
12428 else
12429 {
12430 /*
12431 * IN/OUT - I/O instruction.
12432 */
12433 Log4Func(("CS:RIP=%04x:%08RX64 %#06x/%u %c\n", pCtx->cs.Sel, pCtx->rip, uIOPort, cbValue, fIOWrite ? 'w' : 'r'));
12434 uint32_t const uAndVal = s_aIOOpAnd[uIOWidth];
12435 Assert(!VMX_EXIT_QUAL_IO_IS_REP(pVmxTransient->uExitQual));
12436 if (fIOWrite)
12437 {
12438 rcStrict = IOMIOPortWrite(pVM, pVCpu, uIOPort, pCtx->eax & uAndVal, cbValue);
12439 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOWrite);
12440 if ( rcStrict == VINF_IOM_R3_IOPORT_WRITE
12441 && !pCtx->eflags.Bits.u1TF)
12442 rcStrict = EMRZSetPendingIoPortWrite(pVCpu, uIOPort, cbInstr, cbValue, pCtx->eax & uAndVal);
12443 }
12444 else
12445 {
12446 uint32_t u32Result = 0;
12447 rcStrict = IOMIOPortRead(pVM, pVCpu, uIOPort, &u32Result, cbValue);
12448 if (IOM_SUCCESS(rcStrict))
12449 {
12450 /* Save result of I/O IN instr. in AL/AX/EAX. */
12451 pCtx->eax = (pCtx->eax & ~uAndVal) | (u32Result & uAndVal);
12452 }
12453 if ( rcStrict == VINF_IOM_R3_IOPORT_READ
12454 && !pCtx->eflags.Bits.u1TF)
12455 rcStrict = EMRZSetPendingIoPortRead(pVCpu, uIOPort, cbInstr, cbValue);
12456 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIORead);
12457 }
12458 }
12459
12460 if (IOM_SUCCESS(rcStrict))
12461 {
12462 if (!fUpdateRipAlready)
12463 {
12464 hmR0VmxAdvanceGuestRipBy(pVCpu, cbInstr);
12465 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP);
12466 }
12467
12468 /*
12469 * INS/OUTS with REP prefix updates RFLAGS, can be observed with triple-fault guru
12470 * while booting Fedora 17 64-bit guest.
12471 *
12472 * See Intel Instruction reference for REP/REPE/REPZ/REPNE/REPNZ.
12473 */
12474 if (fIOString)
12475 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RFLAGS);
12476
12477 /*
12478 * If any I/O breakpoints are armed, we need to check if one triggered
12479 * and take appropriate action.
12480 * Note that the I/O breakpoint type is undefined if CR4.DE is 0.
12481 */
12482 rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_DR7);
12483 AssertRCReturn(rc, rc);
12484
12485 /** @todo Optimize away the DBGFBpIsHwIoArmed call by having DBGF tell the
12486 * execution engines about whether hyper BPs and such are pending. */
12487 uint32_t const uDr7 = pCtx->dr[7];
12488 if (RT_UNLIKELY( ( (uDr7 & X86_DR7_ENABLED_MASK)
12489 && X86_DR7_ANY_RW_IO(uDr7)
12490 && (pCtx->cr4 & X86_CR4_DE))
12491 || DBGFBpIsHwIoArmed(pVM)))
12492 {
12493 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxIoCheck);
12494
12495 /* We're playing with the host CPU state here, make sure we don't preempt or longjmp. */
12496 VMMRZCallRing3Disable(pVCpu);
12497 HM_DISABLE_PREEMPT(pVCpu);
12498
12499 bool fIsGuestDbgActive = CPUMR0DebugStateMaybeSaveGuest(pVCpu, true /* fDr6 */);
12500
12501 VBOXSTRICTRC rcStrict2 = DBGFBpCheckIo(pVM, pVCpu, pCtx, uIOPort, cbValue);
12502 if (rcStrict2 == VINF_EM_RAW_GUEST_TRAP)
12503 {
12504 /* Raise #DB. */
12505 if (fIsGuestDbgActive)
12506 ASMSetDR6(pCtx->dr[6]);
12507 if (pCtx->dr[7] != uDr7)
12508 pVCpu->hm.s.fCtxChanged |= HM_CHANGED_GUEST_DR7;
12509
12510 hmR0VmxSetPendingXcptDB(pVCpu);
12511 }
12512 /* rcStrict is VINF_SUCCESS, VINF_IOM_R3_IOPORT_COMMIT_WRITE, or in [VINF_EM_FIRST..VINF_EM_LAST],
12513 however we can ditch VINF_IOM_R3_IOPORT_COMMIT_WRITE as it has VMCPU_FF_IOM as backup. */
12514 else if ( rcStrict2 != VINF_SUCCESS
12515 && (rcStrict == VINF_SUCCESS || rcStrict2 < rcStrict))
12516 rcStrict = rcStrict2;
12517 AssertCompile(VINF_EM_LAST < VINF_IOM_R3_IOPORT_COMMIT_WRITE);
12518
12519 HM_RESTORE_PREEMPT();
12520 VMMRZCallRing3Enable(pVCpu);
12521 }
12522 }
12523
12524#ifdef VBOX_STRICT
12525 if ( rcStrict == VINF_IOM_R3_IOPORT_READ
12526 || rcStrict == VINF_EM_PENDING_R3_IOPORT_READ)
12527 Assert(!fIOWrite);
12528 else if ( rcStrict == VINF_IOM_R3_IOPORT_WRITE
12529 || rcStrict == VINF_IOM_R3_IOPORT_COMMIT_WRITE
12530 || rcStrict == VINF_EM_PENDING_R3_IOPORT_WRITE)
12531 Assert(fIOWrite);
12532 else
12533 {
12534# if 0 /** @todo r=bird: This is missing a bunch of VINF_EM_FIRST..VINF_EM_LAST
12535 * statuses, that the VMM device and some others may return. See
12536 * IOM_SUCCESS() for guidance. */
12537 AssertMsg( RT_FAILURE(rcStrict)
12538 || rcStrict == VINF_SUCCESS
12539 || rcStrict == VINF_EM_RAW_EMULATE_INSTR
12540 || rcStrict == VINF_EM_DBG_BREAKPOINT
12541 || rcStrict == VINF_EM_RAW_GUEST_TRAP
12542 || rcStrict == VINF_EM_RAW_TO_R3
12543 || rcStrict == VINF_TRPM_XCPT_DISPATCHED, ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
12544# endif
12545 }
12546#endif
12547 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExitIO, y1);
12548 }
12549 else
12550 {
12551 /*
12552 * Frequent exit or something needing probing. Get state and call EMHistoryExec.
12553 */
12554 int rc2 = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
12555 AssertRCReturn(rc2, rc2);
12556 STAM_COUNTER_INC(!fIOString ? fIOWrite ? &pVCpu->hm.s.StatExitIOWrite : &pVCpu->hm.s.StatExitIORead
12557 : fIOWrite ? &pVCpu->hm.s.StatExitIOStringWrite : &pVCpu->hm.s.StatExitIOStringRead);
12558 Log4(("IOExit/%u: %04x:%08RX64: %s%s%s %#x LB %u -> EMHistoryExec\n",
12559 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip,
12560 VMX_EXIT_QUAL_IO_IS_REP(pVmxTransient->uExitQual) ? "REP " : "",
12561 fIOWrite ? "OUT" : "IN", fIOString ? "S" : "", uIOPort, uIOWidth));
12562
12563 rcStrict = EMHistoryExec(pVCpu, pExitRec, 0);
12564 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
12565
12566 Log4(("IOExit/%u: %04x:%08RX64: EMHistoryExec -> %Rrc + %04x:%08RX64\n",
12567 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip,
12568 VBOXSTRICTRC_VAL(rcStrict), pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip));
12569 }
12570 return rcStrict;
12571}
12572
12573
12574/**
12575 * VM-exit handler for task switches (VMX_EXIT_TASK_SWITCH). Unconditional
12576 * VM-exit.
12577 */
12578HMVMX_EXIT_DECL hmR0VmxExitTaskSwitch(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12579{
12580 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12581
12582 /* Check if this task-switch occurred while delivery an event through the guest IDT. */
12583 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12584 AssertRCReturn(rc, rc);
12585 if (VMX_EXIT_QUAL_TASK_SWITCH_TYPE(pVmxTransient->uExitQual) == VMX_EXIT_QUAL_TASK_SWITCH_TYPE_IDT)
12586 {
12587 rc = hmR0VmxReadIdtVectoringInfoVmcs(pVmxTransient);
12588 AssertRCReturn(rc, rc);
12589 if (VMX_IDT_VECTORING_INFO_IS_VALID(pVmxTransient->uIdtVectoringInfo))
12590 {
12591 uint32_t uErrCode;
12592 RTGCUINTPTR GCPtrFaultAddress;
12593 uint32_t const uIntType = VMX_IDT_VECTORING_INFO_TYPE(pVmxTransient->uIdtVectoringInfo);
12594 uint32_t const uVector = VMX_IDT_VECTORING_INFO_VECTOR(pVmxTransient->uIdtVectoringInfo);
12595 bool const fErrorCodeValid = VMX_IDT_VECTORING_INFO_IS_ERROR_CODE_VALID(pVmxTransient->uIdtVectoringInfo);
12596 if (fErrorCodeValid)
12597 {
12598 rc = hmR0VmxReadIdtVectoringErrorCodeVmcs(pVmxTransient);
12599 AssertRCReturn(rc, rc);
12600 uErrCode = pVmxTransient->uIdtVectoringErrorCode;
12601 }
12602 else
12603 uErrCode = 0;
12604
12605 if ( uIntType == VMX_IDT_VECTORING_INFO_TYPE_HW_XCPT
12606 && uVector == X86_XCPT_PF)
12607 GCPtrFaultAddress = pVCpu->cpum.GstCtx.cr2;
12608 else
12609 GCPtrFaultAddress = 0;
12610
12611 rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
12612 AssertRCReturn(rc, rc);
12613
12614 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_IDT_INFO(pVmxTransient->uIdtVectoringInfo),
12615 pVmxTransient->cbInstr, uErrCode, GCPtrFaultAddress);
12616
12617 Log4Func(("Pending event. uIntType=%#x uVector=%#x\n", uIntType, uVector));
12618 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitTaskSwitch);
12619 return VINF_EM_RAW_INJECT_TRPM_EVENT;
12620 }
12621 }
12622
12623 /* Fall back to the interpreter to emulate the task-switch. */
12624 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitTaskSwitch);
12625 return VERR_EM_INTERPRETER;
12626}
12627
12628
12629/**
12630 * VM-exit handler for monitor-trap-flag (VMX_EXIT_MTF). Conditional VM-exit.
12631 */
12632HMVMX_EXIT_DECL hmR0VmxExitMtf(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12633{
12634 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12635 Assert(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_MONITOR_TRAP_FLAG);
12636 pVCpu->hm.s.vmx.u32ProcCtls &= ~VMX_PROC_CTLS_MONITOR_TRAP_FLAG;
12637 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
12638 AssertRCReturn(rc, rc);
12639 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitMtf);
12640 return VINF_EM_DBG_STEPPED;
12641}
12642
12643
12644/**
12645 * VM-exit handler for APIC access (VMX_EXIT_APIC_ACCESS). Conditional VM-exit.
12646 */
12647HMVMX_EXIT_DECL hmR0VmxExitApicAccess(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12648{
12649 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12650
12651 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitApicAccess);
12652
12653 /* If this VM-exit occurred while delivering an event through the guest IDT, handle it accordingly. */
12654 VBOXSTRICTRC rcStrict1 = hmR0VmxCheckExitDueToEventDelivery(pVCpu, pVmxTransient);
12655 if (RT_LIKELY(rcStrict1 == VINF_SUCCESS))
12656 {
12657 /* For some crazy guest, if an event delivery causes an APIC-access VM-exit, go to instruction emulation. */
12658 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending))
12659 {
12660 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingInterpret);
12661 return VINF_EM_RAW_INJECT_TRPM_EVENT;
12662 }
12663 }
12664 else
12665 {
12666 if (rcStrict1 == VINF_HM_DOUBLE_FAULT)
12667 rcStrict1 = VINF_SUCCESS;
12668 return rcStrict1;
12669 }
12670
12671 /* IOMMIOPhysHandler() below may call into IEM, save the necessary state. */
12672 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
12673 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12674 AssertRCReturn(rc, rc);
12675
12676 /* See Intel spec. 27-6 "Exit Qualifications for APIC-access VM-exits from Linear Accesses & Guest-Phyiscal Addresses" */
12677 uint32_t uAccessType = VMX_EXIT_QUAL_APIC_ACCESS_TYPE(pVmxTransient->uExitQual);
12678 VBOXSTRICTRC rcStrict2;
12679 switch (uAccessType)
12680 {
12681 case VMX_APIC_ACCESS_TYPE_LINEAR_WRITE:
12682 case VMX_APIC_ACCESS_TYPE_LINEAR_READ:
12683 {
12684 AssertMsg( !(pVCpu->hm.s.vmx.u32ProcCtls & VMX_PROC_CTLS_USE_TPR_SHADOW)
12685 || VMX_EXIT_QUAL_APIC_ACCESS_OFFSET(pVmxTransient->uExitQual) != XAPIC_OFF_TPR,
12686 ("hmR0VmxExitApicAccess: can't access TPR offset while using TPR shadowing.\n"));
12687
12688 RTGCPHYS GCPhys = pVCpu->hm.s.vmx.u64MsrApicBase; /* Always up-to-date, u64MsrApicBase is not part of the VMCS. */
12689 GCPhys &= PAGE_BASE_GC_MASK;
12690 GCPhys += VMX_EXIT_QUAL_APIC_ACCESS_OFFSET(pVmxTransient->uExitQual);
12691 PVM pVM = pVCpu->CTX_SUFF(pVM);
12692 Log4Func(("Linear access uAccessType=%#x GCPhys=%#RGp Off=%#x\n", uAccessType, GCPhys,
12693 VMX_EXIT_QUAL_APIC_ACCESS_OFFSET(pVmxTransient->uExitQual)));
12694
12695 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
12696 rcStrict2 = IOMMMIOPhysHandler(pVM, pVCpu,
12697 uAccessType == VMX_APIC_ACCESS_TYPE_LINEAR_READ ? 0 : X86_TRAP_PF_RW,
12698 CPUMCTX2CORE(pCtx), GCPhys);
12699 Log4Func(("IOMMMIOPhysHandler returned %Rrc\n", VBOXSTRICTRC_VAL(rcStrict2)));
12700 if ( rcStrict2 == VINF_SUCCESS
12701 || rcStrict2 == VERR_PAGE_TABLE_NOT_PRESENT
12702 || rcStrict2 == VERR_PAGE_NOT_PRESENT)
12703 {
12704 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RSP | HM_CHANGED_GUEST_RFLAGS
12705 | HM_CHANGED_GUEST_APIC_TPR);
12706 rcStrict2 = VINF_SUCCESS;
12707 }
12708 break;
12709 }
12710
12711 default:
12712 Log4Func(("uAccessType=%#x\n", uAccessType));
12713 rcStrict2 = VINF_EM_RAW_EMULATE_INSTR;
12714 break;
12715 }
12716
12717 if (rcStrict2 != VINF_SUCCESS)
12718 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchApicAccessToR3);
12719 return rcStrict2;
12720}
12721
12722
12723/**
12724 * VM-exit handler for debug-register accesses (VMX_EXIT_MOV_DRX). Conditional
12725 * VM-exit.
12726 */
12727HMVMX_EXIT_DECL hmR0VmxExitMovDRx(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12728{
12729 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12730
12731 /* We should -not- get this VM-exit if the guest's debug registers were active. */
12732 if (pVmxTransient->fWasGuestDebugStateActive)
12733 {
12734 AssertMsgFailed(("Unexpected MOV DRx exit\n"));
12735 HMVMX_UNEXPECTED_EXIT_RET(pVCpu, pVmxTransient);
12736 }
12737
12738 if ( !pVCpu->hm.s.fSingleInstruction
12739 && !pVmxTransient->fWasHyperDebugStateActive)
12740 {
12741 Assert(!DBGFIsStepping(pVCpu));
12742 Assert(pVCpu->hm.s.vmx.u32XcptBitmap & RT_BIT_32(X86_XCPT_DB));
12743
12744 /* Don't intercept MOV DRx any more. */
12745 pVCpu->hm.s.vmx.u32ProcCtls &= ~VMX_PROC_CTLS_MOV_DR_EXIT;
12746 int rc = VMXWriteVmcs32(VMX_VMCS32_CTRL_PROC_EXEC, pVCpu->hm.s.vmx.u32ProcCtls);
12747 AssertRCReturn(rc, rc);
12748
12749 /* We're playing with the host CPU state here, make sure we can't preempt or longjmp. */
12750 VMMRZCallRing3Disable(pVCpu);
12751 HM_DISABLE_PREEMPT(pVCpu);
12752
12753 /* Save the host & load the guest debug state, restart execution of the MOV DRx instruction. */
12754 CPUMR0LoadGuestDebugState(pVCpu, true /* include DR6 */);
12755 Assert(CPUMIsGuestDebugStateActive(pVCpu) || HC_ARCH_BITS == 32);
12756
12757 HM_RESTORE_PREEMPT();
12758 VMMRZCallRing3Enable(pVCpu);
12759
12760#ifdef VBOX_WITH_STATISTICS
12761 rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12762 AssertRCReturn(rc, rc);
12763 if (VMX_EXIT_QUAL_DRX_DIRECTION(pVmxTransient->uExitQual) == VMX_EXIT_QUAL_DRX_DIRECTION_WRITE)
12764 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxWrite);
12765 else
12766 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxRead);
12767#endif
12768 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxContextSwitch);
12769 return VINF_SUCCESS;
12770 }
12771
12772 /*
12773 * EMInterpretDRx[Write|Read]() calls CPUMIsGuestIn64BitCode() which requires EFER, CS. EFER is always up-to-date.
12774 * Update the segment registers and DR7 from the CPU.
12775 */
12776 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
12777 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12778 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_SREG_MASK | CPUMCTX_EXTRN_DR7);
12779 AssertRCReturn(rc, rc);
12780 Log4Func(("CS:RIP=%04x:%08RX64\n", pCtx->cs.Sel, pCtx->rip));
12781
12782 PVM pVM = pVCpu->CTX_SUFF(pVM);
12783 if (VMX_EXIT_QUAL_DRX_DIRECTION(pVmxTransient->uExitQual) == VMX_EXIT_QUAL_DRX_DIRECTION_WRITE)
12784 {
12785 rc = EMInterpretDRxWrite(pVM, pVCpu, CPUMCTX2CORE(pCtx),
12786 VMX_EXIT_QUAL_DRX_REGISTER(pVmxTransient->uExitQual),
12787 VMX_EXIT_QUAL_DRX_GENREG(pVmxTransient->uExitQual));
12788 if (RT_SUCCESS(rc))
12789 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_DR7);
12790 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxWrite);
12791 }
12792 else
12793 {
12794 rc = EMInterpretDRxRead(pVM, pVCpu, CPUMCTX2CORE(pCtx),
12795 VMX_EXIT_QUAL_DRX_GENREG(pVmxTransient->uExitQual),
12796 VMX_EXIT_QUAL_DRX_REGISTER(pVmxTransient->uExitQual));
12797 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxRead);
12798 }
12799
12800 Assert(rc == VINF_SUCCESS || rc == VERR_EM_INTERPRETER);
12801 if (RT_SUCCESS(rc))
12802 {
12803 int rc2 = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
12804 AssertRCReturn(rc2, rc2);
12805 return VINF_SUCCESS;
12806 }
12807 return rc;
12808}
12809
12810
12811/**
12812 * VM-exit handler for EPT misconfiguration (VMX_EXIT_EPT_MISCONFIG).
12813 * Conditional VM-exit.
12814 */
12815HMVMX_EXIT_DECL hmR0VmxExitEptMisconfig(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12816{
12817 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12818 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging);
12819
12820 /* If this VM-exit occurred while delivering an event through the guest IDT, handle it accordingly. */
12821 VBOXSTRICTRC rcStrict1 = hmR0VmxCheckExitDueToEventDelivery(pVCpu, pVmxTransient);
12822 if (RT_LIKELY(rcStrict1 == VINF_SUCCESS))
12823 {
12824 /* If event delivery causes an EPT misconfig (MMIO), go back to instruction emulation as otherwise
12825 injecting the original pending event would most likely cause the same EPT misconfig VM-exit. */
12826 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending))
12827 {
12828 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingInterpret);
12829 return VINF_EM_RAW_INJECT_TRPM_EVENT;
12830 }
12831 }
12832 else
12833 {
12834 if (rcStrict1 == VINF_HM_DOUBLE_FAULT)
12835 rcStrict1 = VINF_SUCCESS;
12836 return rcStrict1;
12837 }
12838
12839 /*
12840 * Get sufficent state and update the exit history entry.
12841 */
12842 RTGCPHYS GCPhys;
12843 int rc = VMXReadVmcs64(VMX_VMCS64_RO_GUEST_PHYS_ADDR_FULL, &GCPhys);
12844 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
12845 AssertRCReturn(rc, rc);
12846
12847 VBOXSTRICTRC rcStrict;
12848 PCEMEXITREC pExitRec = EMHistoryUpdateFlagsAndTypeAndPC(pVCpu,
12849 EMEXIT_MAKE_FT(EMEXIT_F_KIND_EM | EMEXIT_F_HM, EMEXITTYPE_MMIO),
12850 pVCpu->cpum.GstCtx.rip + pVCpu->cpum.GstCtx.cs.u64Base);
12851 if (!pExitRec)
12852 {
12853 /*
12854 * If we succeed, resume guest execution.
12855 * If we fail in interpreting the instruction because we couldn't get the guest physical address
12856 * of the page containing the instruction via the guest's page tables (we would invalidate the guest page
12857 * in the host TLB), resume execution which would cause a guest page fault to let the guest handle this
12858 * weird case. See @bugref{6043}.
12859 */
12860 PVM pVM = pVCpu->CTX_SUFF(pVM);
12861 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
12862 rcStrict = PGMR0Trap0eHandlerNPMisconfig(pVM, pVCpu, PGMMODE_EPT, CPUMCTX2CORE(pCtx), GCPhys, UINT32_MAX);
12863 Log4Func(("At %#RGp RIP=%#RX64 rc=%Rrc\n", GCPhys, pCtx->rip, VBOXSTRICTRC_VAL(rcStrict)));
12864 if ( rcStrict == VINF_SUCCESS
12865 || rcStrict == VERR_PAGE_TABLE_NOT_PRESENT
12866 || rcStrict == VERR_PAGE_NOT_PRESENT)
12867 {
12868 /* Successfully handled MMIO operation. */
12869 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RSP | HM_CHANGED_GUEST_RFLAGS
12870 | HM_CHANGED_GUEST_APIC_TPR);
12871 rcStrict = VINF_SUCCESS;
12872 }
12873 }
12874 else
12875 {
12876 /*
12877 * Frequent exit or something needing probing. Get state and call EMHistoryExec.
12878 */
12879 int rc2 = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
12880 AssertRCReturn(rc2, rc2);
12881
12882 Log4(("EptMisscfgExit/%u: %04x:%08RX64: %RGp -> EMHistoryExec\n",
12883 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip, GCPhys));
12884
12885 rcStrict = EMHistoryExec(pVCpu, pExitRec, 0);
12886 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
12887
12888 Log4(("EptMisscfgExit/%u: %04x:%08RX64: EMHistoryExec -> %Rrc + %04x:%08RX64\n",
12889 pVCpu->idCpu, pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip,
12890 VBOXSTRICTRC_VAL(rcStrict), pVCpu->cpum.GstCtx.cs.Sel, pVCpu->cpum.GstCtx.rip));
12891 }
12892 return VBOXSTRICTRC_TODO(rcStrict);
12893}
12894
12895
12896/**
12897 * VM-exit handler for EPT violation (VMX_EXIT_EPT_VIOLATION). Conditional
12898 * VM-exit.
12899 */
12900HMVMX_EXIT_DECL hmR0VmxExitEptViolation(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12901{
12902 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12903 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging);
12904
12905 /* If this VM-exit occurred while delivering an event through the guest IDT, handle it accordingly. */
12906 VBOXSTRICTRC rcStrict1 = hmR0VmxCheckExitDueToEventDelivery(pVCpu, pVmxTransient);
12907 if (RT_LIKELY(rcStrict1 == VINF_SUCCESS))
12908 {
12909 /* In the unlikely case that the EPT violation happened as a result of delivering an event, log it. */
12910 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending))
12911 Log4Func(("EPT violation with an event pending u64IntInfo=%#RX64\n", pVCpu->hm.s.Event.u64IntInfo));
12912 }
12913 else
12914 {
12915 if (rcStrict1 == VINF_HM_DOUBLE_FAULT)
12916 rcStrict1 = VINF_SUCCESS;
12917 return rcStrict1;
12918 }
12919
12920 RTGCPHYS GCPhys;
12921 int rc = VMXReadVmcs64(VMX_VMCS64_RO_GUEST_PHYS_ADDR_FULL, &GCPhys);
12922 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
12923 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_MUST_MASK);
12924 AssertRCReturn(rc, rc);
12925
12926 /* Intel spec. Table 27-7 "Exit Qualifications for EPT violations". */
12927 AssertMsg(((pVmxTransient->uExitQual >> 7) & 3) != 2, ("%#RX64", pVmxTransient->uExitQual));
12928
12929 RTGCUINT uErrorCode = 0;
12930 if (pVmxTransient->uExitQual & VMX_EXIT_QUAL_EPT_INSTR_FETCH)
12931 uErrorCode |= X86_TRAP_PF_ID;
12932 if (pVmxTransient->uExitQual & VMX_EXIT_QUAL_EPT_DATA_WRITE)
12933 uErrorCode |= X86_TRAP_PF_RW;
12934 if (pVmxTransient->uExitQual & VMX_EXIT_QUAL_EPT_ENTRY_PRESENT)
12935 uErrorCode |= X86_TRAP_PF_P;
12936
12937 TRPMAssertXcptPF(pVCpu, GCPhys, uErrorCode);
12938
12939
12940 /* Handle the pagefault trap for the nested shadow table. */
12941 PVM pVM = pVCpu->CTX_SUFF(pVM);
12942 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
12943
12944 Log4Func(("EPT violation %#x at %#RX64 ErrorCode %#x CS:RIP=%04x:%08RX64\n", pVmxTransient->uExitQual, GCPhys, uErrorCode,
12945 pCtx->cs.Sel, pCtx->rip));
12946
12947 VBOXSTRICTRC rcStrict2 = PGMR0Trap0eHandlerNestedPaging(pVM, pVCpu, PGMMODE_EPT, uErrorCode, CPUMCTX2CORE(pCtx), GCPhys);
12948 TRPMResetTrap(pVCpu);
12949
12950 /* Same case as PGMR0Trap0eHandlerNPMisconfig(). See comment above, @bugref{6043}. */
12951 if ( rcStrict2 == VINF_SUCCESS
12952 || rcStrict2 == VERR_PAGE_TABLE_NOT_PRESENT
12953 || rcStrict2 == VERR_PAGE_NOT_PRESENT)
12954 {
12955 /* Successfully synced our nested page tables. */
12956 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitReasonNpf);
12957 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RSP | HM_CHANGED_GUEST_RFLAGS);
12958 return VINF_SUCCESS;
12959 }
12960
12961 Log4Func(("EPT return to ring-3 rcStrict2=%Rrc\n", VBOXSTRICTRC_VAL(rcStrict2)));
12962 return rcStrict2;
12963}
12964
12965/** @} */
12966
12967/** @name VM-exit exception handlers.
12968 * @{
12969 */
12970/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
12971/* -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= VM-exit exception handlers =-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=- */
12972/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
12973
12974/**
12975 * VM-exit exception handler for \#MF (Math Fault: floating point exception).
12976 */
12977static int hmR0VmxExitXcptMF(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
12978{
12979 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
12980 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestMF);
12981
12982 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR0);
12983 AssertRCReturn(rc, rc);
12984
12985 if (!(pVCpu->cpum.GstCtx.cr0 & X86_CR0_NE))
12986 {
12987 /* Convert a #MF into a FERR -> IRQ 13. See @bugref{6117}. */
12988 rc = PDMIsaSetIrq(pVCpu->CTX_SUFF(pVM), 13, 1, 0 /* uTagSrc */);
12989
12990 /** @todo r=ramshankar: The Intel spec. does -not- specify that this VM-exit
12991 * provides VM-exit instruction length. If this causes problem later,
12992 * disassemble the instruction like it's done on AMD-V. */
12993 int rc2 = hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
12994 AssertRCReturn(rc2, rc2);
12995 return rc;
12996 }
12997
12998 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
12999 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13000 return rc;
13001}
13002
13003
13004/**
13005 * VM-exit exception handler for \#BP (Breakpoint exception).
13006 */
13007static int hmR0VmxExitXcptBP(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13008{
13009 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13010 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestBP);
13011
13012 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
13013 AssertRCReturn(rc, rc);
13014
13015 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
13016 rc = DBGFRZTrap03Handler(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx));
13017 if (rc == VINF_EM_RAW_GUEST_TRAP)
13018 {
13019 rc = hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
13020 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13021 rc |= hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13022 AssertRCReturn(rc, rc);
13023
13024 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
13025 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13026 }
13027
13028 Assert(rc == VINF_SUCCESS || rc == VINF_EM_RAW_GUEST_TRAP || rc == VINF_EM_DBG_BREAKPOINT);
13029 return rc;
13030}
13031
13032
13033/**
13034 * VM-exit exception handler for \#AC (alignment check exception).
13035 */
13036static int hmR0VmxExitXcptAC(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13037{
13038 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13039
13040 /*
13041 * Re-inject it. We'll detect any nesting before getting here.
13042 */
13043 int rc = hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13044 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13045 AssertRCReturn(rc, rc);
13046 Assert(ASMAtomicUoReadU32(&pVmxTransient->fVmcsFieldsRead) & HMVMX_READ_EXIT_INTERRUPTION_INFO);
13047
13048 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
13049 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13050 return VINF_SUCCESS;
13051}
13052
13053
13054/**
13055 * VM-exit exception handler for \#DB (Debug exception).
13056 */
13057static int hmR0VmxExitXcptDB(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13058{
13059 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13060 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestDB);
13061
13062 /*
13063 * Get the DR6-like values from the VM-exit qualification and pass it to DBGF
13064 * for processing.
13065 */
13066 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13067
13068 /* Refer Intel spec. Table 27-1. "Exit Qualifications for debug exceptions" for the format. */
13069 uint64_t uDR6 = X86_DR6_INIT_VAL;
13070 uDR6 |= (pVmxTransient->uExitQual & (X86_DR6_B0 | X86_DR6_B1 | X86_DR6_B2 | X86_DR6_B3 | X86_DR6_BD | X86_DR6_BS));
13071
13072 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
13073 rc = DBGFRZTrap01Handler(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx), uDR6, pVCpu->hm.s.fSingleInstruction);
13074 Log6Func(("rc=%Rrc\n", rc));
13075 if (rc == VINF_EM_RAW_GUEST_TRAP)
13076 {
13077 /*
13078 * The exception was for the guest. Update DR6, DR7.GD and
13079 * IA32_DEBUGCTL.LBR before forwarding it.
13080 * (See Intel spec. 27.1 "Architectural State before a VM-Exit".)
13081 */
13082 VMMRZCallRing3Disable(pVCpu);
13083 HM_DISABLE_PREEMPT(pVCpu);
13084
13085 pCtx->dr[6] &= ~X86_DR6_B_MASK;
13086 pCtx->dr[6] |= uDR6;
13087 if (CPUMIsGuestDebugStateActive(pVCpu))
13088 ASMSetDR6(pCtx->dr[6]);
13089
13090 HM_RESTORE_PREEMPT();
13091 VMMRZCallRing3Enable(pVCpu);
13092
13093 rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_DR7);
13094 AssertRCReturn(rc, rc);
13095
13096 /* X86_DR7_GD will be cleared if DRx accesses should be trapped inside the guest. */
13097 pCtx->dr[7] &= ~X86_DR7_GD;
13098
13099 /* Paranoia. */
13100 pCtx->dr[7] &= ~X86_DR7_RAZ_MASK;
13101 pCtx->dr[7] |= X86_DR7_RA1_MASK;
13102
13103 rc = VMXWriteVmcs32(VMX_VMCS_GUEST_DR7, (uint32_t)pCtx->dr[7]);
13104 AssertRCReturn(rc, rc);
13105
13106 /*
13107 * Raise #DB in the guest.
13108 *
13109 * It is important to reflect exactly what the VM-exit gave us (preserving the
13110 * interruption-type) rather than use hmR0VmxSetPendingXcptDB() as the #DB could've
13111 * been raised while executing ICEBP (INT1) and not the regular #DB. Thus it may
13112 * trigger different handling in the CPU (like skipping DPL checks), see @bugref{6398}.
13113 *
13114 * Intel re-documented ICEBP/INT1 on May 2018 previously documented as part of
13115 * Intel 386, see Intel spec. 24.8.3 "VM-Entry Controls for Event Injection".
13116 */
13117 rc = hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
13118 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13119 rc |= hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13120 AssertRCReturn(rc, rc);
13121 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
13122 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13123 return VINF_SUCCESS;
13124 }
13125
13126 /*
13127 * Not a guest trap, must be a hypervisor related debug event then.
13128 * Update DR6 in case someone is interested in it.
13129 */
13130 AssertMsg(rc == VINF_EM_DBG_STEPPED || rc == VINF_EM_DBG_BREAKPOINT, ("%Rrc\n", rc));
13131 AssertReturn(pVmxTransient->fWasHyperDebugStateActive, VERR_HM_IPE_5);
13132 CPUMSetHyperDR6(pVCpu, uDR6);
13133
13134 return rc;
13135}
13136
13137
13138/**
13139 * Hacks its way around the lovely mesa driver's backdoor accesses.
13140 *
13141 * @sa hmR0SvmHandleMesaDrvGp
13142 */
13143static int hmR0VmxHandleMesaDrvGp(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, PCPUMCTX pCtx)
13144{
13145 Log(("hmR0VmxHandleMesaDrvGp: at %04x:%08RX64 rcx=%RX64 rbx=%RX64\n", pCtx->cs.Sel, pCtx->rip, pCtx->rcx, pCtx->rbx));
13146 RT_NOREF(pCtx);
13147
13148 /* For now we'll just skip the instruction. */
13149 return hmR0VmxAdvanceGuestRip(pVCpu, pVmxTransient);
13150}
13151
13152
13153/**
13154 * Checks if the \#GP'ing instruction is the mesa driver doing it's lovely
13155 * backdoor logging w/o checking what it is running inside.
13156 *
13157 * This recognizes an "IN EAX,DX" instruction executed in flat ring-3, with the
13158 * backdoor port and magic numbers loaded in registers.
13159 *
13160 * @returns true if it is, false if it isn't.
13161 * @sa hmR0SvmIsMesaDrvGp
13162 */
13163DECLINLINE(bool) hmR0VmxIsMesaDrvGp(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient, PCPUMCTX pCtx)
13164{
13165 /* 0xed: IN eAX,dx */
13166 uint8_t abInstr[1];
13167 if (pVmxTransient->cbInstr != sizeof(abInstr))
13168 return false;
13169
13170 /* Check that it is #GP(0). */
13171 if (pVmxTransient->uExitIntErrorCode != 0)
13172 return false;
13173
13174 /* Check magic and port. */
13175 Assert(!(pCtx->fExtrn & (CPUMCTX_EXTRN_RAX | CPUMCTX_EXTRN_RDX | CPUMCTX_EXTRN_RCX)));
13176 /*Log(("hmR0VmxIsMesaDrvGp: rax=%RX64 rdx=%RX64\n", pCtx->rax, pCtx->rdx));*/
13177 if (pCtx->rax != UINT32_C(0x564d5868))
13178 return false;
13179 if (pCtx->dx != UINT32_C(0x5658))
13180 return false;
13181
13182 /* Flat ring-3 CS. */
13183 AssertCompile(HMVMX_CPUMCTX_EXTRN_ALL & CPUMCTX_EXTRN_CS);
13184 Assert(!(pCtx->fExtrn & CPUMCTX_EXTRN_CS));
13185 /*Log(("hmR0VmxIsMesaDrvGp: cs.Attr.n.u2Dpl=%d base=%Rx64\n", pCtx->cs.Attr.n.u2Dpl, pCtx->cs.u64Base));*/
13186 if (pCtx->cs.Attr.n.u2Dpl != 3)
13187 return false;
13188 if (pCtx->cs.u64Base != 0)
13189 return false;
13190
13191 /* Check opcode. */
13192 AssertCompile(HMVMX_CPUMCTX_EXTRN_ALL & CPUMCTX_EXTRN_RIP);
13193 Assert(!(pCtx->fExtrn & CPUMCTX_EXTRN_RIP));
13194 int rc = PGMPhysSimpleReadGCPtr(pVCpu, abInstr, pCtx->rip, sizeof(abInstr));
13195 /*Log(("hmR0VmxIsMesaDrvGp: PGMPhysSimpleReadGCPtr -> %Rrc %#x\n", rc, abInstr[0]));*/
13196 if (RT_FAILURE(rc))
13197 return false;
13198 if (abInstr[0] != 0xed)
13199 return false;
13200
13201 return true;
13202}
13203
13204
13205/**
13206 * VM-exit exception handler for \#GP (General-protection exception).
13207 *
13208 * @remarks Requires pVmxTransient->uExitIntInfo to be up-to-date.
13209 */
13210static int hmR0VmxExitXcptGP(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13211{
13212 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13213 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestGP);
13214
13215 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
13216 if (pVCpu->hm.s.vmx.RealMode.fRealOnV86Active)
13217 { /* likely */ }
13218 else
13219 {
13220#ifndef HMVMX_ALWAYS_TRAP_ALL_XCPTS
13221 Assert(pVCpu->hm.s.fUsingDebugLoop || pVCpu->hm.s.fTrapXcptGpForLovelyMesaDrv);
13222#endif
13223 /* If the guest is not in real-mode or we have unrestricted execution support, reflect #GP to the guest. */
13224 int rc = hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
13225 rc |= hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13226 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13227 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
13228 AssertRCReturn(rc, rc);
13229 Log4Func(("Gst: CS:RIP %04x:%08RX64 ErrorCode=%#x CR0=%#RX64 CPL=%u TR=%#04x\n", pCtx->cs.Sel, pCtx->rip,
13230 pVmxTransient->uExitIntErrorCode, pCtx->cr0, CPUMGetGuestCPL(pVCpu), pCtx->tr.Sel));
13231
13232 if ( !pVCpu->hm.s.fTrapXcptGpForLovelyMesaDrv
13233 || !hmR0VmxIsMesaDrvGp(pVCpu, pVmxTransient, pCtx))
13234 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
13235 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13236 else
13237 rc = hmR0VmxHandleMesaDrvGp(pVCpu, pVmxTransient, pCtx);
13238 return rc;
13239 }
13240
13241 Assert(CPUMIsGuestInRealModeEx(pCtx));
13242 Assert(!pVCpu->CTX_SUFF(pVM)->hm.s.vmx.fUnrestrictedGuest);
13243
13244 int rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
13245 AssertRCReturn(rc, rc);
13246
13247 VBOXSTRICTRC rcStrict = IEMExecOne(pVCpu);
13248 if (rcStrict == VINF_SUCCESS)
13249 {
13250 if (!CPUMIsGuestInRealModeEx(pCtx))
13251 {
13252 /*
13253 * The guest is no longer in real-mode, check if we can continue executing the
13254 * guest using hardware-assisted VMX. Otherwise, fall back to emulation.
13255 */
13256 if (HMVmxCanExecuteGuest(pVCpu, pCtx))
13257 {
13258 Log4Func(("Mode changed but guest still suitable for executing using VT-x\n"));
13259 pVCpu->hm.s.vmx.RealMode.fRealOnV86Active = false;
13260 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
13261 }
13262 else
13263 {
13264 Log4Func(("Mode changed -> VINF_EM_RESCHEDULE\n"));
13265 rcStrict = VINF_EM_RESCHEDULE;
13266 }
13267 }
13268 else
13269 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
13270 }
13271 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13272 {
13273 rcStrict = VINF_SUCCESS;
13274 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13275 }
13276 return VBOXSTRICTRC_VAL(rcStrict);
13277}
13278
13279
13280/**
13281 * VM-exit exception handler wrapper for generic exceptions. Simply re-injects
13282 * the exception reported in the VMX transient structure back into the VM.
13283 *
13284 * @remarks Requires uExitIntInfo in the VMX transient structure to be
13285 * up-to-date.
13286 */
13287static int hmR0VmxExitXcptGeneric(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13288{
13289 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13290#ifndef HMVMX_ALWAYS_TRAP_ALL_XCPTS
13291 AssertMsg(pVCpu->hm.s.fUsingDebugLoop || pVCpu->hm.s.vmx.RealMode.fRealOnV86Active,
13292 ("uVector=%#x u32XcptBitmap=%#X32\n",
13293 VMX_EXIT_INT_INFO_VECTOR(pVmxTransient->uExitIntInfo), pVCpu->hm.s.vmx.u32XcptBitmap));
13294#endif
13295
13296 /* Re-inject the exception into the guest. This cannot be a double-fault condition which would have been handled in
13297 hmR0VmxCheckExitDueToEventDelivery(). */
13298 int rc = hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13299 rc |= hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13300 AssertRCReturn(rc, rc);
13301 Assert(ASMAtomicUoReadU32(&pVmxTransient->fVmcsFieldsRead) & HMVMX_READ_EXIT_INTERRUPTION_INFO);
13302
13303#ifdef DEBUG_ramshankar
13304 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CS | CPUMCTX_EXTRN_RIP);
13305 uint8_t uVector = VMX_EXIT_INT_INFO_VECTOR(pVmxTransient->uExitIntInfo);
13306 Log(("hmR0VmxExitXcptGeneric: Reinjecting Xcpt. uVector=%#x cs:rip=%#04x:%#RX64\n", uVector, pCtx->cs.Sel, pCtx->rip));
13307#endif
13308
13309 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), pVmxTransient->cbInstr,
13310 pVmxTransient->uExitIntErrorCode, 0 /* GCPtrFaultAddress */);
13311 return VINF_SUCCESS;
13312}
13313
13314
13315/**
13316 * VM-exit exception handler for \#PF (Page-fault exception).
13317 */
13318static int hmR0VmxExitXcptPF(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13319{
13320 HMVMX_VALIDATE_EXIT_XCPT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13321 PVM pVM = pVCpu->CTX_SUFF(pVM);
13322 int rc = hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13323 rc |= hmR0VmxReadExitIntInfoVmcs(pVmxTransient);
13324 rc |= hmR0VmxReadExitIntErrorCodeVmcs(pVmxTransient);
13325 AssertRCReturn(rc, rc);
13326
13327 if (!pVM->hm.s.fNestedPaging)
13328 { /* likely */ }
13329 else
13330 {
13331#if !defined(HMVMX_ALWAYS_TRAP_ALL_XCPTS) && !defined(HMVMX_ALWAYS_TRAP_PF)
13332 Assert(pVCpu->hm.s.fUsingDebugLoop);
13333#endif
13334 pVCpu->hm.s.Event.fPending = false; /* In case it's a contributory or vectoring #PF. */
13335 if (RT_LIKELY(!pVmxTransient->fVectoringDoublePF))
13336 {
13337 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), 0 /* cbInstr */,
13338 pVmxTransient->uExitIntErrorCode, pVmxTransient->uExitQual);
13339 }
13340 else
13341 {
13342 /* A guest page-fault occurred during delivery of a page-fault. Inject #DF. */
13343 hmR0VmxSetPendingXcptDF(pVCpu);
13344 Log4Func(("Pending #DF due to vectoring #PF w/ NestedPaging\n"));
13345 }
13346 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestPF);
13347 return rc;
13348 }
13349
13350 /* If it's a vectoring #PF, emulate injecting the original event injection as PGMTrap0eHandler() is incapable
13351 of differentiating between instruction emulation and event injection that caused a #PF. See @bugref{6607}. */
13352 if (pVmxTransient->fVectoringPF)
13353 {
13354 Assert(pVCpu->hm.s.Event.fPending);
13355 return VINF_EM_RAW_INJECT_TRPM_EVENT;
13356 }
13357
13358 PCPUMCTX pCtx = &pVCpu->cpum.GstCtx;
13359 rc = HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, HMVMX_CPUMCTX_EXTRN_ALL);
13360 AssertRCReturn(rc, rc);
13361
13362 Log4Func(("#PF: cr2=%#RX64 cs:rip=%#04x:%#RX64 uErrCode %#RX32 cr3=%#RX64\n", pVmxTransient->uExitQual, pCtx->cs.Sel,
13363 pCtx->rip, pVmxTransient->uExitIntErrorCode, pCtx->cr3));
13364
13365 TRPMAssertXcptPF(pVCpu, pVmxTransient->uExitQual, (RTGCUINT)pVmxTransient->uExitIntErrorCode);
13366 rc = PGMTrap0eHandler(pVCpu, pVmxTransient->uExitIntErrorCode, CPUMCTX2CORE(pCtx), (RTGCPTR)pVmxTransient->uExitQual);
13367
13368 Log4Func(("#PF: rc=%Rrc\n", rc));
13369 if (rc == VINF_SUCCESS)
13370 {
13371 /*
13372 * This is typically a shadow page table sync or a MMIO instruction. But we may have
13373 * emulated something like LTR or a far jump. Any part of the CPU context may have changed.
13374 */
13375 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
13376 TRPMResetTrap(pVCpu);
13377 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowPF);
13378 return rc;
13379 }
13380
13381 if (rc == VINF_EM_RAW_GUEST_TRAP)
13382 {
13383 if (!pVmxTransient->fVectoringDoublePF)
13384 {
13385 /* It's a guest page fault and needs to be reflected to the guest. */
13386 uint32_t uGstErrorCode = TRPMGetErrorCode(pVCpu);
13387 TRPMResetTrap(pVCpu);
13388 pVCpu->hm.s.Event.fPending = false; /* In case it's a contributory #PF. */
13389 hmR0VmxSetPendingEvent(pVCpu, VMX_ENTRY_INT_INFO_FROM_EXIT_INT_INFO(pVmxTransient->uExitIntInfo), 0 /* cbInstr */,
13390 uGstErrorCode, pVmxTransient->uExitQual);
13391 }
13392 else
13393 {
13394 /* A guest page-fault occurred during delivery of a page-fault. Inject #DF. */
13395 TRPMResetTrap(pVCpu);
13396 pVCpu->hm.s.Event.fPending = false; /* Clear pending #PF to replace it with #DF. */
13397 hmR0VmxSetPendingXcptDF(pVCpu);
13398 Log4Func(("#PF: Pending #DF due to vectoring #PF\n"));
13399 }
13400
13401 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestPF);
13402 return VINF_SUCCESS;
13403 }
13404
13405 TRPMResetTrap(pVCpu);
13406 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowPFEM);
13407 return rc;
13408}
13409
13410/** @} */
13411
13412#ifdef VBOX_WITH_NESTED_HWVIRT_VMX
13413/** @name Nested-guest VM-exit handlers.
13414 * @{
13415 */
13416/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
13417/* -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= Nested-guest VM-exit handlers =-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
13418/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
13419
13420/**
13421 * VM-exit handler for VMCLEAR (VMX_EXIT_VMCLEAR). Unconditional VM-exit.
13422 */
13423HMVMX_EXIT_DECL hmR0VmxExitVmclear(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13424{
13425 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13426
13427 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13428 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13429 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13430 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13431 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13432 AssertRCReturn(rc, rc);
13433
13434 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13435
13436 VMXVEXITINFO ExitInfo;
13437 RT_ZERO(ExitInfo);
13438 ExitInfo.uReason = pVmxTransient->uExitReason;
13439 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13440 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13441 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13442 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_READ, &ExitInfo.GCPtrEffAddr);
13443
13444 VBOXSTRICTRC rcStrict = IEMExecDecodedVmclear(pVCpu, &ExitInfo);
13445 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13446 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13447 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13448 {
13449 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13450 rcStrict = VINF_SUCCESS;
13451 }
13452 return rcStrict;
13453}
13454
13455
13456/**
13457 * VM-exit handler for VMLAUNCH (VMX_EXIT_VMLAUNCH). Unconditional VM-exit.
13458 */
13459HMVMX_EXIT_DECL hmR0VmxExitVmlaunch(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13460{
13461 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13462
13463 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13464 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_VMX_VMENTRY_MASK);
13465 AssertRCReturn(rc, rc);
13466
13467 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13468
13469 VBOXSTRICTRC rcStrict = IEMExecDecodedVmlaunchVmresume(pVCpu, pVmxTransient->cbInstr, VMXINSTRID_VMLAUNCH);
13470 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13471 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
13472 Assert(rcStrict != VINF_IEM_RAISED_XCPT);
13473 return rcStrict;
13474}
13475
13476
13477/**
13478 * VM-exit handler for VMPTRLD (VMX_EXIT_VMPTRLD). Unconditional VM-exit.
13479 */
13480HMVMX_EXIT_DECL hmR0VmxExitVmptrld(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13481{
13482 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13483
13484 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13485 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13486 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13487 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13488 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13489 AssertRCReturn(rc, rc);
13490
13491 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13492
13493 VMXVEXITINFO ExitInfo;
13494 RT_ZERO(ExitInfo);
13495 ExitInfo.uReason = pVmxTransient->uExitReason;
13496 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13497 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13498 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13499 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_READ, &ExitInfo.GCPtrEffAddr);
13500
13501 VBOXSTRICTRC rcStrict = IEMExecDecodedVmptrld(pVCpu, &ExitInfo);
13502 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13503 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13504 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13505 {
13506 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13507 rcStrict = VINF_SUCCESS;
13508 }
13509 return rcStrict;
13510}
13511
13512
13513/**
13514 * VM-exit handler for VMPTRST (VMX_EXIT_VMPTRST). Unconditional VM-exit.
13515 */
13516HMVMX_EXIT_DECL hmR0VmxExitVmptrst(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13517{
13518 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13519
13520 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13521 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13522 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13523 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13524 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13525 AssertRCReturn(rc, rc);
13526
13527 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13528
13529 VMXVEXITINFO ExitInfo;
13530 RT_ZERO(ExitInfo);
13531 ExitInfo.uReason = pVmxTransient->uExitReason;
13532 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13533 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13534 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13535 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_WRITE, &ExitInfo.GCPtrEffAddr);
13536
13537 VBOXSTRICTRC rcStrict = IEMExecDecodedVmptrst(pVCpu, &ExitInfo);
13538 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13539 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13540 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13541 {
13542 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13543 rcStrict = VINF_SUCCESS;
13544 }
13545 return rcStrict;
13546}
13547
13548
13549/**
13550 * VM-exit handler for VMREAD (VMX_EXIT_VMREAD). Unconditional VM-exit.
13551 */
13552HMVMX_EXIT_DECL hmR0VmxExitVmread(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13553{
13554 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13555
13556 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13557 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13558 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13559 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13560 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13561 AssertRCReturn(rc, rc);
13562
13563 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13564
13565 VMXVEXITINFO ExitInfo;
13566 RT_ZERO(ExitInfo);
13567 ExitInfo.uReason = pVmxTransient->uExitReason;
13568 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13569 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13570 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13571 if (!ExitInfo.InstrInfo.VmreadVmwrite.fIsRegOperand)
13572 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_WRITE, &ExitInfo.GCPtrEffAddr);
13573
13574 VBOXSTRICTRC rcStrict = IEMExecDecodedVmread(pVCpu, &ExitInfo);
13575 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13576 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13577 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13578 {
13579 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13580 rcStrict = VINF_SUCCESS;
13581 }
13582 return rcStrict;
13583}
13584
13585
13586/**
13587 * VM-exit handler for VMRESUME (VMX_EXIT_VMRESUME). Unconditional VM-exit.
13588 */
13589HMVMX_EXIT_DECL hmR0VmxExitVmresume(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13590{
13591 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13592
13593 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13594 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, IEM_CPUMCTX_EXTRN_VMX_VMENTRY_MASK);
13595 AssertRCReturn(rc, rc);
13596
13597 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13598
13599 VBOXSTRICTRC rcStrict = IEMExecDecodedVmlaunchVmresume(pVCpu, pVmxTransient->cbInstr, VMXINSTRID_VMRESUME);
13600 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13601 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_ALL_GUEST);
13602 Assert(rcStrict != VINF_IEM_RAISED_XCPT);
13603 return rcStrict;
13604}
13605
13606
13607/**
13608 * VM-exit handler for VMWRITE (VMX_EXIT_VMWRITE). Unconditional VM-exit.
13609 */
13610HMVMX_EXIT_DECL hmR0VmxExitVmwrite(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13611{
13612 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13613
13614 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13615 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13616 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13617 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13618 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13619 AssertRCReturn(rc, rc);
13620
13621 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13622
13623 VMXVEXITINFO ExitInfo;
13624 RT_ZERO(ExitInfo);
13625 ExitInfo.uReason = pVmxTransient->uExitReason;
13626 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13627 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13628 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13629 if (!ExitInfo.InstrInfo.VmreadVmwrite.fIsRegOperand)
13630 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_READ, &ExitInfo.GCPtrEffAddr);
13631
13632 VBOXSTRICTRC rcStrict = IEMExecDecodedVmwrite(pVCpu, &ExitInfo);
13633 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13634 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13635 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13636 {
13637 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13638 rcStrict = VINF_SUCCESS;
13639 }
13640 return rcStrict;
13641}
13642
13643
13644/**
13645 * VM-exit handler for VMXOFF (VMX_EXIT_VMXOFF). Unconditional VM-exit.
13646 */
13647HMVMX_EXIT_DECL hmR0VmxExitVmxoff(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13648{
13649 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13650
13651 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13652 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_CR4 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_NO_MEM_MASK);
13653 AssertRCReturn(rc, rc);
13654
13655 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13656
13657 VBOXSTRICTRC rcStrict = IEMExecDecodedVmxoff(pVCpu, pVmxTransient->cbInstr);
13658 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13659 {
13660 /* VMXOFF changes the internal hwvirt. state but not anything that's visible to the guest other than RIP. */
13661 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_HWVIRT);
13662 }
13663 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13664 {
13665 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13666 rcStrict = VINF_SUCCESS;
13667 }
13668 return rcStrict;
13669}
13670
13671
13672/**
13673 * VM-exit handler for VMXON (VMX_EXIT_VMXON). Unconditional VM-exit.
13674 */
13675HMVMX_EXIT_DECL hmR0VmxExitVmxon(PVMCPU pVCpu, PVMXTRANSIENT pVmxTransient)
13676{
13677 HMVMX_VALIDATE_EXIT_HANDLER_PARAMS(pVCpu, pVmxTransient);
13678
13679 int rc = hmR0VmxReadExitInstrLenVmcs(pVmxTransient);
13680 rc |= HMVMX_CPUMCTX_IMPORT_STATE(pVCpu, CPUMCTX_EXTRN_RSP | CPUMCTX_EXTRN_SREG_MASK
13681 | IEM_CPUMCTX_EXTRN_EXEC_DECODED_MEM_MASK);
13682 rc |= hmR0VmxReadExitInstrInfoVmcs(pVmxTransient);
13683 rc |= hmR0VmxReadExitQualVmcs(pVCpu, pVmxTransient);
13684 AssertRCReturn(rc, rc);
13685
13686 HMVMX_CHECK_EXIT_DUE_TO_VMX_INSTR(pVCpu, pVmxTransient->uExitReason);
13687
13688 VMXVEXITINFO ExitInfo;
13689 RT_ZERO(ExitInfo);
13690 ExitInfo.uReason = pVmxTransient->uExitReason;
13691 ExitInfo.u64Qual = pVmxTransient->uExitQual;
13692 ExitInfo.InstrInfo.u = pVmxTransient->ExitInstrInfo.u;
13693 ExitInfo.cbInstr = pVmxTransient->cbInstr;
13694 HMVMX_DECODE_MEM_OPERAND(pVCpu, ExitInfo.InstrInfo.u, ExitInfo.u64Qual, VMXMEMACCESS_READ, &ExitInfo.GCPtrEffAddr);
13695
13696 VBOXSTRICTRC rcStrict = IEMExecDecodedVmxon(pVCpu, &ExitInfo);
13697 if (RT_LIKELY(rcStrict == VINF_SUCCESS))
13698 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_GUEST_RIP | HM_CHANGED_GUEST_RFLAGS | HM_CHANGED_GUEST_HWVIRT);
13699 else if (rcStrict == VINF_IEM_RAISED_XCPT)
13700 {
13701 ASMAtomicUoOrU64(&pVCpu->hm.s.fCtxChanged, HM_CHANGED_RAISED_XCPT_MASK);
13702 rcStrict = VINF_SUCCESS;
13703 }
13704 return rcStrict;
13705}
13706
13707/** @} */
13708#endif /* VBOX_WITH_NESTED_HWVIRT_VMX */
13709
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette