VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR0/HMSVMR0.cpp@ 66706

Last change on this file since 66706 was 66581, checked in by vboxsync, 8 years ago

VMM: Nested Hw.virt: Implemented various SVM intercepts in IEM, addressed some todos.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 215.3 KB
Line 
1/* $Id: HMSVMR0.cpp 66581 2017-04-17 03:00:00Z vboxsync $ */
2/** @file
3 * HM SVM (AMD-V) - Host Context Ring-0.
4 */
5
6/*
7 * Copyright (C) 2013-2016 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_HM
23#include <iprt/asm-amd64-x86.h>
24#include <iprt/thread.h>
25
26#include <VBox/vmm/pdmapi.h>
27#include <VBox/vmm/dbgf.h>
28#include <VBox/vmm/iem.h>
29#include <VBox/vmm/iom.h>
30#include <VBox/vmm/tm.h>
31#include <VBox/vmm/gim.h>
32#include <VBox/vmm/apic.h>
33#include "HMInternal.h"
34#include <VBox/vmm/vm.h>
35#include "HMSVMR0.h"
36#include "dtrace/VBoxVMM.h"
37
38#ifdef DEBUG_ramshankar
39# define HMSVM_SYNC_FULL_GUEST_STATE
40# define HMSVM_ALWAYS_TRAP_ALL_XCPTS
41# define HMSVM_ALWAYS_TRAP_PF
42# define HMSVM_ALWAYS_TRAP_TASK_SWITCH
43#endif
44
45
46/*********************************************************************************************************************************
47* Defined Constants And Macros *
48*********************************************************************************************************************************/
49#ifdef VBOX_WITH_STATISTICS
50# define HMSVM_EXITCODE_STAM_COUNTER_INC(u64ExitCode) do { \
51 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitAll); \
52 if ((u64ExitCode) == SVM_EXIT_NPF) \
53 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitReasonNpf); \
54 else \
55 STAM_COUNTER_INC(&pVCpu->hm.s.paStatExitReasonR0[(u64ExitCode) & MASK_EXITREASON_STAT]); \
56 } while (0)
57#else
58# define HMSVM_EXITCODE_STAM_COUNTER_INC(u64ExitCode) do { } while (0)
59#endif
60
61/** If we decide to use a function table approach this can be useful to
62 * switch to a "static DECLCALLBACK(int)". */
63#define HMSVM_EXIT_DECL static int
64
65/** Macro for checking and returning from the using function for
66 * \#VMEXIT intercepts that maybe caused during delivering of another
67 * event in the guest. */
68#define HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY() \
69 do \
70 { \
71 int rc = hmR0SvmCheckExitDueToEventDelivery(pVCpu, pCtx, pSvmTransient); \
72 if (RT_LIKELY(rc == VINF_SUCCESS)) { /* likely */ } \
73 else if (rc == VINF_HM_DOUBLE_FAULT) \
74 return VINF_SUCCESS; \
75 else \
76 return rc; \
77 } while (0)
78
79/** Macro for upgrading a @a a_rc to VINF_EM_DBG_STEPPED after emulating an
80 * instruction that exited. */
81#define HMSVM_CHECK_SINGLE_STEP(a_pVCpu, a_rc) \
82 do { \
83 if ((a_pVCpu)->hm.s.fSingleInstruction && (a_rc) == VINF_SUCCESS) \
84 (a_rc) = VINF_EM_DBG_STEPPED; \
85 } while (0)
86
87/** Assert that preemption is disabled or covered by thread-context hooks. */
88#define HMSVM_ASSERT_PREEMPT_SAFE() Assert( VMMR0ThreadCtxHookIsEnabled(pVCpu) \
89 || !RTThreadPreemptIsEnabled(NIL_RTTHREAD));
90
91/** Assert that we haven't migrated CPUs when thread-context hooks are not
92 * used. */
93#define HMSVM_ASSERT_CPU_SAFE() AssertMsg( VMMR0ThreadCtxHookIsEnabled(pVCpu) \
94 || pVCpu->hm.s.idEnteredCpu == RTMpCpuId(), \
95 ("Illegal migration! Entered on CPU %u Current %u\n", \
96 pVCpu->hm.s.idEnteredCpu, RTMpCpuId()));
97
98/** Exception bitmap mask for all contributory exceptions.
99 *
100 * Page fault is deliberately excluded here as it's conditional as to whether
101 * it's contributory or benign. Page faults are handled separately.
102 */
103#define HMSVM_CONTRIBUTORY_XCPT_MASK ( RT_BIT(X86_XCPT_GP) | RT_BIT(X86_XCPT_NP) | RT_BIT(X86_XCPT_SS) | RT_BIT(X86_XCPT_TS) \
104 | RT_BIT(X86_XCPT_DE))
105
106/** @name VMCB Clean Bits.
107 *
108 * These flags are used for VMCB-state caching. A set VMCB Clean bit indicates
109 * AMD-V doesn't need to reload the corresponding value(s) from the VMCB in
110 * memory.
111 *
112 * @{ */
113/** All intercepts vectors, TSC offset, PAUSE filter counter. */
114#define HMSVM_VMCB_CLEAN_INTERCEPTS RT_BIT(0)
115/** I/O permission bitmap, MSR permission bitmap. */
116#define HMSVM_VMCB_CLEAN_IOPM_MSRPM RT_BIT(1)
117/** ASID. */
118#define HMSVM_VMCB_CLEAN_ASID RT_BIT(2)
119/** TRP: V_TPR, V_IRQ, V_INTR_PRIO, V_IGN_TPR, V_INTR_MASKING,
120V_INTR_VECTOR. */
121#define HMSVM_VMCB_CLEAN_TPR RT_BIT(3)
122/** Nested Paging: Nested CR3 (nCR3), PAT. */
123#define HMSVM_VMCB_CLEAN_NP RT_BIT(4)
124/** Control registers (CR0, CR3, CR4, EFER). */
125#define HMSVM_VMCB_CLEAN_CRX_EFER RT_BIT(5)
126/** Debug registers (DR6, DR7). */
127#define HMSVM_VMCB_CLEAN_DRX RT_BIT(6)
128/** GDT, IDT limit and base. */
129#define HMSVM_VMCB_CLEAN_DT RT_BIT(7)
130/** Segment register: CS, SS, DS, ES limit and base. */
131#define HMSVM_VMCB_CLEAN_SEG RT_BIT(8)
132/** CR2.*/
133#define HMSVM_VMCB_CLEAN_CR2 RT_BIT(9)
134/** Last-branch record (DbgCtlMsr, br_from, br_to, lastint_from, lastint_to) */
135#define HMSVM_VMCB_CLEAN_LBR RT_BIT(10)
136/** AVIC (AVIC APIC_BAR; AVIC APIC_BACKING_PAGE, AVIC
137PHYSICAL_TABLE and AVIC LOGICAL_TABLE Pointers). */
138#define HMSVM_VMCB_CLEAN_AVIC RT_BIT(11)
139/** Mask of all valid VMCB Clean bits. */
140#define HMSVM_VMCB_CLEAN_ALL ( HMSVM_VMCB_CLEAN_INTERCEPTS \
141 | HMSVM_VMCB_CLEAN_IOPM_MSRPM \
142 | HMSVM_VMCB_CLEAN_ASID \
143 | HMSVM_VMCB_CLEAN_TPR \
144 | HMSVM_VMCB_CLEAN_NP \
145 | HMSVM_VMCB_CLEAN_CRX_EFER \
146 | HMSVM_VMCB_CLEAN_DRX \
147 | HMSVM_VMCB_CLEAN_DT \
148 | HMSVM_VMCB_CLEAN_SEG \
149 | HMSVM_VMCB_CLEAN_CR2 \
150 | HMSVM_VMCB_CLEAN_LBR \
151 | HMSVM_VMCB_CLEAN_AVIC)
152/** @} */
153
154/** @name SVM transient.
155 *
156 * A state structure for holding miscellaneous information across AMD-V
157 * VMRUN/\#VMEXIT operation, restored after the transition.
158 *
159 * @{ */
160typedef struct SVMTRANSIENT
161{
162 /** The host's rflags/eflags. */
163 RTCCUINTREG fEFlags;
164#if HC_ARCH_BITS == 32
165 uint32_t u32Alignment0;
166#endif
167
168 /** The \#VMEXIT exit code (the EXITCODE field in the VMCB). */
169 uint64_t u64ExitCode;
170 /** The guest's TPR value used for TPR shadowing. */
171 uint8_t u8GuestTpr;
172 /** Alignment. */
173 uint8_t abAlignment0[7];
174
175 /** Whether the guest FPU state was active at the time of \#VMEXIT. */
176 bool fWasGuestFPUStateActive;
177 /** Whether the guest debug state was active at the time of \#VMEXIT. */
178 bool fWasGuestDebugStateActive;
179 /** Whether the hyper debug state was active at the time of \#VMEXIT. */
180 bool fWasHyperDebugStateActive;
181 /** Whether the TSC offset mode needs to be updated. */
182 bool fUpdateTscOffsetting;
183 /** Whether the TSC_AUX MSR needs restoring on \#VMEXIT. */
184 bool fRestoreTscAuxMsr;
185 /** Whether the \#VMEXIT was caused by a page-fault during delivery of a
186 * contributary exception or a page-fault. */
187 bool fVectoringDoublePF;
188 /** Whether the \#VMEXIT was caused by a page-fault during delivery of an
189 * external interrupt or NMI. */
190 bool fVectoringPF;
191} SVMTRANSIENT, *PSVMTRANSIENT;
192AssertCompileMemberAlignment(SVMTRANSIENT, u64ExitCode, sizeof(uint64_t));
193AssertCompileMemberAlignment(SVMTRANSIENT, fWasGuestFPUStateActive, sizeof(uint64_t));
194/** @} */
195
196/**
197 * MSRPM (MSR permission bitmap) read permissions (for guest RDMSR).
198 */
199typedef enum SVMMSREXITREAD
200{
201 /** Reading this MSR causes a \#VMEXIT. */
202 SVMMSREXIT_INTERCEPT_READ = 0xb,
203 /** Reading this MSR does not cause a \#VMEXIT. */
204 SVMMSREXIT_PASSTHRU_READ
205} SVMMSREXITREAD;
206
207/**
208 * MSRPM (MSR permission bitmap) write permissions (for guest WRMSR).
209 */
210typedef enum SVMMSREXITWRITE
211{
212 /** Writing to this MSR causes a \#VMEXIT. */
213 SVMMSREXIT_INTERCEPT_WRITE = 0xd,
214 /** Writing to this MSR does not cause a \#VMEXIT. */
215 SVMMSREXIT_PASSTHRU_WRITE
216} SVMMSREXITWRITE;
217
218/**
219 * SVM \#VMEXIT handler.
220 *
221 * @returns VBox status code.
222 * @param pVCpu The cross context virtual CPU structure.
223 * @param pMixedCtx Pointer to the guest-CPU context.
224 * @param pSvmTransient Pointer to the SVM-transient structure.
225 */
226typedef int FNSVMEXITHANDLER(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient);
227
228
229/*********************************************************************************************************************************
230* Internal Functions *
231*********************************************************************************************************************************/
232static void hmR0SvmSetMsrPermission(PVMCPU pVCpu, unsigned uMsr, SVMMSREXITREAD enmRead, SVMMSREXITWRITE enmWrite);
233static void hmR0SvmPendingEventToTrpmTrap(PVMCPU pVCpu);
234static void hmR0SvmLeave(PVMCPU pVCpu);
235
236/** @name \#VMEXIT handlers.
237 * @{
238 */
239static FNSVMEXITHANDLER hmR0SvmExitIntr;
240static FNSVMEXITHANDLER hmR0SvmExitWbinvd;
241static FNSVMEXITHANDLER hmR0SvmExitInvd;
242static FNSVMEXITHANDLER hmR0SvmExitCpuid;
243static FNSVMEXITHANDLER hmR0SvmExitRdtsc;
244static FNSVMEXITHANDLER hmR0SvmExitRdtscp;
245static FNSVMEXITHANDLER hmR0SvmExitRdpmc;
246static FNSVMEXITHANDLER hmR0SvmExitInvlpg;
247static FNSVMEXITHANDLER hmR0SvmExitHlt;
248static FNSVMEXITHANDLER hmR0SvmExitMonitor;
249static FNSVMEXITHANDLER hmR0SvmExitMwait;
250static FNSVMEXITHANDLER hmR0SvmExitShutdown;
251static FNSVMEXITHANDLER hmR0SvmExitReadCRx;
252static FNSVMEXITHANDLER hmR0SvmExitWriteCRx;
253static FNSVMEXITHANDLER hmR0SvmExitSetPendingXcptUD;
254static FNSVMEXITHANDLER hmR0SvmExitMsr;
255static FNSVMEXITHANDLER hmR0SvmExitReadDRx;
256static FNSVMEXITHANDLER hmR0SvmExitWriteDRx;
257static FNSVMEXITHANDLER hmR0SvmExitXsetbv;
258static FNSVMEXITHANDLER hmR0SvmExitIOInstr;
259static FNSVMEXITHANDLER hmR0SvmExitNestedPF;
260static FNSVMEXITHANDLER hmR0SvmExitVIntr;
261static FNSVMEXITHANDLER hmR0SvmExitTaskSwitch;
262static FNSVMEXITHANDLER hmR0SvmExitVmmCall;
263static FNSVMEXITHANDLER hmR0SvmExitPause;
264static FNSVMEXITHANDLER hmR0SvmExitIret;
265static FNSVMEXITHANDLER hmR0SvmExitXcptPF;
266static FNSVMEXITHANDLER hmR0SvmExitXcptNM;
267static FNSVMEXITHANDLER hmR0SvmExitXcptUD;
268static FNSVMEXITHANDLER hmR0SvmExitXcptMF;
269static FNSVMEXITHANDLER hmR0SvmExitXcptDB;
270static FNSVMEXITHANDLER hmR0SvmExitXcptAC;
271static FNSVMEXITHANDLER hmR0SvmExitXcptBP;
272#ifdef VBOX_WITH_NESTED_HWVIRT
273static FNSVMEXITHANDLER hmR0SvmExitClgi;
274static FNSVMEXITHANDLER hmR0SvmExitStgi;
275static FNSVMEXITHANDLER hmR0SvmExitVmload;
276static FNSVMEXITHANDLER hmR0SvmExitVmsave;
277static FNSVMEXITHANDLER hmR0SvmExitInvlpga;
278#endif
279/** @} */
280
281DECLINLINE(int) hmR0SvmHandleExit(PVMCPU pVCpu, PCPUMCTX pMixedCtx, PSVMTRANSIENT pSvmTransient);
282
283
284/*********************************************************************************************************************************
285* Global Variables *
286*********************************************************************************************************************************/
287/** Ring-0 memory object for the IO bitmap. */
288RTR0MEMOBJ g_hMemObjIOBitmap = NIL_RTR0MEMOBJ;
289/** Physical address of the IO bitmap. */
290RTHCPHYS g_HCPhysIOBitmap = 0;
291/** Virtual address of the IO bitmap. */
292R0PTRTYPE(void *) g_pvIOBitmap = NULL;
293
294
295/**
296 * Sets up and activates AMD-V on the current CPU.
297 *
298 * @returns VBox status code.
299 * @param pCpu Pointer to the CPU info struct.
300 * @param pVM The cross context VM structure. Can be
301 * NULL after a resume!
302 * @param pvCpuPage Pointer to the global CPU page.
303 * @param HCPhysCpuPage Physical address of the global CPU page.
304 * @param fEnabledByHost Whether the host OS has already initialized AMD-V.
305 * @param pvArg Unused on AMD-V.
306 */
307VMMR0DECL(int) SVMR0EnableCpu(PHMGLOBALCPUINFO pCpu, PVM pVM, void *pvCpuPage, RTHCPHYS HCPhysCpuPage, bool fEnabledByHost,
308 void *pvArg)
309{
310 Assert(!fEnabledByHost);
311 Assert(HCPhysCpuPage && HCPhysCpuPage != NIL_RTHCPHYS);
312 Assert(RT_ALIGN_T(HCPhysCpuPage, _4K, RTHCPHYS) == HCPhysCpuPage);
313 Assert(pvCpuPage); NOREF(pvCpuPage);
314 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
315
316 NOREF(pvArg);
317 NOREF(fEnabledByHost);
318
319 /* Paranoid: Disable interrupt as, in theory, interrupt handlers might mess with EFER. */
320 RTCCUINTREG fEFlags = ASMIntDisableFlags();
321
322 /*
323 * We must turn on AMD-V and setup the host state physical address, as those MSRs are per CPU.
324 */
325 uint64_t u64HostEfer = ASMRdMsr(MSR_K6_EFER);
326 if (u64HostEfer & MSR_K6_EFER_SVME)
327 {
328 /* If the VBOX_HWVIRTEX_IGNORE_SVM_IN_USE is active, then we blindly use AMD-V. */
329 if ( pVM
330 && pVM->hm.s.svm.fIgnoreInUseError)
331 {
332 pCpu->fIgnoreAMDVInUseError = true;
333 }
334
335 if (!pCpu->fIgnoreAMDVInUseError)
336 {
337 ASMSetFlags(fEFlags);
338 return VERR_SVM_IN_USE;
339 }
340 }
341
342 /* Turn on AMD-V in the EFER MSR. */
343 ASMWrMsr(MSR_K6_EFER, u64HostEfer | MSR_K6_EFER_SVME);
344
345 /* Write the physical page address where the CPU will store the host state while executing the VM. */
346 ASMWrMsr(MSR_K8_VM_HSAVE_PA, HCPhysCpuPage);
347
348 /* Restore interrupts. */
349 ASMSetFlags(fEFlags);
350
351 /*
352 * Theoretically, other hypervisors may have used ASIDs, ideally we should flush all non-zero ASIDs
353 * when enabling SVM. AMD doesn't have an SVM instruction to flush all ASIDs (flushing is done
354 * upon VMRUN). Therefore, just set the fFlushAsidBeforeUse flag which instructs hmR0SvmSetupTLB()
355 * to flush the TLB with before using a new ASID.
356 */
357 pCpu->fFlushAsidBeforeUse = true;
358
359 /*
360 * Ensure each VCPU scheduled on this CPU gets a new VPID on resume. See @bugref{6255}.
361 */
362 ++pCpu->cTlbFlushes;
363
364 return VINF_SUCCESS;
365}
366
367
368/**
369 * Deactivates AMD-V on the current CPU.
370 *
371 * @returns VBox status code.
372 * @param pCpu Pointer to the CPU info struct.
373 * @param pvCpuPage Pointer to the global CPU page.
374 * @param HCPhysCpuPage Physical address of the global CPU page.
375 */
376VMMR0DECL(int) SVMR0DisableCpu(PHMGLOBALCPUINFO pCpu, void *pvCpuPage, RTHCPHYS HCPhysCpuPage)
377{
378 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
379 AssertReturn( HCPhysCpuPage
380 && HCPhysCpuPage != NIL_RTHCPHYS, VERR_INVALID_PARAMETER);
381 AssertReturn(pvCpuPage, VERR_INVALID_PARAMETER);
382 NOREF(pCpu);
383
384 /* Paranoid: Disable interrupts as, in theory, interrupt handlers might mess with EFER. */
385 RTCCUINTREG fEFlags = ASMIntDisableFlags();
386
387 /* Turn off AMD-V in the EFER MSR. */
388 uint64_t u64HostEfer = ASMRdMsr(MSR_K6_EFER);
389 ASMWrMsr(MSR_K6_EFER, u64HostEfer & ~MSR_K6_EFER_SVME);
390
391 /* Invalidate host state physical address. */
392 ASMWrMsr(MSR_K8_VM_HSAVE_PA, 0);
393
394 /* Restore interrupts. */
395 ASMSetFlags(fEFlags);
396
397 return VINF_SUCCESS;
398}
399
400
401/**
402 * Does global AMD-V initialization (called during module initialization).
403 *
404 * @returns VBox status code.
405 */
406VMMR0DECL(int) SVMR0GlobalInit(void)
407{
408 /*
409 * Allocate 12 KB for the IO bitmap. Since this is non-optional and we always intercept all IO accesses, it's done
410 * once globally here instead of per-VM.
411 */
412 Assert(g_hMemObjIOBitmap == NIL_RTR0MEMOBJ);
413 int rc = RTR0MemObjAllocCont(&g_hMemObjIOBitmap, SVM_IOPM_PAGES << X86_PAGE_4K_SHIFT, false /* fExecutable */);
414 if (RT_FAILURE(rc))
415 return rc;
416
417 g_pvIOBitmap = RTR0MemObjAddress(g_hMemObjIOBitmap);
418 g_HCPhysIOBitmap = RTR0MemObjGetPagePhysAddr(g_hMemObjIOBitmap, 0 /* iPage */);
419
420 /* Set all bits to intercept all IO accesses. */
421 ASMMemFill32(g_pvIOBitmap, SVM_IOPM_PAGES << X86_PAGE_4K_SHIFT, UINT32_C(0xffffffff));
422 return VINF_SUCCESS;
423}
424
425
426/**
427 * Does global AMD-V termination (called during module termination).
428 */
429VMMR0DECL(void) SVMR0GlobalTerm(void)
430{
431 if (g_hMemObjIOBitmap != NIL_RTR0MEMOBJ)
432 {
433 RTR0MemObjFree(g_hMemObjIOBitmap, true /* fFreeMappings */);
434 g_pvIOBitmap = NULL;
435 g_HCPhysIOBitmap = 0;
436 g_hMemObjIOBitmap = NIL_RTR0MEMOBJ;
437 }
438}
439
440
441/**
442 * Frees any allocated per-VCPU structures for a VM.
443 *
444 * @param pVM The cross context VM structure.
445 */
446DECLINLINE(void) hmR0SvmFreeStructs(PVM pVM)
447{
448 for (uint32_t i = 0; i < pVM->cCpus; i++)
449 {
450 PVMCPU pVCpu = &pVM->aCpus[i];
451 AssertPtr(pVCpu);
452
453 if (pVCpu->hm.s.svm.hMemObjVmcbHost != NIL_RTR0MEMOBJ)
454 {
455 RTR0MemObjFree(pVCpu->hm.s.svm.hMemObjVmcbHost, false);
456 pVCpu->hm.s.svm.pvVmcbHost = 0;
457 pVCpu->hm.s.svm.HCPhysVmcbHost = 0;
458 pVCpu->hm.s.svm.hMemObjVmcbHost = NIL_RTR0MEMOBJ;
459 }
460
461 if (pVCpu->hm.s.svm.hMemObjVmcb != NIL_RTR0MEMOBJ)
462 {
463 RTR0MemObjFree(pVCpu->hm.s.svm.hMemObjVmcb, false);
464 pVCpu->hm.s.svm.pvVmcb = 0;
465 pVCpu->hm.s.svm.HCPhysVmcb = 0;
466 pVCpu->hm.s.svm.hMemObjVmcb = NIL_RTR0MEMOBJ;
467 }
468
469 if (pVCpu->hm.s.svm.hMemObjMsrBitmap != NIL_RTR0MEMOBJ)
470 {
471 RTR0MemObjFree(pVCpu->hm.s.svm.hMemObjMsrBitmap, false);
472 pVCpu->hm.s.svm.pvMsrBitmap = 0;
473 pVCpu->hm.s.svm.HCPhysMsrBitmap = 0;
474 pVCpu->hm.s.svm.hMemObjMsrBitmap = NIL_RTR0MEMOBJ;
475 }
476 }
477}
478
479
480/**
481 * Does per-VM AMD-V initialization.
482 *
483 * @returns VBox status code.
484 * @param pVM The cross context VM structure.
485 */
486VMMR0DECL(int) SVMR0InitVM(PVM pVM)
487{
488 int rc = VERR_INTERNAL_ERROR_5;
489
490 /*
491 * Check for an AMD CPU erratum which requires us to flush the TLB before every world-switch.
492 */
493 uint32_t u32Family;
494 uint32_t u32Model;
495 uint32_t u32Stepping;
496 if (HMAmdIsSubjectToErratum170(&u32Family, &u32Model, &u32Stepping))
497 {
498 Log4(("SVMR0InitVM: AMD cpu with erratum 170 family %#x model %#x stepping %#x\n", u32Family, u32Model, u32Stepping));
499 pVM->hm.s.svm.fAlwaysFlushTLB = true;
500 }
501
502 /*
503 * Initialize the R0 memory objects up-front so we can properly cleanup on allocation failures.
504 */
505 for (VMCPUID i = 0; i < pVM->cCpus; i++)
506 {
507 PVMCPU pVCpu = &pVM->aCpus[i];
508 pVCpu->hm.s.svm.hMemObjVmcbHost = NIL_RTR0MEMOBJ;
509 pVCpu->hm.s.svm.hMemObjVmcb = NIL_RTR0MEMOBJ;
510 pVCpu->hm.s.svm.hMemObjMsrBitmap = NIL_RTR0MEMOBJ;
511 }
512
513 for (VMCPUID i = 0; i < pVM->cCpus; i++)
514 {
515 PVMCPU pVCpu = &pVM->aCpus[i];
516
517 /*
518 * Allocate one page for the host-context VM control block (VMCB). This is used for additional host-state (such as
519 * FS, GS, Kernel GS Base, etc.) apart from the host-state save area specified in MSR_K8_VM_HSAVE_PA.
520 */
521 rc = RTR0MemObjAllocCont(&pVCpu->hm.s.svm.hMemObjVmcbHost, SVM_VMCB_PAGES << PAGE_SHIFT, false /* fExecutable */);
522 if (RT_FAILURE(rc))
523 goto failure_cleanup;
524
525 pVCpu->hm.s.svm.pvVmcbHost = RTR0MemObjAddress(pVCpu->hm.s.svm.hMemObjVmcbHost);
526 pVCpu->hm.s.svm.HCPhysVmcbHost = RTR0MemObjGetPagePhysAddr(pVCpu->hm.s.svm.hMemObjVmcbHost, 0 /* iPage */);
527 Assert(pVCpu->hm.s.svm.HCPhysVmcbHost < _4G);
528 ASMMemZeroPage(pVCpu->hm.s.svm.pvVmcbHost);
529
530 /*
531 * Allocate one page for the guest-state VMCB.
532 */
533 rc = RTR0MemObjAllocCont(&pVCpu->hm.s.svm.hMemObjVmcb, SVM_VMCB_PAGES << PAGE_SHIFT, false /* fExecutable */);
534 if (RT_FAILURE(rc))
535 goto failure_cleanup;
536
537 pVCpu->hm.s.svm.pvVmcb = RTR0MemObjAddress(pVCpu->hm.s.svm.hMemObjVmcb);
538 pVCpu->hm.s.svm.HCPhysVmcb = RTR0MemObjGetPagePhysAddr(pVCpu->hm.s.svm.hMemObjVmcb, 0 /* iPage */);
539 Assert(pVCpu->hm.s.svm.HCPhysVmcb < _4G);
540 ASMMemZeroPage(pVCpu->hm.s.svm.pvVmcb);
541
542 /*
543 * Allocate two pages (8 KB) for the MSR permission bitmap. There doesn't seem to be a way to convince
544 * SVM to not require one.
545 */
546 rc = RTR0MemObjAllocCont(&pVCpu->hm.s.svm.hMemObjMsrBitmap, SVM_MSRPM_PAGES << X86_PAGE_4K_SHIFT,
547 false /* fExecutable */);
548 if (RT_FAILURE(rc))
549 goto failure_cleanup;
550
551 pVCpu->hm.s.svm.pvMsrBitmap = RTR0MemObjAddress(pVCpu->hm.s.svm.hMemObjMsrBitmap);
552 pVCpu->hm.s.svm.HCPhysMsrBitmap = RTR0MemObjGetPagePhysAddr(pVCpu->hm.s.svm.hMemObjMsrBitmap, 0 /* iPage */);
553 /* Set all bits to intercept all MSR accesses (changed later on). */
554 ASMMemFill32(pVCpu->hm.s.svm.pvMsrBitmap, SVM_MSRPM_PAGES << X86_PAGE_4K_SHIFT, UINT32_C(0xffffffff));
555 }
556
557 return VINF_SUCCESS;
558
559failure_cleanup:
560 hmR0SvmFreeStructs(pVM);
561 return rc;
562}
563
564
565/**
566 * Does per-VM AMD-V termination.
567 *
568 * @returns VBox status code.
569 * @param pVM The cross context VM structure.
570 */
571VMMR0DECL(int) SVMR0TermVM(PVM pVM)
572{
573 hmR0SvmFreeStructs(pVM);
574 return VINF_SUCCESS;
575}
576
577
578/**
579 * Sets the permission bits for the specified MSR in the MSRPM.
580 *
581 * @param pVCpu The cross context virtual CPU structure.
582 * @param uMsr The MSR for which the access permissions are being set.
583 * @param enmRead MSR read permissions.
584 * @param enmWrite MSR write permissions.
585 */
586static void hmR0SvmSetMsrPermission(PVMCPU pVCpu, unsigned uMsr, SVMMSREXITREAD enmRead, SVMMSREXITWRITE enmWrite)
587{
588 uint16_t offMsrpm;
589 uint32_t uMsrpmBit;
590 int rc = hmSvmGetMsrpmOffsetAndBit(uMsr, &offMsrpm, &uMsrpmBit);
591 AssertRC(rc);
592
593 Assert(uMsrpmBit < 0x3fff);
594 Assert(offMsrpm < SVM_MSRPM_PAGES << X86_PAGE_4K_SHIFT);
595
596 uint8_t *pbMsrBitmap = (uint8_t *)pVCpu->hm.s.svm.pvMsrBitmap;
597 pbMsrBitmap += offMsrpm;
598
599 if (enmRead == SVMMSREXIT_INTERCEPT_READ)
600 ASMBitSet(pbMsrBitmap, uMsrpmBit);
601 else
602 ASMBitClear(pbMsrBitmap, uMsrpmBit);
603
604 if (enmWrite == SVMMSREXIT_INTERCEPT_WRITE)
605 ASMBitSet(pbMsrBitmap, uMsrpmBit + 1);
606 else
607 ASMBitClear(pbMsrBitmap, uMsrpmBit + 1);
608
609 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
610 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_IOPM_MSRPM;
611}
612
613
614/**
615 * Sets up AMD-V for the specified VM.
616 * This function is only called once per-VM during initalization.
617 *
618 * @returns VBox status code.
619 * @param pVM The cross context VM structure.
620 */
621VMMR0DECL(int) SVMR0SetupVM(PVM pVM)
622{
623 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
624 AssertReturn(pVM, VERR_INVALID_PARAMETER);
625 Assert(pVM->hm.s.svm.fSupported);
626
627 bool const fPauseFilter = RT_BOOL(pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_PAUSE_FILTER);
628 bool const fPauseFilterThreshold = RT_BOOL(pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_PAUSE_FILTER_THRESHOLD);
629 bool const fUsePauseFilter = fPauseFilter && pVM->hm.s.svm.cPauseFilter && pVM->hm.s.svm.cPauseFilterThresholdTicks;
630
631 for (VMCPUID i = 0; i < pVM->cCpus; i++)
632 {
633 PVMCPU pVCpu = &pVM->aCpus[i];
634 PSVMVMCB pVmcb = (PSVMVMCB)pVM->aCpus[i].hm.s.svm.pvVmcb;
635
636 AssertMsgReturn(pVmcb, ("Invalid pVmcb for vcpu[%u]\n", i), VERR_SVM_INVALID_PVMCB);
637
638 /* Initialize the #VMEXIT history array with end-of-array markers (UINT16_MAX). */
639 Assert(!pVCpu->hm.s.idxExitHistoryFree);
640 HMCPU_EXIT_HISTORY_RESET(pVCpu);
641
642 /* Always trap #AC for reasons of security. */
643 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT_32(X86_XCPT_AC);
644
645 /* Always trap #DB for reasons of security. */
646 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT_32(X86_XCPT_DB);
647
648 /* Trap exceptions unconditionally (debug purposes). */
649#ifdef HMSVM_ALWAYS_TRAP_PF
650 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT(X86_XCPT_PF);
651#endif
652#ifdef HMSVM_ALWAYS_TRAP_ALL_XCPTS
653 /* If you add any exceptions here, make sure to update hmR0SvmHandleExit(). */
654 pVmcb->ctrl.u32InterceptXcpt |= 0
655 | RT_BIT(X86_XCPT_BP)
656 | RT_BIT(X86_XCPT_DE)
657 | RT_BIT(X86_XCPT_NM)
658 | RT_BIT(X86_XCPT_UD)
659 | RT_BIT(X86_XCPT_NP)
660 | RT_BIT(X86_XCPT_SS)
661 | RT_BIT(X86_XCPT_GP)
662 | RT_BIT(X86_XCPT_PF)
663 | RT_BIT(X86_XCPT_MF)
664 ;
665#endif
666
667 /* Set up unconditional intercepts and conditions. */
668 pVmcb->ctrl.u64InterceptCtrl = SVM_CTRL_INTERCEPT_INTR /* External interrupt causes a #VMEXIT. */
669 | SVM_CTRL_INTERCEPT_NMI /* Non-maskable interrupts causes a #VMEXIT. */
670 | SVM_CTRL_INTERCEPT_INIT /* INIT signal causes a #VMEXIT. */
671 | SVM_CTRL_INTERCEPT_RDPMC /* RDPMC causes a #VMEXIT. */
672 | SVM_CTRL_INTERCEPT_CPUID /* CPUID causes a #VMEXIT. */
673 | SVM_CTRL_INTERCEPT_RSM /* RSM causes a #VMEXIT. */
674 | SVM_CTRL_INTERCEPT_HLT /* HLT causes a #VMEXIT. */
675 | SVM_CTRL_INTERCEPT_IOIO_PROT /* Use the IOPM to cause IOIO #VMEXITs. */
676 | SVM_CTRL_INTERCEPT_MSR_PROT /* MSR access not covered by MSRPM causes a #VMEXIT.*/
677 | SVM_CTRL_INTERCEPT_INVLPGA /* INVLPGA causes a #VMEXIT. */
678 | SVM_CTRL_INTERCEPT_SHUTDOWN /* Shutdown events causes a #VMEXIT. */
679 | SVM_CTRL_INTERCEPT_FERR_FREEZE /* Intercept "freezing" during legacy FPU handling. */
680 | SVM_CTRL_INTERCEPT_VMRUN /* VMRUN causes a #VMEXIT. */
681 | SVM_CTRL_INTERCEPT_VMMCALL /* VMMCALL causes a #VMEXIT. */
682 | SVM_CTRL_INTERCEPT_VMLOAD /* VMLOAD causes a #VMEXIT. */
683 | SVM_CTRL_INTERCEPT_VMSAVE /* VMSAVE causes a #VMEXIT. */
684 | SVM_CTRL_INTERCEPT_STGI /* STGI causes a #VMEXIT. */
685 | SVM_CTRL_INTERCEPT_CLGI /* CLGI causes a #VMEXIT. */
686 | SVM_CTRL_INTERCEPT_SKINIT /* SKINIT causes a #VMEXIT. */
687 | SVM_CTRL_INTERCEPT_WBINVD /* WBINVD causes a #VMEXIT. */
688 | SVM_CTRL_INTERCEPT_MONITOR /* MONITOR causes a #VMEXIT. */
689 | SVM_CTRL_INTERCEPT_MWAIT /* MWAIT causes a #VMEXIT. */
690 | SVM_CTRL_INTERCEPT_XSETBV; /* XSETBV causes a #VMEXIT. */
691
692 /* CR0, CR4 reads must be intercepted, our shadow values are not necessarily the same as the guest's. */
693 pVmcb->ctrl.u16InterceptRdCRx = RT_BIT(0) | RT_BIT(4);
694
695 /* CR0, CR4 writes must be intercepted for the same reasons as above. */
696 pVmcb->ctrl.u16InterceptWrCRx = RT_BIT(0) | RT_BIT(4);
697
698 /* Intercept all DRx reads and writes by default. Changed later on. */
699 pVmcb->ctrl.u16InterceptRdDRx = 0xffff;
700 pVmcb->ctrl.u16InterceptWrDRx = 0xffff;
701
702 /* Virtualize masking of INTR interrupts. (reads/writes from/to CR8 go to the V_TPR register) */
703 pVmcb->ctrl.IntCtrl.n.u1VIntrMasking = 1;
704
705 /* Ignore the priority in the virtual TPR. This is necessary for delivering PIC style (ExtInt) interrupts
706 and we currently deliver both PIC and APIC interrupts alike. See hmR0SvmInjectPendingEvent() */
707 pVmcb->ctrl.IntCtrl.n.u1IgnoreTPR = 1;
708
709 /* Set IO and MSR bitmap permission bitmap physical addresses. */
710 pVmcb->ctrl.u64IOPMPhysAddr = g_HCPhysIOBitmap;
711 pVmcb->ctrl.u64MSRPMPhysAddr = pVCpu->hm.s.svm.HCPhysMsrBitmap;
712
713 /* No LBR virtualization. */
714 pVmcb->ctrl.u64LBRVirt = 0;
715
716 /* Initially set all VMCB clean bits to 0 indicating that everything should be loaded from the VMCB in memory. */
717 pVmcb->ctrl.u64VmcbCleanBits = 0;
718
719 /* The host ASID MBZ, for the guest start with 1. */
720 pVmcb->ctrl.TLBCtrl.n.u32ASID = 1;
721
722 /*
723 * Setup the PAT MSR (applicable for Nested Paging only).
724 * The default value should be 0x0007040600070406ULL, but we want to treat all guest memory as WB,
725 * so choose type 6 for all PAT slots.
726 */
727 pVmcb->guest.u64GPAT = UINT64_C(0x0006060606060606);
728
729 /* Setup Nested Paging. This doesn't change throughout the execution time of the VM. */
730 pVmcb->ctrl.NestedPaging.n.u1NestedPaging = pVM->hm.s.fNestedPaging;
731
732 /* Without Nested Paging, we need additionally intercepts. */
733 if (!pVM->hm.s.fNestedPaging)
734 {
735 /* CR3 reads/writes must be intercepted; our shadow values differ from the guest values. */
736 pVmcb->ctrl.u16InterceptRdCRx |= RT_BIT(3);
737 pVmcb->ctrl.u16InterceptWrCRx |= RT_BIT(3);
738
739 /* Intercept INVLPG and task switches (may change CR3, EFLAGS, LDT). */
740 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_INVLPG
741 | SVM_CTRL_INTERCEPT_TASK_SWITCH;
742
743 /* Page faults must be intercepted to implement shadow paging. */
744 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT(X86_XCPT_PF);
745 }
746
747#ifdef HMSVM_ALWAYS_TRAP_TASK_SWITCH
748 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_TASK_SWITCH;
749#endif
750
751 /* Apply the exceptions intercepts needed by the GIM provider. */
752 if (pVCpu->hm.s.fGIMTrapXcptUD)
753 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT(X86_XCPT_UD);
754
755 /* Setup Pause Filter for guest pause-loop (spinlock) exiting. */
756 if (fUsePauseFilter)
757 {
758 pVmcb->ctrl.u16PauseFilterCount = pVM->hm.s.svm.cPauseFilter;
759 if (fPauseFilterThreshold)
760 pVmcb->ctrl.u16PauseFilterThreshold = pVM->hm.s.svm.cPauseFilterThresholdTicks;
761 }
762
763 /*
764 * The following MSRs are saved/restored automatically during the world-switch.
765 * Don't intercept guest read/write accesses to these MSRs.
766 */
767 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_LSTAR, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
768 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_CSTAR, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
769 hmR0SvmSetMsrPermission(pVCpu, MSR_K6_STAR, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
770 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_SF_MASK, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
771 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_FS_BASE, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
772 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_GS_BASE, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
773 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_KERNEL_GS_BASE, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
774 hmR0SvmSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_CS, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
775 hmR0SvmSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_ESP, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
776 hmR0SvmSetMsrPermission(pVCpu, MSR_IA32_SYSENTER_EIP, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
777 }
778
779 return VINF_SUCCESS;
780}
781
782
783/**
784 * Invalidates a guest page by guest virtual address.
785 *
786 * @returns VBox status code.
787 * @param pVM The cross context VM structure.
788 * @param pVCpu The cross context virtual CPU structure.
789 * @param GCVirt Guest virtual address of the page to invalidate.
790 */
791VMMR0DECL(int) SVMR0InvalidatePage(PVM pVM, PVMCPU pVCpu, RTGCPTR GCVirt)
792{
793 AssertReturn(pVM, VERR_INVALID_PARAMETER);
794 Assert(pVM->hm.s.svm.fSupported);
795
796 bool fFlushPending = pVM->hm.s.svm.fAlwaysFlushTLB || VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_TLB_FLUSH);
797
798 /* Skip it if a TLB flush is already pending. */
799 if (!fFlushPending)
800 {
801 Log4(("SVMR0InvalidatePage %RGv\n", GCVirt));
802
803 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
804 AssertMsgReturn(pVmcb, ("Invalid pVmcb!\n"), VERR_SVM_INVALID_PVMCB);
805
806#if HC_ARCH_BITS == 32
807 /* If we get a flush in 64-bit guest mode, then force a full TLB flush. INVLPGA takes only 32-bit addresses. */
808 if (CPUMIsGuestInLongMode(pVCpu))
809 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
810 else
811#endif
812 {
813 SVMR0InvlpgA(GCVirt, pVmcb->ctrl.TLBCtrl.n.u32ASID);
814 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbInvlpgVirt);
815 }
816 }
817 return VINF_SUCCESS;
818}
819
820
821/**
822 * Flushes the appropriate tagged-TLB entries.
823 *
824 * @param pVCpu The cross context virtual CPU structure.
825 */
826static void hmR0SvmFlushTaggedTlb(PVMCPU pVCpu)
827{
828 PVM pVM = pVCpu->CTX_SUFF(pVM);
829 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
830 PHMGLOBALCPUINFO pCpu = hmR0GetCurrentCpu();
831
832 /*
833 * Force a TLB flush for the first world switch if the current CPU differs from the one we ran on last.
834 * This can happen both for start & resume due to long jumps back to ring-3.
835 * If the TLB flush count changed, another VM (VCPU rather) has hit the ASID limit while flushing the TLB,
836 * so we cannot reuse the ASIDs without flushing.
837 */
838 bool fNewAsid = false;
839 Assert(pCpu->idCpu != NIL_RTCPUID);
840 if ( pVCpu->hm.s.idLastCpu != pCpu->idCpu
841 || pVCpu->hm.s.cTlbFlushes != pCpu->cTlbFlushes)
842 {
843 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbWorldSwitch);
844 pVCpu->hm.s.fForceTLBFlush = true;
845 fNewAsid = true;
846 }
847
848 /* Set TLB flush state as checked until we return from the world switch. */
849 ASMAtomicWriteBool(&pVCpu->hm.s.fCheckedTLBFlush, true);
850
851 /* Check for explicit TLB flushes. */
852 if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_TLB_FLUSH))
853 {
854 pVCpu->hm.s.fForceTLBFlush = true;
855 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlb);
856 }
857
858 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_NOTHING;
859
860 if (pVM->hm.s.svm.fAlwaysFlushTLB)
861 {
862 /*
863 * This is the AMD erratum 170. We need to flush the entire TLB for each world switch. Sad.
864 */
865 pCpu->uCurrentAsid = 1;
866 pVCpu->hm.s.uCurrentAsid = 1;
867 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
868 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_ENTIRE;
869
870 /* Clear the VMCB Clean Bit for NP while flushing the TLB. See @bugref{7152}. */
871 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_NP;
872
873 /* Keep track of last CPU ID even when flushing all the time. */
874 if (fNewAsid)
875 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
876 }
877 else if (pVCpu->hm.s.fForceTLBFlush)
878 {
879 /* Clear the VMCB Clean Bit for NP while flushing the TLB. See @bugref{7152}. */
880 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_NP;
881
882 if (fNewAsid)
883 {
884 ++pCpu->uCurrentAsid;
885 bool fHitASIDLimit = false;
886 if (pCpu->uCurrentAsid >= pVM->hm.s.uMaxAsid)
887 {
888 pCpu->uCurrentAsid = 1; /* Wraparound at 1; host uses 0 */
889 pCpu->cTlbFlushes++; /* All VCPUs that run on this host CPU must use a new VPID. */
890 fHitASIDLimit = true;
891
892 if (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_FLUSH_BY_ASID)
893 {
894 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_SINGLE_CONTEXT;
895 pCpu->fFlushAsidBeforeUse = true;
896 }
897 else
898 {
899 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_ENTIRE;
900 pCpu->fFlushAsidBeforeUse = false;
901 }
902 }
903
904 if ( !fHitASIDLimit
905 && pCpu->fFlushAsidBeforeUse)
906 {
907 if (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_FLUSH_BY_ASID)
908 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_SINGLE_CONTEXT;
909 else
910 {
911 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_ENTIRE;
912 pCpu->fFlushAsidBeforeUse = false;
913 }
914 }
915
916 pVCpu->hm.s.uCurrentAsid = pCpu->uCurrentAsid;
917 pVCpu->hm.s.idLastCpu = pCpu->idCpu;
918 pVCpu->hm.s.cTlbFlushes = pCpu->cTlbFlushes;
919 }
920 else
921 {
922 if (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_FLUSH_BY_ASID)
923 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_SINGLE_CONTEXT;
924 else
925 pVmcb->ctrl.TLBCtrl.n.u8TLBFlush = SVM_TLB_FLUSH_ENTIRE;
926 }
927
928 pVCpu->hm.s.fForceTLBFlush = false;
929 }
930
931 /* Update VMCB with the ASID. */
932 if (pVmcb->ctrl.TLBCtrl.n.u32ASID != pVCpu->hm.s.uCurrentAsid)
933 {
934 pVmcb->ctrl.TLBCtrl.n.u32ASID = pVCpu->hm.s.uCurrentAsid;
935 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_ASID;
936 }
937
938 AssertMsg(pVCpu->hm.s.idLastCpu == pCpu->idCpu,
939 ("vcpu idLastCpu=%u pcpu idCpu=%u\n", pVCpu->hm.s.idLastCpu, pCpu->idCpu));
940 AssertMsg(pVCpu->hm.s.cTlbFlushes == pCpu->cTlbFlushes,
941 ("Flush count mismatch for cpu %u (%u vs %u)\n", pCpu->idCpu, pVCpu->hm.s.cTlbFlushes, pCpu->cTlbFlushes));
942 AssertMsg(pCpu->uCurrentAsid >= 1 && pCpu->uCurrentAsid < pVM->hm.s.uMaxAsid,
943 ("cpu%d uCurrentAsid = %x\n", pCpu->idCpu, pCpu->uCurrentAsid));
944 AssertMsg(pVCpu->hm.s.uCurrentAsid >= 1 && pVCpu->hm.s.uCurrentAsid < pVM->hm.s.uMaxAsid,
945 ("cpu%d VM uCurrentAsid = %x\n", pCpu->idCpu, pVCpu->hm.s.uCurrentAsid));
946
947#ifdef VBOX_WITH_STATISTICS
948 if (pVmcb->ctrl.TLBCtrl.n.u8TLBFlush == SVM_TLB_FLUSH_NOTHING)
949 STAM_COUNTER_INC(&pVCpu->hm.s.StatNoFlushTlbWorldSwitch);
950 else if ( pVmcb->ctrl.TLBCtrl.n.u8TLBFlush == SVM_TLB_FLUSH_SINGLE_CONTEXT
951 || pVmcb->ctrl.TLBCtrl.n.u8TLBFlush == SVM_TLB_FLUSH_SINGLE_CONTEXT_RETAIN_GLOBALS)
952 {
953 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushAsid);
954 }
955 else
956 {
957 Assert(pVmcb->ctrl.TLBCtrl.n.u8TLBFlush == SVM_TLB_FLUSH_ENTIRE);
958 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushEntire);
959 }
960#endif
961}
962
963
964/** @name 64-bit guest on 32-bit host OS helper functions.
965 *
966 * The host CPU is still 64-bit capable but the host OS is running in 32-bit
967 * mode (code segment, paging). These wrappers/helpers perform the necessary
968 * bits for the 32->64 switcher.
969 *
970 * @{ */
971#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS)
972/**
973 * Prepares for and executes VMRUN (64-bit guests on a 32-bit host).
974 *
975 * @returns VBox status code.
976 * @param HCPhysVmcbHost Physical address of host VMCB.
977 * @param HCPhysVmcb Physical address of the VMCB.
978 * @param pCtx Pointer to the guest-CPU context.
979 * @param pVM The cross context VM structure.
980 * @param pVCpu The cross context virtual CPU structure.
981 */
982DECLASM(int) SVMR0VMSwitcherRun64(RTHCPHYS HCPhysVmcbHost, RTHCPHYS HCPhysVmcb, PCPUMCTX pCtx, PVM pVM, PVMCPU pVCpu)
983{
984 uint32_t aParam[8];
985 aParam[0] = (uint32_t)(HCPhysVmcbHost); /* Param 1: HCPhysVmcbHost - Lo. */
986 aParam[1] = (uint32_t)(HCPhysVmcbHost >> 32); /* Param 1: HCPhysVmcbHost - Hi. */
987 aParam[2] = (uint32_t)(HCPhysVmcb); /* Param 2: HCPhysVmcb - Lo. */
988 aParam[3] = (uint32_t)(HCPhysVmcb >> 32); /* Param 2: HCPhysVmcb - Hi. */
989 aParam[4] = VM_RC_ADDR(pVM, pVM);
990 aParam[5] = 0;
991 aParam[6] = VM_RC_ADDR(pVM, pVCpu);
992 aParam[7] = 0;
993
994 return SVMR0Execute64BitsHandler(pVM, pVCpu, pCtx, HM64ON32OP_SVMRCVMRun64, RT_ELEMENTS(aParam), &aParam[0]);
995}
996
997
998/**
999 * Executes the specified VMRUN handler in 64-bit mode.
1000 *
1001 * @returns VBox status code.
1002 * @param pVM The cross context VM structure.
1003 * @param pVCpu The cross context virtual CPU structure.
1004 * @param pCtx Pointer to the guest-CPU context.
1005 * @param enmOp The operation to perform.
1006 * @param cParams Number of parameters.
1007 * @param paParam Array of 32-bit parameters.
1008 */
1009VMMR0DECL(int) SVMR0Execute64BitsHandler(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, HM64ON32OP enmOp,
1010 uint32_t cParams, uint32_t *paParam)
1011{
1012 AssertReturn(pVM->hm.s.pfnHost32ToGuest64R0, VERR_HM_NO_32_TO_64_SWITCHER);
1013 Assert(enmOp > HM64ON32OP_INVALID && enmOp < HM64ON32OP_END);
1014
1015 NOREF(pCtx);
1016
1017 /* Disable interrupts. */
1018 RTHCUINTREG uOldEFlags = ASMIntDisableFlags();
1019
1020#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
1021 RTCPUID idHostCpu = RTMpCpuId();
1022 CPUMR0SetLApic(pVCpu, idHostCpu);
1023#endif
1024
1025 CPUMSetHyperESP(pVCpu, VMMGetStackRC(pVCpu));
1026 CPUMSetHyperEIP(pVCpu, enmOp);
1027 for (int i = (int)cParams - 1; i >= 0; i--)
1028 CPUMPushHyper(pVCpu, paParam[i]);
1029
1030 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatWorldSwitch3264, z);
1031 /* Call the switcher. */
1032 int rc = pVM->hm.s.pfnHost32ToGuest64R0(pVM, RT_OFFSETOF(VM, aCpus[pVCpu->idCpu].cpum) - RT_OFFSETOF(VM, cpum));
1033 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatWorldSwitch3264, z);
1034
1035 /* Restore interrupts. */
1036 ASMSetFlags(uOldEFlags);
1037 return rc;
1038}
1039
1040#endif /* HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS) */
1041/** @} */
1042
1043
1044/**
1045 * Adds an exception to the intercept exception bitmap in the VMCB and updates
1046 * the corresponding VMCB Clean bit.
1047 *
1048 * @param pVmcb Pointer to the VM control block.
1049 * @param u32Xcpt The value of the exception (X86_XCPT_*).
1050 */
1051DECLINLINE(void) hmR0SvmAddXcptIntercept(PSVMVMCB pVmcb, uint32_t u32Xcpt)
1052{
1053 if (!(pVmcb->ctrl.u32InterceptXcpt & RT_BIT(u32Xcpt)))
1054 {
1055 pVmcb->ctrl.u32InterceptXcpt |= RT_BIT(u32Xcpt);
1056 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
1057 }
1058}
1059
1060
1061/**
1062 * Removes an exception from the intercept-exception bitmap in the VMCB and
1063 * updates the corresponding VMCB Clean bit.
1064 *
1065 * @param pVmcb Pointer to the VM control block.
1066 * @param u32Xcpt The value of the exception (X86_XCPT_*).
1067 */
1068DECLINLINE(void) hmR0SvmRemoveXcptIntercept(PSVMVMCB pVmcb, uint32_t u32Xcpt)
1069{
1070 Assert(u32Xcpt != X86_XCPT_DB);
1071 Assert(u32Xcpt != X86_XCPT_AC);
1072#ifndef HMSVM_ALWAYS_TRAP_ALL_XCPTS
1073 if (pVmcb->ctrl.u32InterceptXcpt & RT_BIT(u32Xcpt))
1074 {
1075 pVmcb->ctrl.u32InterceptXcpt &= ~RT_BIT(u32Xcpt);
1076 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
1077 }
1078#endif
1079}
1080
1081
1082/**
1083 * Loads the guest CR0 control register into the guest-state area in the VMCB.
1084 * Although the guest CR0 is a separate field in the VMCB we have to consider
1085 * the FPU state itself which is shared between the host and the guest.
1086 *
1087 * @returns VBox status code.
1088 * @param pVCpu The cross context virtual CPU structure.
1089 * @param pVmcb Pointer to the VM control block.
1090 * @param pCtx Pointer to the guest-CPU context.
1091 *
1092 * @remarks No-long-jump zone!!!
1093 */
1094static void hmR0SvmLoadSharedCR0(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1095{
1096 /*
1097 * Guest CR0.
1098 */
1099 PVM pVM = pVCpu->CTX_SUFF(pVM);
1100 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR0))
1101 {
1102 uint64_t u64GuestCR0 = pCtx->cr0;
1103
1104 /* Always enable caching. */
1105 u64GuestCR0 &= ~(X86_CR0_CD | X86_CR0_NW);
1106
1107 /*
1108 * When Nested Paging is not available use shadow page tables and intercept #PFs (the latter done in SVMR0SetupVM()).
1109 */
1110 if (!pVM->hm.s.fNestedPaging)
1111 {
1112 u64GuestCR0 |= X86_CR0_PG; /* When Nested Paging is not available, use shadow page tables. */
1113 u64GuestCR0 |= X86_CR0_WP; /* Guest CPL 0 writes to its read-only pages should cause a #PF #VMEXIT. */
1114 }
1115
1116 /*
1117 * Guest FPU bits.
1118 */
1119 bool fInterceptNM = false;
1120 bool fInterceptMF = false;
1121 u64GuestCR0 |= X86_CR0_NE; /* Use internal x87 FPU exceptions handling rather than external interrupts. */
1122 if (CPUMIsGuestFPUStateActive(pVCpu))
1123 {
1124 /* Catch floating point exceptions if we need to report them to the guest in a different way. */
1125 if (!(pCtx->cr0 & X86_CR0_NE))
1126 {
1127 Log4(("hmR0SvmLoadGuestControlRegs: Intercepting Guest CR0.MP Old-style FPU handling!!!\n"));
1128 fInterceptMF = true;
1129 }
1130 }
1131 else
1132 {
1133 fInterceptNM = true; /* Guest FPU inactive, #VMEXIT on #NM for lazy FPU loading. */
1134 u64GuestCR0 |= X86_CR0_TS /* Guest can task switch quickly and do lazy FPU syncing. */
1135 | X86_CR0_MP; /* FWAIT/WAIT should not ignore CR0.TS and should generate #NM. */
1136 }
1137
1138 /*
1139 * Update the exception intercept bitmap.
1140 */
1141 if (fInterceptNM)
1142 hmR0SvmAddXcptIntercept(pVmcb, X86_XCPT_NM);
1143 else
1144 hmR0SvmRemoveXcptIntercept(pVmcb, X86_XCPT_NM);
1145
1146 if (fInterceptMF)
1147 hmR0SvmAddXcptIntercept(pVmcb, X86_XCPT_MF);
1148 else
1149 hmR0SvmRemoveXcptIntercept(pVmcb, X86_XCPT_MF);
1150
1151 pVmcb->guest.u64CR0 = u64GuestCR0;
1152 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CRX_EFER;
1153 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_CR0);
1154 }
1155}
1156
1157
1158/**
1159 * Loads the guest control registers (CR2, CR3, CR4) into the VMCB.
1160 *
1161 * @returns VBox status code.
1162 * @param pVCpu The cross context virtual CPU structure.
1163 * @param pVmcb Pointer to the VM control block.
1164 * @param pCtx Pointer to the guest-CPU context.
1165 *
1166 * @remarks No-long-jump zone!!!
1167 */
1168static int hmR0SvmLoadGuestControlRegs(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1169{
1170 PVM pVM = pVCpu->CTX_SUFF(pVM);
1171
1172 /*
1173 * Guest CR2.
1174 */
1175 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR2))
1176 {
1177 pVmcb->guest.u64CR2 = pCtx->cr2;
1178 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CR2;
1179 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_CR2);
1180 }
1181
1182 /*
1183 * Guest CR3.
1184 */
1185 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR3))
1186 {
1187 if (pVM->hm.s.fNestedPaging)
1188 {
1189 PGMMODE enmShwPagingMode;
1190#if HC_ARCH_BITS == 32
1191 if (CPUMIsGuestInLongModeEx(pCtx))
1192 enmShwPagingMode = PGMMODE_AMD64_NX;
1193 else
1194#endif
1195 enmShwPagingMode = PGMGetHostMode(pVM);
1196
1197 pVmcb->ctrl.u64NestedPagingCR3 = PGMGetNestedCR3(pVCpu, enmShwPagingMode);
1198 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_NP;
1199 Assert(pVmcb->ctrl.u64NestedPagingCR3);
1200 pVmcb->guest.u64CR3 = pCtx->cr3;
1201 }
1202 else
1203 pVmcb->guest.u64CR3 = PGMGetHyperCR3(pVCpu);
1204
1205 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CRX_EFER;
1206 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_CR3);
1207 }
1208
1209 /*
1210 * Guest CR4.
1211 * ASSUMES this is done everytime we get in from ring-3! (XCR0)
1212 */
1213 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR4))
1214 {
1215 uint64_t u64GuestCR4 = pCtx->cr4;
1216 if (!pVM->hm.s.fNestedPaging)
1217 {
1218 switch (pVCpu->hm.s.enmShadowMode)
1219 {
1220 case PGMMODE_REAL:
1221 case PGMMODE_PROTECTED: /* Protected mode, no paging. */
1222 AssertFailed();
1223 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
1224
1225 case PGMMODE_32_BIT: /* 32-bit paging. */
1226 u64GuestCR4 &= ~X86_CR4_PAE;
1227 break;
1228
1229 case PGMMODE_PAE: /* PAE paging. */
1230 case PGMMODE_PAE_NX: /* PAE paging with NX enabled. */
1231 /** Must use PAE paging as we could use physical memory > 4 GB */
1232 u64GuestCR4 |= X86_CR4_PAE;
1233 break;
1234
1235 case PGMMODE_AMD64: /* 64-bit AMD paging (long mode). */
1236 case PGMMODE_AMD64_NX: /* 64-bit AMD paging (long mode) with NX enabled. */
1237#ifdef VBOX_ENABLE_64_BITS_GUESTS
1238 break;
1239#else
1240 AssertFailed();
1241 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
1242#endif
1243
1244 default: /* shut up gcc */
1245 AssertFailed();
1246 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
1247 }
1248 }
1249
1250 pVmcb->guest.u64CR4 = u64GuestCR4;
1251 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CRX_EFER;
1252
1253 /* Whether to save/load/restore XCR0 during world switch depends on CR4.OSXSAVE and host+guest XCR0. */
1254 pVCpu->hm.s.fLoadSaveGuestXcr0 = (u64GuestCR4 & X86_CR4_OSXSAVE) && pCtx->aXcr[0] != ASMGetXcr0();
1255
1256 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_CR4);
1257 }
1258
1259 return VINF_SUCCESS;
1260}
1261
1262
1263/**
1264 * Loads the guest segment registers into the VMCB.
1265 *
1266 * @returns VBox status code.
1267 * @param pVCpu The cross context virtual CPU structure.
1268 * @param pVmcb Pointer to the VM control block.
1269 * @param pCtx Pointer to the guest-CPU context.
1270 *
1271 * @remarks No-long-jump zone!!!
1272 */
1273static void hmR0SvmLoadGuestSegmentRegs(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1274{
1275 /* Guest Segment registers: CS, SS, DS, ES, FS, GS. */
1276 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_SEGMENT_REGS))
1277 {
1278 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, CS, cs);
1279 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, SS, ss);
1280 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, DS, ds);
1281 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, ES, es);
1282 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, FS, fs);
1283 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, GS, gs);
1284
1285 pVmcb->guest.u8CPL = pCtx->ss.Attr.n.u2Dpl;
1286 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_SEG;
1287 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_SEGMENT_REGS);
1288 }
1289
1290 /* Guest TR. */
1291 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_TR))
1292 {
1293 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, TR, tr);
1294 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_TR);
1295 }
1296
1297 /* Guest LDTR. */
1298 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_LDTR))
1299 {
1300 HMSVM_SEG_REG_COPY_TO_VMCB(pCtx, &pVmcb->guest, LDTR, ldtr);
1301 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_LDTR);
1302 }
1303
1304 /* Guest GDTR. */
1305 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_GDTR))
1306 {
1307 pVmcb->guest.GDTR.u32Limit = pCtx->gdtr.cbGdt;
1308 pVmcb->guest.GDTR.u64Base = pCtx->gdtr.pGdt;
1309 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DT;
1310 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_GDTR);
1311 }
1312
1313 /* Guest IDTR. */
1314 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_IDTR))
1315 {
1316 pVmcb->guest.IDTR.u32Limit = pCtx->idtr.cbIdt;
1317 pVmcb->guest.IDTR.u64Base = pCtx->idtr.pIdt;
1318 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DT;
1319 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_IDTR);
1320 }
1321}
1322
1323
1324/**
1325 * Loads the guest MSRs into the VMCB.
1326 *
1327 * @param pVCpu The cross context virtual CPU structure.
1328 * @param pVmcb Pointer to the VM control block.
1329 * @param pCtx Pointer to the guest-CPU context.
1330 *
1331 * @remarks No-long-jump zone!!!
1332 */
1333static void hmR0SvmLoadGuestMsrs(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1334{
1335 /* Guest Sysenter MSRs. */
1336 pVmcb->guest.u64SysEnterCS = pCtx->SysEnter.cs;
1337 pVmcb->guest.u64SysEnterEIP = pCtx->SysEnter.eip;
1338 pVmcb->guest.u64SysEnterESP = pCtx->SysEnter.esp;
1339
1340 /*
1341 * Guest EFER MSR.
1342 * AMD-V requires guest EFER.SVME to be set. Weird.
1343 * See AMD spec. 15.5.1 "Basic Operation" | "Canonicalization and Consistency Checks".
1344 */
1345 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_EFER_MSR))
1346 {
1347 pVmcb->guest.u64EFER = pCtx->msrEFER | MSR_K6_EFER_SVME;
1348 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CRX_EFER;
1349 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_EFER_MSR);
1350 }
1351
1352 /* 64-bit MSRs. */
1353 if (CPUMIsGuestInLongModeEx(pCtx))
1354 {
1355 pVmcb->guest.FS.u64Base = pCtx->fs.u64Base;
1356 pVmcb->guest.GS.u64Base = pCtx->gs.u64Base;
1357 }
1358 else
1359 {
1360 /* If the guest isn't in 64-bit mode, clear MSR_K6_LME bit from guest EFER otherwise AMD-V expects amd64 shadow paging. */
1361 if (pCtx->msrEFER & MSR_K6_EFER_LME)
1362 {
1363 pVmcb->guest.u64EFER &= ~MSR_K6_EFER_LME;
1364 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_CRX_EFER;
1365 }
1366 }
1367
1368
1369 /** @todo The following are used in 64-bit only (SYSCALL/SYSRET) but they might
1370 * be writable in 32-bit mode. Clarify with AMD spec. */
1371 pVmcb->guest.u64STAR = pCtx->msrSTAR;
1372 pVmcb->guest.u64LSTAR = pCtx->msrLSTAR;
1373 pVmcb->guest.u64CSTAR = pCtx->msrCSTAR;
1374 pVmcb->guest.u64SFMASK = pCtx->msrSFMASK;
1375 pVmcb->guest.u64KernelGSBase = pCtx->msrKERNELGSBASE;
1376}
1377
1378
1379/**
1380 * Loads the guest state into the VMCB and programs the necessary intercepts
1381 * accordingly.
1382 *
1383 * @param pVCpu The cross context virtual CPU structure.
1384 * @param pVmcb Pointer to the VM control block.
1385 * @param pCtx Pointer to the guest-CPU context.
1386 *
1387 * @remarks No-long-jump zone!!!
1388 * @remarks Requires EFLAGS to be up-to-date in the VMCB!
1389 */
1390static void hmR0SvmLoadSharedDebugState(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1391{
1392 if (!HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_DEBUG))
1393 return;
1394 Assert((pCtx->dr[6] & X86_DR6_RA1_MASK) == X86_DR6_RA1_MASK); Assert((pCtx->dr[6] & X86_DR6_RAZ_MASK) == 0);
1395 Assert((pCtx->dr[7] & X86_DR7_RA1_MASK) == X86_DR7_RA1_MASK); Assert((pCtx->dr[7] & X86_DR7_RAZ_MASK) == 0);
1396
1397 bool fInterceptMovDRx = false;
1398
1399 /*
1400 * Anyone single stepping on the host side? If so, we'll have to use the
1401 * trap flag in the guest EFLAGS since AMD-V doesn't have a trap flag on
1402 * the VMM level like the VT-x implementations does.
1403 */
1404 bool const fStepping = pVCpu->hm.s.fSingleInstruction;
1405 if (fStepping)
1406 {
1407 pVCpu->hm.s.fClearTrapFlag = true;
1408 pVmcb->guest.u64RFlags |= X86_EFL_TF;
1409 fInterceptMovDRx = true; /* Need clean DR6, no guest mess. */
1410 }
1411 else
1412 Assert(!DBGFIsStepping(pVCpu));
1413
1414 if ( fStepping
1415 || (CPUMGetHyperDR7(pVCpu) & X86_DR7_ENABLED_MASK))
1416 {
1417 /*
1418 * Use the combined guest and host DRx values found in the hypervisor
1419 * register set because the debugger has breakpoints active or someone
1420 * is single stepping on the host side.
1421 *
1422 * Note! DBGF expects a clean DR6 state before executing guest code.
1423 */
1424#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
1425 if ( CPUMIsGuestInLongModeEx(pCtx)
1426 && !CPUMIsHyperDebugStateActivePending(pVCpu))
1427 {
1428 CPUMR0LoadHyperDebugState(pVCpu, false /* include DR6 */);
1429 Assert(!CPUMIsGuestDebugStateActivePending(pVCpu));
1430 Assert(CPUMIsHyperDebugStateActivePending(pVCpu));
1431 }
1432 else
1433#endif
1434 if (!CPUMIsHyperDebugStateActive(pVCpu))
1435 {
1436 CPUMR0LoadHyperDebugState(pVCpu, false /* include DR6 */);
1437 Assert(!CPUMIsGuestDebugStateActive(pVCpu));
1438 Assert(CPUMIsHyperDebugStateActive(pVCpu));
1439 }
1440
1441 /* Update DR6 & DR7. (The other DRx values are handled by CPUM one way or the other.) */
1442 if ( pVmcb->guest.u64DR6 != X86_DR6_INIT_VAL
1443 || pVmcb->guest.u64DR7 != CPUMGetHyperDR7(pVCpu))
1444 {
1445 pVmcb->guest.u64DR7 = CPUMGetHyperDR7(pVCpu);
1446 pVmcb->guest.u64DR6 = X86_DR6_INIT_VAL;
1447 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DRX;
1448 pVCpu->hm.s.fUsingHyperDR7 = true;
1449 }
1450
1451 /** @todo If we cared, we could optimize to allow the guest to read registers
1452 * with the same values. */
1453 fInterceptMovDRx = true;
1454 Log5(("hmR0SvmLoadSharedDebugState: Loaded hyper DRx\n"));
1455 }
1456 else
1457 {
1458 /*
1459 * Update DR6, DR7 with the guest values if necessary.
1460 */
1461 if ( pVmcb->guest.u64DR7 != pCtx->dr[7]
1462 || pVmcb->guest.u64DR6 != pCtx->dr[6])
1463 {
1464 pVmcb->guest.u64DR7 = pCtx->dr[7];
1465 pVmcb->guest.u64DR6 = pCtx->dr[6];
1466 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DRX;
1467 pVCpu->hm.s.fUsingHyperDR7 = false;
1468 }
1469
1470 /*
1471 * If the guest has enabled debug registers, we need to load them prior to
1472 * executing guest code so they'll trigger at the right time.
1473 */
1474 if (pCtx->dr[7] & (X86_DR7_ENABLED_MASK | X86_DR7_GD)) /** @todo Why GD? */
1475 {
1476#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
1477 if ( CPUMIsGuestInLongModeEx(pCtx)
1478 && !CPUMIsGuestDebugStateActivePending(pVCpu))
1479 {
1480 CPUMR0LoadGuestDebugState(pVCpu, false /* include DR6 */);
1481 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxArmed);
1482 Assert(!CPUMIsHyperDebugStateActivePending(pVCpu));
1483 Assert(CPUMIsGuestDebugStateActivePending(pVCpu));
1484 }
1485 else
1486#endif
1487 if (!CPUMIsGuestDebugStateActive(pVCpu))
1488 {
1489 CPUMR0LoadGuestDebugState(pVCpu, false /* include DR6 */);
1490 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxArmed);
1491 Assert(!CPUMIsHyperDebugStateActive(pVCpu));
1492 Assert(CPUMIsGuestDebugStateActive(pVCpu));
1493 }
1494 Log5(("hmR0SvmLoadSharedDebugState: Loaded guest DRx\n"));
1495 }
1496 /*
1497 * If no debugging enabled, we'll lazy load DR0-3. We don't need to
1498 * intercept #DB as DR6 is updated in the VMCB.
1499 *
1500 * Note! If we cared and dared, we could skip intercepting \#DB here.
1501 * However, \#DB shouldn't be performance critical, so we'll play safe
1502 * and keep the code similar to the VT-x code and always intercept it.
1503 */
1504#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
1505 else if ( !CPUMIsGuestDebugStateActivePending(pVCpu)
1506 && !CPUMIsGuestDebugStateActive(pVCpu))
1507#else
1508 else if (!CPUMIsGuestDebugStateActive(pVCpu))
1509#endif
1510 {
1511 fInterceptMovDRx = true;
1512 }
1513 }
1514
1515 Assert(pVmcb->ctrl.u32InterceptXcpt & RT_BIT_32(X86_XCPT_DB));
1516 if (fInterceptMovDRx)
1517 {
1518 if ( pVmcb->ctrl.u16InterceptRdDRx != 0xffff
1519 || pVmcb->ctrl.u16InterceptWrDRx != 0xffff)
1520 {
1521 pVmcb->ctrl.u16InterceptRdDRx = 0xffff;
1522 pVmcb->ctrl.u16InterceptWrDRx = 0xffff;
1523 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
1524 }
1525 }
1526 else
1527 {
1528 if ( pVmcb->ctrl.u16InterceptRdDRx
1529 || pVmcb->ctrl.u16InterceptWrDRx)
1530 {
1531 pVmcb->ctrl.u16InterceptRdDRx = 0;
1532 pVmcb->ctrl.u16InterceptWrDRx = 0;
1533 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
1534 }
1535 }
1536
1537 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_DEBUG);
1538}
1539
1540
1541/**
1542 * Loads the guest APIC state (currently just the TPR).
1543 *
1544 * @returns VBox status code.
1545 * @param pVCpu The cross context virtual CPU structure.
1546 * @param pVmcb Pointer to the VM control block.
1547 * @param pCtx Pointer to the guest-CPU context.
1548 */
1549static int hmR0SvmLoadGuestApicState(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1550{
1551 if (!HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE))
1552 return VINF_SUCCESS;
1553
1554 int rc = VINF_SUCCESS;
1555 PVM pVM = pVCpu->CTX_SUFF(pVM);
1556 if ( PDMHasApic(pVM)
1557 && APICIsEnabled(pVCpu))
1558 {
1559 bool fPendingIntr;
1560 uint8_t u8Tpr;
1561 rc = APICGetTpr(pVCpu, &u8Tpr, &fPendingIntr, NULL /* pu8PendingIrq */);
1562 AssertRCReturn(rc, rc);
1563
1564 /* Assume that we need to trap all TPR accesses and thus need not check on
1565 every #VMEXIT if we should update the TPR. */
1566 Assert(pVmcb->ctrl.IntCtrl.n.u1VIntrMasking);
1567 pVCpu->hm.s.svm.fSyncVTpr = false;
1568
1569 /* 32-bit guests uses LSTAR MSR for patching guest code which touches the TPR. */
1570 if (pVM->hm.s.fTPRPatchingActive)
1571 {
1572 pCtx->msrLSTAR = u8Tpr;
1573
1574 /* If there are interrupts pending, intercept LSTAR writes, otherwise don't intercept reads or writes. */
1575 if (fPendingIntr)
1576 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_LSTAR, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_INTERCEPT_WRITE);
1577 else
1578 {
1579 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_LSTAR, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
1580 pVCpu->hm.s.svm.fSyncVTpr = true;
1581 }
1582 }
1583 else
1584 {
1585 /* Bits 3-0 of the VTPR field correspond to bits 7-4 of the TPR (which is the Task-Priority Class). */
1586 pVmcb->ctrl.IntCtrl.n.u8VTPR = (u8Tpr >> 4);
1587
1588 /* If there are interrupts pending, intercept CR8 writes to evaluate ASAP if we can deliver the interrupt to the guest. */
1589 if (fPendingIntr)
1590 pVmcb->ctrl.u16InterceptWrCRx |= RT_BIT(8);
1591 else
1592 {
1593 pVmcb->ctrl.u16InterceptWrCRx &= ~RT_BIT(8);
1594 pVCpu->hm.s.svm.fSyncVTpr = true;
1595 }
1596
1597 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS | HMSVM_VMCB_CLEAN_TPR);
1598 }
1599 }
1600
1601 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
1602 return rc;
1603}
1604
1605
1606/**
1607 * Loads the exception interrupts required for guest execution in the VMCB.
1608 *
1609 * @returns VBox status code.
1610 * @param pVCpu The cross context virtual CPU structure.
1611 * @param pVmcb Pointer to the VM control block.
1612 * @param pCtx Pointer to the guest-CPU context.
1613 */
1614static int hmR0SvmLoadGuestXcptIntercepts(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1615{
1616 NOREF(pCtx);
1617 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_XCPT_INTERCEPTS))
1618 {
1619 /* Trap #UD for GIM provider (e.g. for hypercalls). */
1620 if (pVCpu->hm.s.fGIMTrapXcptUD)
1621 hmR0SvmAddXcptIntercept(pVmcb, X86_XCPT_UD);
1622 else
1623 hmR0SvmRemoveXcptIntercept(pVmcb, X86_XCPT_UD);
1624
1625 /* Trap #BP for INT3 debug breakpoints set by the VM debugger. */
1626 if (pVCpu->CTX_SUFF(pVM)->dbgf.ro.cEnabledInt3Breakpoints)
1627 hmR0SvmAddXcptIntercept(pVmcb, X86_XCPT_BP);
1628 else
1629 hmR0SvmRemoveXcptIntercept(pVmcb, X86_XCPT_BP);
1630
1631 /* The remaining intercepts are handled elsewhere, e.g. in hmR0SvmLoadSharedCR0(). */
1632 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_XCPT_INTERCEPTS);
1633 }
1634 return VINF_SUCCESS;
1635}
1636
1637
1638/**
1639 * Sets up the appropriate function to run guest code.
1640 *
1641 * @returns VBox status code.
1642 * @param pVCpu The cross context virtual CPU structure.
1643 * @param pCtx Pointer to the guest-CPU context.
1644 *
1645 * @remarks No-long-jump zone!!!
1646 */
1647static int hmR0SvmSetupVMRunHandler(PVMCPU pVCpu, PCPUMCTX pCtx)
1648{
1649 if (CPUMIsGuestInLongModeEx(pCtx))
1650 {
1651#ifndef VBOX_ENABLE_64_BITS_GUESTS
1652 return VERR_PGM_UNSUPPORTED_SHADOW_PAGING_MODE;
1653#endif
1654 Assert(pVCpu->CTX_SUFF(pVM)->hm.s.fAllow64BitGuests); /* Guaranteed by hmR3InitFinalizeR0(). */
1655#if HC_ARCH_BITS == 32
1656 /* 32-bit host. We need to switch to 64-bit before running the 64-bit guest. */
1657 pVCpu->hm.s.svm.pfnVMRun = SVMR0VMSwitcherRun64;
1658#else
1659 /* 64-bit host or hybrid host. */
1660 pVCpu->hm.s.svm.pfnVMRun = SVMR0VMRun64;
1661#endif
1662 }
1663 else
1664 {
1665 /* Guest is not in long mode, use the 32-bit handler. */
1666 pVCpu->hm.s.svm.pfnVMRun = SVMR0VMRun;
1667 }
1668 return VINF_SUCCESS;
1669}
1670
1671
1672/**
1673 * Enters the AMD-V session.
1674 *
1675 * @returns VBox status code.
1676 * @param pVM The cross context VM structure.
1677 * @param pVCpu The cross context virtual CPU structure.
1678 * @param pCpu Pointer to the CPU info struct.
1679 */
1680VMMR0DECL(int) SVMR0Enter(PVM pVM, PVMCPU pVCpu, PHMGLOBALCPUINFO pCpu)
1681{
1682 AssertPtr(pVM);
1683 AssertPtr(pVCpu);
1684 Assert(pVM->hm.s.svm.fSupported);
1685 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1686 NOREF(pVM); NOREF(pCpu);
1687
1688 LogFlowFunc(("pVM=%p pVCpu=%p\n", pVM, pVCpu));
1689 Assert(HMCPU_CF_IS_SET(pVCpu, HM_CHANGED_HOST_CONTEXT | HM_CHANGED_HOST_GUEST_SHARED_STATE));
1690
1691 pVCpu->hm.s.fLeaveDone = false;
1692 return VINF_SUCCESS;
1693}
1694
1695
1696/**
1697 * Thread-context callback for AMD-V.
1698 *
1699 * @param enmEvent The thread-context event.
1700 * @param pVCpu The cross context virtual CPU structure.
1701 * @param fGlobalInit Whether global VT-x/AMD-V init. is used.
1702 * @thread EMT(pVCpu)
1703 */
1704VMMR0DECL(void) SVMR0ThreadCtxCallback(RTTHREADCTXEVENT enmEvent, PVMCPU pVCpu, bool fGlobalInit)
1705{
1706 NOREF(fGlobalInit);
1707
1708 switch (enmEvent)
1709 {
1710 case RTTHREADCTXEVENT_OUT:
1711 {
1712 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1713 Assert(VMMR0ThreadCtxHookIsEnabled(pVCpu));
1714 VMCPU_ASSERT_EMT(pVCpu);
1715
1716 /* No longjmps (log-flush, locks) in this fragile context. */
1717 VMMRZCallRing3Disable(pVCpu);
1718
1719 if (!pVCpu->hm.s.fLeaveDone)
1720 {
1721 hmR0SvmLeave(pVCpu);
1722 pVCpu->hm.s.fLeaveDone = true;
1723 }
1724
1725 /* Leave HM context, takes care of local init (term). */
1726 int rc = HMR0LeaveCpu(pVCpu);
1727 AssertRC(rc); NOREF(rc);
1728
1729 /* Restore longjmp state. */
1730 VMMRZCallRing3Enable(pVCpu);
1731 STAM_REL_COUNTER_INC(&pVCpu->hm.s.StatSwitchPreempt);
1732 break;
1733 }
1734
1735 case RTTHREADCTXEVENT_IN:
1736 {
1737 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1738 Assert(VMMR0ThreadCtxHookIsEnabled(pVCpu));
1739 VMCPU_ASSERT_EMT(pVCpu);
1740
1741 /* No longjmps (log-flush, locks) in this fragile context. */
1742 VMMRZCallRing3Disable(pVCpu);
1743
1744 /*
1745 * Initialize the bare minimum state required for HM. This takes care of
1746 * initializing AMD-V if necessary (onlined CPUs, local init etc.)
1747 */
1748 int rc = HMR0EnterCpu(pVCpu);
1749 AssertRC(rc); NOREF(rc);
1750 Assert(HMCPU_CF_IS_SET(pVCpu, HM_CHANGED_HOST_CONTEXT | HM_CHANGED_HOST_GUEST_SHARED_STATE));
1751
1752 pVCpu->hm.s.fLeaveDone = false;
1753
1754 /* Restore longjmp state. */
1755 VMMRZCallRing3Enable(pVCpu);
1756 break;
1757 }
1758
1759 default:
1760 break;
1761 }
1762}
1763
1764
1765/**
1766 * Saves the host state.
1767 *
1768 * @returns VBox status code.
1769 * @param pVM The cross context VM structure.
1770 * @param pVCpu The cross context virtual CPU structure.
1771 *
1772 * @remarks No-long-jump zone!!!
1773 */
1774VMMR0DECL(int) SVMR0SaveHostState(PVM pVM, PVMCPU pVCpu)
1775{
1776 NOREF(pVM);
1777 NOREF(pVCpu);
1778 /* Nothing to do here. AMD-V does this for us automatically during the world-switch. */
1779 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_HOST_CONTEXT);
1780 return VINF_SUCCESS;
1781}
1782
1783
1784/**
1785 * Loads the guest state into the VMCB.
1786 *
1787 * The CPU state will be loaded from these fields on every successful VM-entry.
1788 * Also sets up the appropriate VMRUN function to execute guest code based on
1789 * the guest CPU mode.
1790 *
1791 * @returns VBox status code.
1792 * @param pVM The cross context VM structure.
1793 * @param pVCpu The cross context virtual CPU structure.
1794 * @param pCtx Pointer to the guest-CPU context.
1795 *
1796 * @remarks No-long-jump zone!!!
1797 */
1798static int hmR0SvmLoadGuestState(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
1799{
1800 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
1801 AssertMsgReturn(pVmcb, ("Invalid pVmcb\n"), VERR_SVM_INVALID_PVMCB);
1802
1803 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatLoadGuestState, x);
1804
1805 int rc = hmR0SvmLoadGuestControlRegs(pVCpu, pVmcb, pCtx);
1806 AssertLogRelMsgRCReturn(rc, ("hmR0SvmLoadGuestControlRegs! rc=%Rrc (pVM=%p pVCpu=%p)\n", rc, pVM, pVCpu), rc);
1807
1808 hmR0SvmLoadGuestSegmentRegs(pVCpu, pVmcb, pCtx);
1809 hmR0SvmLoadGuestMsrs(pVCpu, pVmcb, pCtx);
1810
1811 pVmcb->guest.u64RIP = pCtx->rip;
1812 pVmcb->guest.u64RSP = pCtx->rsp;
1813 pVmcb->guest.u64RFlags = pCtx->eflags.u32;
1814 pVmcb->guest.u64RAX = pCtx->rax;
1815
1816 rc = hmR0SvmLoadGuestApicState(pVCpu, pVmcb, pCtx);
1817 AssertLogRelMsgRCReturn(rc, ("hmR0SvmLoadGuestApicState! rc=%Rrc (pVM=%p pVCpu=%p)\n", rc, pVM, pVCpu), rc);
1818
1819 rc = hmR0SvmLoadGuestXcptIntercepts(pVCpu, pVmcb, pCtx);
1820 AssertLogRelMsgRCReturn(rc, ("hmR0SvmLoadGuestXcptIntercepts! rc=%Rrc (pVM=%p pVCpu=%p)\n", rc, pVM, pVCpu), rc);
1821
1822 rc = hmR0SvmSetupVMRunHandler(pVCpu, pCtx);
1823 AssertLogRelMsgRCReturn(rc, ("hmR0SvmSetupVMRunHandler! rc=%Rrc (pVM=%p pVCpu=%p)\n", rc, pVM, pVCpu), rc);
1824
1825 /* Clear any unused and reserved bits. */
1826 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_RIP /* Unused (loaded unconditionally). */
1827 | HM_CHANGED_GUEST_RSP
1828 | HM_CHANGED_GUEST_RFLAGS
1829 | HM_CHANGED_GUEST_SYSENTER_CS_MSR
1830 | HM_CHANGED_GUEST_SYSENTER_EIP_MSR
1831 | HM_CHANGED_GUEST_SYSENTER_ESP_MSR
1832 | HM_CHANGED_GUEST_LAZY_MSRS /* Unused. */
1833 | HM_CHANGED_SVM_RESERVED1 /* Reserved. */
1834 | HM_CHANGED_SVM_RESERVED2
1835 | HM_CHANGED_SVM_RESERVED3
1836 | HM_CHANGED_SVM_RESERVED4);
1837
1838 /* All the guest state bits should be loaded except maybe the host context and/or shared host/guest bits. */
1839 AssertMsg( !HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_ALL_GUEST)
1840 || HMCPU_CF_IS_PENDING_ONLY(pVCpu, HM_CHANGED_HOST_CONTEXT | HM_CHANGED_HOST_GUEST_SHARED_STATE),
1841 ("fContextUseFlags=%#RX32\n", HMCPU_CF_VALUE(pVCpu)));
1842
1843 Log4(("Load: CS:RIP=%04x:%RX64 EFL=%#x SS:RSP=%04x:%RX64\n", pCtx->cs.Sel, pCtx->rip, pCtx->eflags.u, pCtx->ss.Sel, pCtx->rsp));
1844 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatLoadGuestState, x);
1845 return rc;
1846}
1847
1848
1849/**
1850 * Loads the state shared between the host and guest into the
1851 * VMCB.
1852 *
1853 * @param pVCpu The cross context virtual CPU structure.
1854 * @param pVmcb Pointer to the VM control block.
1855 * @param pCtx Pointer to the guest-CPU context.
1856 *
1857 * @remarks No-long-jump zone!!!
1858 */
1859static void hmR0SvmLoadSharedState(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx)
1860{
1861 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
1862 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
1863
1864 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR0))
1865 hmR0SvmLoadSharedCR0(pVCpu, pVmcb, pCtx);
1866
1867 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_DEBUG))
1868 hmR0SvmLoadSharedDebugState(pVCpu, pVmcb, pCtx);
1869
1870 /* Unused on AMD-V. */
1871 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_GUEST_LAZY_MSRS);
1872
1873 AssertMsg(!HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_HOST_GUEST_SHARED_STATE),
1874 ("fContextUseFlags=%#RX32\n", HMCPU_CF_VALUE(pVCpu)));
1875}
1876
1877
1878/**
1879 * Saves the entire guest state from the VMCB into the
1880 * guest-CPU context. Currently there is no residual state left in the CPU that
1881 * is not updated in the VMCB.
1882 *
1883 * @returns VBox status code.
1884 * @param pVCpu The cross context virtual CPU structure.
1885 * @param pMixedCtx Pointer to the guest-CPU context. The data may be
1886 * out-of-sync. Make sure to update the required fields
1887 * before using them.
1888 */
1889static void hmR0SvmSaveGuestState(PVMCPU pVCpu, PCPUMCTX pMixedCtx)
1890{
1891 Assert(VMMRZCallRing3IsEnabled(pVCpu));
1892
1893 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
1894
1895 pMixedCtx->rip = pVmcb->guest.u64RIP;
1896 pMixedCtx->rsp = pVmcb->guest.u64RSP;
1897 pMixedCtx->eflags.u32 = pVmcb->guest.u64RFlags;
1898 pMixedCtx->rax = pVmcb->guest.u64RAX;
1899
1900 /*
1901 * Guest interrupt shadow.
1902 */
1903 if (pVmcb->ctrl.u64IntShadow & SVM_INTERRUPT_SHADOW_ACTIVE)
1904 EMSetInhibitInterruptsPC(pVCpu, pMixedCtx->rip);
1905 else if (VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
1906 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
1907
1908 /*
1909 * Guest Control registers: CR2, CR3 (handled at the end) - accesses to other control registers are always intercepted.
1910 */
1911 pMixedCtx->cr2 = pVmcb->guest.u64CR2;
1912
1913 /*
1914 * Guest MSRs.
1915 */
1916 pMixedCtx->msrSTAR = pVmcb->guest.u64STAR; /* legacy syscall eip, cs & ss */
1917 pMixedCtx->msrLSTAR = pVmcb->guest.u64LSTAR; /* 64-bit mode syscall rip */
1918 pMixedCtx->msrCSTAR = pVmcb->guest.u64CSTAR; /* compatibility mode syscall rip */
1919 pMixedCtx->msrSFMASK = pVmcb->guest.u64SFMASK; /* syscall flag mask */
1920 pMixedCtx->msrKERNELGSBASE = pVmcb->guest.u64KernelGSBase; /* swapgs exchange value */
1921 pMixedCtx->SysEnter.cs = pVmcb->guest.u64SysEnterCS;
1922 pMixedCtx->SysEnter.eip = pVmcb->guest.u64SysEnterEIP;
1923 pMixedCtx->SysEnter.esp = pVmcb->guest.u64SysEnterESP;
1924
1925 /*
1926 * Guest segment registers (includes FS, GS base MSRs for 64-bit guests).
1927 */
1928 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, CS, cs);
1929 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, SS, ss);
1930 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, DS, ds);
1931 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, ES, es);
1932 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, FS, fs);
1933 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, GS, gs);
1934
1935 /*
1936 * Correct the hidden CS granularity bit. Haven't seen it being wrong in any other
1937 * register (yet).
1938 */
1939 /** @todo SELM might need to be fixed as it too should not care about the
1940 * granularity bit. See @bugref{6785}. */
1941 if ( !pMixedCtx->cs.Attr.n.u1Granularity
1942 && pMixedCtx->cs.Attr.n.u1Present
1943 && pMixedCtx->cs.u32Limit > UINT32_C(0xfffff))
1944 {
1945 Assert((pMixedCtx->cs.u32Limit & 0xfff) == 0xfff);
1946 pMixedCtx->cs.Attr.n.u1Granularity = 1;
1947 }
1948
1949#ifdef VBOX_STRICT
1950# define HMSVM_ASSERT_SEG_GRANULARITY(reg) \
1951 AssertMsg( !pMixedCtx->reg.Attr.n.u1Present \
1952 || ( pMixedCtx->reg.Attr.n.u1Granularity \
1953 ? (pMixedCtx->reg.u32Limit & 0xfff) == 0xfff \
1954 : pMixedCtx->reg.u32Limit <= UINT32_C(0xfffff)), \
1955 ("Invalid Segment Attributes Limit=%#RX32 Attr=%#RX32 Base=%#RX64\n", pMixedCtx->reg.u32Limit, \
1956 pMixedCtx->reg.Attr.u, pMixedCtx->reg.u64Base))
1957
1958 HMSVM_ASSERT_SEG_GRANULARITY(cs);
1959 HMSVM_ASSERT_SEG_GRANULARITY(ss);
1960 HMSVM_ASSERT_SEG_GRANULARITY(ds);
1961 HMSVM_ASSERT_SEG_GRANULARITY(es);
1962 HMSVM_ASSERT_SEG_GRANULARITY(fs);
1963 HMSVM_ASSERT_SEG_GRANULARITY(gs);
1964
1965# undef HMSVM_ASSERT_SEL_GRANULARITY
1966#endif
1967
1968 /*
1969 * Sync the hidden SS DPL field. AMD CPUs have a separate CPL field in the VMCB and uses that
1970 * and thus it's possible that when the CPL changes during guest execution that the SS DPL
1971 * isn't updated by AMD-V. Observed on some AMD Fusion CPUs with 64-bit guests.
1972 * See AMD spec. 15.5.1 "Basic operation".
1973 */
1974 Assert(!(pVmcb->guest.u8CPL & ~0x3));
1975 pMixedCtx->ss.Attr.n.u2Dpl = pVmcb->guest.u8CPL & 0x3;
1976
1977 /*
1978 * Guest TR.
1979 * Fixup TR attributes so it's compatible with Intel. Important when saved-states are used
1980 * between Intel and AMD. See @bugref{6208#c39}.
1981 * ASSUME that it's normally correct and that we're in 32-bit or 64-bit mode.
1982 */
1983 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, TR, tr);
1984 if (pMixedCtx->tr.Attr.n.u4Type != X86_SEL_TYPE_SYS_386_TSS_BUSY)
1985 {
1986 if ( pMixedCtx->tr.Attr.n.u4Type == X86_SEL_TYPE_SYS_386_TSS_AVAIL
1987 || CPUMIsGuestInLongModeEx(pMixedCtx))
1988 pMixedCtx->tr.Attr.n.u4Type = X86_SEL_TYPE_SYS_386_TSS_BUSY;
1989 else if (pMixedCtx->tr.Attr.n.u4Type == X86_SEL_TYPE_SYS_286_TSS_AVAIL)
1990 pMixedCtx->tr.Attr.n.u4Type = X86_SEL_TYPE_SYS_286_TSS_BUSY;
1991 }
1992
1993 /*
1994 * Guest Descriptor-Table registers.
1995 */
1996 HMSVM_SEG_REG_COPY_FROM_VMCB(pMixedCtx, &pVmcb->guest, LDTR, ldtr);
1997 pMixedCtx->gdtr.cbGdt = pVmcb->guest.GDTR.u32Limit;
1998 pMixedCtx->gdtr.pGdt = pVmcb->guest.GDTR.u64Base;
1999
2000 pMixedCtx->idtr.cbIdt = pVmcb->guest.IDTR.u32Limit;
2001 pMixedCtx->idtr.pIdt = pVmcb->guest.IDTR.u64Base;
2002
2003 /*
2004 * Guest Debug registers.
2005 */
2006 if (!pVCpu->hm.s.fUsingHyperDR7)
2007 {
2008 pMixedCtx->dr[6] = pVmcb->guest.u64DR6;
2009 pMixedCtx->dr[7] = pVmcb->guest.u64DR7;
2010 }
2011 else
2012 {
2013 Assert(pVmcb->guest.u64DR7 == CPUMGetHyperDR7(pVCpu));
2014 CPUMSetHyperDR6(pVCpu, pVmcb->guest.u64DR6);
2015 }
2016
2017 /*
2018 * With Nested Paging, CR3 changes are not intercepted. Therefore, sync. it now.
2019 * This is done as the very last step of syncing the guest state, as PGMUpdateCR3() may cause longjmp's to ring-3.
2020 */
2021 if ( pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging
2022 && pMixedCtx->cr3 != pVmcb->guest.u64CR3)
2023 {
2024 CPUMSetGuestCR3(pVCpu, pVmcb->guest.u64CR3);
2025 PGMUpdateCR3(pVCpu, pVmcb->guest.u64CR3);
2026 }
2027}
2028
2029
2030/**
2031 * Does the necessary state syncing before returning to ring-3 for any reason
2032 * (longjmp, preemption, voluntary exits to ring-3) from AMD-V.
2033 *
2034 * @param pVCpu The cross context virtual CPU structure.
2035 *
2036 * @remarks No-long-jmp zone!!!
2037 */
2038static void hmR0SvmLeave(PVMCPU pVCpu)
2039{
2040 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
2041 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
2042 Assert(VMMR0IsLogFlushDisabled(pVCpu));
2043
2044 /*
2045 * !!! IMPORTANT !!!
2046 * If you modify code here, make sure to check whether hmR0SvmCallRing3Callback() needs to be updated too.
2047 */
2048
2049 /* Restore host FPU state if necessary and resync on next R0 reentry .*/
2050 if (CPUMR0FpuStateMaybeSaveGuestAndRestoreHost(pVCpu))
2051 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR0);
2052
2053 /*
2054 * Restore host debug registers if necessary and resync on next R0 reentry.
2055 */
2056#ifdef VBOX_STRICT
2057 if (CPUMIsHyperDebugStateActive(pVCpu))
2058 {
2059 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2060 Assert(pVmcb->ctrl.u16InterceptRdDRx == 0xffff);
2061 Assert(pVmcb->ctrl.u16InterceptWrDRx == 0xffff);
2062 }
2063#endif
2064 if (CPUMR0DebugStateMaybeSaveGuestAndRestoreHost(pVCpu, false /* save DR6 */))
2065 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_DEBUG);
2066
2067 Assert(!CPUMIsHyperDebugStateActive(pVCpu));
2068 Assert(!CPUMIsGuestDebugStateActive(pVCpu));
2069
2070 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatEntry);
2071 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatLoadGuestState);
2072 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExit1);
2073 STAM_PROFILE_ADV_SET_STOPPED(&pVCpu->hm.s.StatExit2);
2074 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchLongJmpToR3);
2075
2076 VMCPU_CMPXCHG_STATE(pVCpu, VMCPUSTATE_STARTED_HM, VMCPUSTATE_STARTED_EXEC);
2077}
2078
2079
2080/**
2081 * Leaves the AMD-V session.
2082 *
2083 * @returns VBox status code.
2084 * @param pVCpu The cross context virtual CPU structure.
2085 */
2086static int hmR0SvmLeaveSession(PVMCPU pVCpu)
2087{
2088 HM_DISABLE_PREEMPT();
2089 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
2090 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
2091
2092 /* When thread-context hooks are used, we can avoid doing the leave again if we had been preempted before
2093 and done this from the SVMR0ThreadCtxCallback(). */
2094 if (!pVCpu->hm.s.fLeaveDone)
2095 {
2096 hmR0SvmLeave(pVCpu);
2097 pVCpu->hm.s.fLeaveDone = true;
2098 }
2099
2100 /*
2101 * !!! IMPORTANT !!!
2102 * If you modify code here, make sure to check whether hmR0SvmCallRing3Callback() needs to be updated too.
2103 */
2104
2105 /** @todo eliminate the need for calling VMMR0ThreadCtxHookDisable here! */
2106 /* Deregister hook now that we've left HM context before re-enabling preemption. */
2107 VMMR0ThreadCtxHookDisable(pVCpu);
2108
2109 /* Leave HM context. This takes care of local init (term). */
2110 int rc = HMR0LeaveCpu(pVCpu);
2111
2112 HM_RESTORE_PREEMPT();
2113 return rc;
2114}
2115
2116
2117/**
2118 * Does the necessary state syncing before doing a longjmp to ring-3.
2119 *
2120 * @returns VBox status code.
2121 * @param pVCpu The cross context virtual CPU structure.
2122 *
2123 * @remarks No-long-jmp zone!!!
2124 */
2125static int hmR0SvmLongJmpToRing3(PVMCPU pVCpu)
2126{
2127 return hmR0SvmLeaveSession(pVCpu);
2128}
2129
2130
2131/**
2132 * VMMRZCallRing3() callback wrapper which saves the guest state (or restores
2133 * any remaining host state) before we longjump to ring-3 and possibly get
2134 * preempted.
2135 *
2136 * @param pVCpu The cross context virtual CPU structure.
2137 * @param enmOperation The operation causing the ring-3 longjump.
2138 * @param pvUser The user argument (pointer to the possibly
2139 * out-of-date guest-CPU context).
2140 */
2141static DECLCALLBACK(int) hmR0SvmCallRing3Callback(PVMCPU pVCpu, VMMCALLRING3 enmOperation, void *pvUser)
2142{
2143 RT_NOREF_PV(pvUser);
2144
2145 if (enmOperation == VMMCALLRING3_VM_R0_ASSERTION)
2146 {
2147 /*
2148 * !!! IMPORTANT !!!
2149 * If you modify code here, make sure to check whether hmR0SvmLeave() and hmR0SvmLeaveSession() needs
2150 * to be updated too. This is a stripped down version which gets out ASAP trying to not trigger any assertion.
2151 */
2152 VMMRZCallRing3RemoveNotification(pVCpu);
2153 VMMRZCallRing3Disable(pVCpu);
2154 HM_DISABLE_PREEMPT();
2155
2156 /* Restore host FPU state if necessary and resync on next R0 reentry. */
2157 CPUMR0FpuStateMaybeSaveGuestAndRestoreHost(pVCpu);
2158
2159 /* Restore host debug registers if necessary and resync on next R0 reentry. */
2160 CPUMR0DebugStateMaybeSaveGuestAndRestoreHost(pVCpu, false /* save DR6 */);
2161
2162 /* Deregister the hook now that we've left HM context before re-enabling preemption. */
2163 /** @todo eliminate the need for calling VMMR0ThreadCtxHookDisable here! */
2164 VMMR0ThreadCtxHookDisable(pVCpu);
2165
2166 /* Leave HM context. This takes care of local init (term). */
2167 HMR0LeaveCpu(pVCpu);
2168
2169 HM_RESTORE_PREEMPT();
2170 return VINF_SUCCESS;
2171 }
2172
2173 Assert(pVCpu);
2174 Assert(pvUser);
2175 Assert(VMMRZCallRing3IsEnabled(pVCpu));
2176 HMSVM_ASSERT_PREEMPT_SAFE();
2177
2178 VMMRZCallRing3Disable(pVCpu);
2179 Assert(VMMR0IsLogFlushDisabled(pVCpu));
2180
2181 Log4(("hmR0SvmCallRing3Callback->hmR0SvmLongJmpToRing3\n"));
2182 int rc = hmR0SvmLongJmpToRing3(pVCpu);
2183 AssertRCReturn(rc, rc);
2184
2185 VMMRZCallRing3Enable(pVCpu);
2186 return VINF_SUCCESS;
2187}
2188
2189
2190/**
2191 * Take necessary actions before going back to ring-3.
2192 *
2193 * An action requires us to go back to ring-3. This function does the necessary
2194 * steps before we can safely return to ring-3. This is not the same as longjmps
2195 * to ring-3, this is voluntary.
2196 *
2197 * @param pVM The cross context VM structure.
2198 * @param pVCpu The cross context virtual CPU structure.
2199 * @param pCtx Pointer to the guest-CPU context.
2200 * @param rcExit The reason for exiting to ring-3. Can be
2201 * VINF_VMM_UNKNOWN_RING3_CALL.
2202 */
2203static void hmR0SvmExitToRing3(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, int rcExit)
2204{
2205 Assert(pVM);
2206 Assert(pVCpu);
2207 Assert(pCtx);
2208 HMSVM_ASSERT_PREEMPT_SAFE();
2209
2210 /* Please, no longjumps here (any logging shouldn't flush jump back to ring-3). NO LOGGING BEFORE THIS POINT! */
2211 VMMRZCallRing3Disable(pVCpu);
2212 Log4(("hmR0SvmExitToRing3: rcExit=%d\n", rcExit));
2213
2214 /* We need to do this only while truly exiting the "inner loop" back to ring-3 and -not- for any longjmp to ring3. */
2215 if (pVCpu->hm.s.Event.fPending)
2216 {
2217 hmR0SvmPendingEventToTrpmTrap(pVCpu);
2218 Assert(!pVCpu->hm.s.Event.fPending);
2219 }
2220
2221 /* If we're emulating an instruction, we shouldn't have any TRPM traps pending
2222 and if we're injecting an event we should have a TRPM trap pending. */
2223 AssertMsg(rcExit != VINF_EM_RAW_INJECT_TRPM_EVENT || TRPMHasTrap(pVCpu), ("rcExit=%Rrc\n", rcExit));
2224 AssertMsg(rcExit != VINF_EM_RAW_EMULATE_INSTR || !TRPMHasTrap(pVCpu), ("rcExit=%Rrc\n", rcExit));
2225
2226 /* Sync. the necessary state for going back to ring-3. */
2227 hmR0SvmLeaveSession(pVCpu);
2228 STAM_COUNTER_DEC(&pVCpu->hm.s.StatSwitchLongJmpToR3);
2229
2230 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_TO_R3);
2231 CPUMSetChangedFlags(pVCpu, CPUM_CHANGED_SYSENTER_MSR
2232 | CPUM_CHANGED_LDTR
2233 | CPUM_CHANGED_GDTR
2234 | CPUM_CHANGED_IDTR
2235 | CPUM_CHANGED_TR
2236 | CPUM_CHANGED_HIDDEN_SEL_REGS);
2237 if ( pVM->hm.s.fNestedPaging
2238 && CPUMIsGuestPagingEnabledEx(pCtx))
2239 {
2240 CPUMSetChangedFlags(pVCpu, CPUM_CHANGED_GLOBAL_TLB_FLUSH);
2241 }
2242
2243 /* On our way back from ring-3 reload the guest state if there is a possibility of it being changed. */
2244 if (rcExit != VINF_EM_RAW_INTERRUPT)
2245 HMCPU_CF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
2246
2247 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchExitToR3);
2248
2249 /* We do -not- want any longjmp notifications after this! We must return to ring-3 ASAP. */
2250 VMMRZCallRing3RemoveNotification(pVCpu);
2251 VMMRZCallRing3Enable(pVCpu);
2252}
2253
2254
2255/**
2256 * Updates the use of TSC offsetting mode for the CPU and adjusts the necessary
2257 * intercepts.
2258 *
2259 * @param pVM The cross context VM structure.
2260 * @param pVCpu The cross context virtual CPU structure.
2261 *
2262 * @remarks No-long-jump zone!!!
2263 */
2264static void hmR0SvmUpdateTscOffsetting(PVM pVM, PVMCPU pVCpu)
2265{
2266 bool fParavirtTsc;
2267 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2268 bool fCanUseRealTsc = TMCpuTickCanUseRealTSC(pVM, pVCpu, &pVmcb->ctrl.u64TSCOffset, &fParavirtTsc);
2269 if (fCanUseRealTsc)
2270 {
2271 pVmcb->ctrl.u64InterceptCtrl &= ~SVM_CTRL_INTERCEPT_RDTSC;
2272 pVmcb->ctrl.u64InterceptCtrl &= ~SVM_CTRL_INTERCEPT_RDTSCP;
2273 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscOffset);
2274 }
2275 else
2276 {
2277 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_RDTSC;
2278 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_RDTSCP;
2279 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscIntercept);
2280 }
2281 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
2282
2283 /** @todo later optimize this to be done elsewhere and not before every
2284 * VM-entry. */
2285 if (fParavirtTsc)
2286 {
2287 /* Currently neither Hyper-V nor KVM need to update their paravirt. TSC
2288 information before every VM-entry, hence disable it for performance sake. */
2289#if 0
2290 int rc = GIMR0UpdateParavirtTsc(pVM, 0 /* u64Offset */);
2291 AssertRC(rc);
2292#endif
2293 STAM_COUNTER_INC(&pVCpu->hm.s.StatTscParavirt);
2294 }
2295}
2296
2297
2298/**
2299 * Sets an event as a pending event to be injected into the guest.
2300 *
2301 * @param pVCpu The cross context virtual CPU structure.
2302 * @param pEvent Pointer to the SVM event.
2303 * @param GCPtrFaultAddress The fault-address (CR2) in case it's a
2304 * page-fault.
2305 *
2306 * @remarks Statistics counter assumes this is a guest event being reflected to
2307 * the guest i.e. 'StatInjectPendingReflect' is incremented always.
2308 */
2309DECLINLINE(void) hmR0SvmSetPendingEvent(PVMCPU pVCpu, PSVMEVENT pEvent, RTGCUINTPTR GCPtrFaultAddress)
2310{
2311 Assert(!pVCpu->hm.s.Event.fPending);
2312 Assert(pEvent->n.u1Valid);
2313
2314 pVCpu->hm.s.Event.u64IntInfo = pEvent->u;
2315 pVCpu->hm.s.Event.fPending = true;
2316 pVCpu->hm.s.Event.GCPtrFaultAddress = GCPtrFaultAddress;
2317
2318 Log4(("hmR0SvmSetPendingEvent: u=%#RX64 u8Vector=%#x Type=%#x ErrorCodeValid=%RTbool ErrorCode=%#RX32\n", pEvent->u,
2319 pEvent->n.u8Vector, (uint8_t)pEvent->n.u3Type, !!pEvent->n.u1ErrorCodeValid, pEvent->n.u32ErrorCode));
2320}
2321
2322
2323/**
2324 * Injects an event into the guest upon VMRUN by updating the relevant field
2325 * in the VMCB.
2326 *
2327 * @param pVCpu The cross context virtual CPU structure.
2328 * @param pVmcb Pointer to the guest VM control block.
2329 * @param pCtx Pointer to the guest-CPU context.
2330 * @param pEvent Pointer to the event.
2331 *
2332 * @remarks No-long-jump zone!!!
2333 * @remarks Requires CR0!
2334 */
2335DECLINLINE(void) hmR0SvmInjectEventVmcb(PVMCPU pVCpu, PSVMVMCB pVmcb, PCPUMCTX pCtx, PSVMEVENT pEvent)
2336{
2337 NOREF(pVCpu); NOREF(pCtx);
2338
2339 pVmcb->ctrl.EventInject.u = pEvent->u;
2340 STAM_COUNTER_INC(&pVCpu->hm.s.paStatInjectedIrqsR0[pEvent->n.u8Vector & MASK_INJECT_IRQ_STAT]);
2341
2342 Log4(("hmR0SvmInjectEventVmcb: u=%#RX64 u8Vector=%#x Type=%#x ErrorCodeValid=%RTbool ErrorCode=%#RX32\n", pEvent->u,
2343 pEvent->n.u8Vector, (uint8_t)pEvent->n.u3Type, !!pEvent->n.u1ErrorCodeValid, pEvent->n.u32ErrorCode));
2344}
2345
2346
2347
2348/**
2349 * Converts any TRPM trap into a pending HM event. This is typically used when
2350 * entering from ring-3 (not longjmp returns).
2351 *
2352 * @param pVCpu The cross context virtual CPU structure.
2353 */
2354static void hmR0SvmTrpmTrapToPendingEvent(PVMCPU pVCpu)
2355{
2356 Assert(TRPMHasTrap(pVCpu));
2357 Assert(!pVCpu->hm.s.Event.fPending);
2358
2359 uint8_t uVector;
2360 TRPMEVENT enmTrpmEvent;
2361 RTGCUINT uErrCode;
2362 RTGCUINTPTR GCPtrFaultAddress;
2363 uint8_t cbInstr;
2364
2365 int rc = TRPMQueryTrapAll(pVCpu, &uVector, &enmTrpmEvent, &uErrCode, &GCPtrFaultAddress, &cbInstr);
2366 AssertRC(rc);
2367
2368 SVMEVENT Event;
2369 Event.u = 0;
2370 Event.n.u1Valid = 1;
2371 Event.n.u8Vector = uVector;
2372
2373 /* Refer AMD spec. 15.20 "Event Injection" for the format. */
2374 if (enmTrpmEvent == TRPM_TRAP)
2375 {
2376 Event.n.u3Type = SVM_EVENT_EXCEPTION;
2377 switch (uVector)
2378 {
2379 case X86_XCPT_NMI:
2380 {
2381 Event.n.u3Type = SVM_EVENT_NMI;
2382 break;
2383 }
2384
2385 case X86_XCPT_PF:
2386 case X86_XCPT_DF:
2387 case X86_XCPT_TS:
2388 case X86_XCPT_NP:
2389 case X86_XCPT_SS:
2390 case X86_XCPT_GP:
2391 case X86_XCPT_AC:
2392 {
2393 Event.n.u1ErrorCodeValid = 1;
2394 Event.n.u32ErrorCode = uErrCode;
2395 break;
2396 }
2397 }
2398 }
2399 else if (enmTrpmEvent == TRPM_HARDWARE_INT)
2400 Event.n.u3Type = SVM_EVENT_EXTERNAL_IRQ;
2401 else if (enmTrpmEvent == TRPM_SOFTWARE_INT)
2402 Event.n.u3Type = SVM_EVENT_SOFTWARE_INT;
2403 else
2404 AssertMsgFailed(("Invalid TRPM event type %d\n", enmTrpmEvent));
2405
2406 rc = TRPMResetTrap(pVCpu);
2407 AssertRC(rc);
2408
2409 Log4(("TRPM->HM event: u=%#RX64 u8Vector=%#x uErrorCodeValid=%RTbool uErrorCode=%#RX32\n", Event.u, Event.n.u8Vector,
2410 !!Event.n.u1ErrorCodeValid, Event.n.u32ErrorCode));
2411
2412 hmR0SvmSetPendingEvent(pVCpu, &Event, GCPtrFaultAddress);
2413}
2414
2415
2416/**
2417 * Converts any pending SVM event into a TRPM trap. Typically used when leaving
2418 * AMD-V to execute any instruction.
2419 *
2420 * @param pVCpu The cross context virtual CPU structure.
2421 */
2422static void hmR0SvmPendingEventToTrpmTrap(PVMCPU pVCpu)
2423{
2424 Assert(pVCpu->hm.s.Event.fPending);
2425 Assert(TRPMQueryTrap(pVCpu, NULL /* pu8TrapNo */, NULL /* pEnmType */) == VERR_TRPM_NO_ACTIVE_TRAP);
2426
2427 SVMEVENT Event;
2428 Event.u = pVCpu->hm.s.Event.u64IntInfo;
2429
2430 uint8_t uVector = Event.n.u8Vector;
2431 uint8_t uVectorType = Event.n.u3Type;
2432 TRPMEVENT enmTrapType = hmSvmEventToTrpmEventType(&Event);
2433
2434 Log4(("HM event->TRPM: uVector=%#x enmTrapType=%d\n", uVector, uVectorType));
2435
2436 int rc = TRPMAssertTrap(pVCpu, uVector, enmTrapType);
2437 AssertRC(rc);
2438
2439 if (Event.n.u1ErrorCodeValid)
2440 TRPMSetErrorCode(pVCpu, Event.n.u32ErrorCode);
2441
2442 if ( uVectorType == SVM_EVENT_EXCEPTION
2443 && uVector == X86_XCPT_PF)
2444 {
2445 TRPMSetFaultAddress(pVCpu, pVCpu->hm.s.Event.GCPtrFaultAddress);
2446 Assert(pVCpu->hm.s.Event.GCPtrFaultAddress == CPUMGetGuestCR2(pVCpu));
2447 }
2448 else if (uVectorType == SVM_EVENT_SOFTWARE_INT)
2449 {
2450 AssertMsg( uVectorType == SVM_EVENT_SOFTWARE_INT
2451 || (uVector == X86_XCPT_BP || uVector == X86_XCPT_OF),
2452 ("Invalid vector: uVector=%#x uVectorType=%#x\n", uVector, uVectorType));
2453 TRPMSetInstrLength(pVCpu, pVCpu->hm.s.Event.cbInstr);
2454 }
2455 pVCpu->hm.s.Event.fPending = false;
2456}
2457
2458
2459/**
2460 * Gets the guest's interrupt-shadow.
2461 *
2462 * @returns The guest's interrupt-shadow.
2463 * @param pVCpu The cross context virtual CPU structure.
2464 * @param pCtx Pointer to the guest-CPU context.
2465 *
2466 * @remarks No-long-jump zone!!!
2467 * @remarks Has side-effects with VMCPU_FF_INHIBIT_INTERRUPTS force-flag.
2468 */
2469DECLINLINE(uint32_t) hmR0SvmGetGuestIntrShadow(PVMCPU pVCpu, PCPUMCTX pCtx)
2470{
2471 /*
2472 * Instructions like STI and MOV SS inhibit interrupts till the next instruction completes. Check if we should
2473 * inhibit interrupts or clear any existing interrupt-inhibition.
2474 */
2475 uint32_t uIntrState = 0;
2476 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS))
2477 {
2478 if (pCtx->rip != EMGetInhibitInterruptsPC(pVCpu))
2479 {
2480 /*
2481 * We can clear the inhibit force flag as even if we go back to the recompiler without executing guest code in
2482 * AMD-V, the flag's condition to be cleared is met and thus the cleared state is correct.
2483 */
2484 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS);
2485 }
2486 else
2487 uIntrState = SVM_INTERRUPT_SHADOW_ACTIVE;
2488 }
2489 return uIntrState;
2490}
2491
2492
2493/**
2494 * Sets the virtual interrupt intercept control in the VMCB which
2495 * instructs AMD-V to cause a \#VMEXIT as soon as the guest is in a state to
2496 * receive interrupts.
2497 *
2498 * @param pVmcb Pointer to the VM control block.
2499 */
2500DECLINLINE(void) hmR0SvmSetVirtIntrIntercept(PSVMVMCB pVmcb)
2501{
2502 if (!(pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_VINTR))
2503 {
2504 pVmcb->ctrl.IntCtrl.n.u1VIrqPending = 1; /* A virtual interrupt is pending. */
2505 pVmcb->ctrl.IntCtrl.n.u8VIntrVector = 0; /* Vector not necessary as we #VMEXIT for delivering the interrupt. */
2506 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_VINTR;
2507 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS | HMSVM_VMCB_CLEAN_TPR);
2508
2509 Log4(("Setting VINTR intercept\n"));
2510 }
2511}
2512
2513
2514#if 0
2515/**
2516 * Clears the virtual interrupt intercept control in the VMCB as
2517 * we are figured the guest is unable process any interrupts
2518 * at this point of time.
2519 *
2520 * @param pVmcb Pointer to the VM control block.
2521 */
2522DECLINLINE(void) hmR0SvmClearVirtIntrIntercept(PSVMVMCB pVmcb)
2523{
2524 if (pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_VINTR)
2525 {
2526 pVmcb->ctrl.u64InterceptCtrl &= ~SVM_CTRL_INTERCEPT_VINTR;
2527 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS);
2528 Log4(("Clearing VINTR intercept\n"));
2529 }
2530}
2531#endif
2532
2533
2534/**
2535 * Sets the IRET intercept control in the VMCB which instructs AMD-V to cause a
2536 * \#VMEXIT as soon as a guest starts executing an IRET. This is used to unblock
2537 * virtual NMIs.
2538 *
2539 * @param pVmcb Pointer to the VM control block.
2540 */
2541DECLINLINE(void) hmR0SvmSetIretIntercept(PSVMVMCB pVmcb)
2542{
2543 if (!(pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_IRET))
2544 {
2545 pVmcb->ctrl.u64InterceptCtrl |= SVM_CTRL_INTERCEPT_IRET;
2546 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS);
2547
2548 Log4(("Setting IRET intercept\n"));
2549 }
2550}
2551
2552
2553/**
2554 * Clears the IRET intercept control in the VMCB.
2555 *
2556 * @param pVmcb Pointer to the VM control block.
2557 */
2558DECLINLINE(void) hmR0SvmClearIretIntercept(PSVMVMCB pVmcb)
2559{
2560 if (pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_IRET)
2561 {
2562 pVmcb->ctrl.u64InterceptCtrl &= ~SVM_CTRL_INTERCEPT_IRET;
2563 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS);
2564
2565 Log4(("Clearing IRET intercept\n"));
2566 }
2567}
2568
2569
2570/**
2571 * Evaluates the event to be delivered to the guest and sets it as the pending
2572 * event.
2573 *
2574 * @param pVCpu The cross context virtual CPU structure.
2575 * @param pCtx Pointer to the guest-CPU context.
2576 */
2577static void hmR0SvmEvaluatePendingEvent(PVMCPU pVCpu, PCPUMCTX pCtx)
2578{
2579 Assert(!pVCpu->hm.s.Event.fPending);
2580 Log4Func(("\n"));
2581
2582 bool const fIntShadow = RT_BOOL(hmR0SvmGetGuestIntrShadow(pVCpu, pCtx));
2583 bool const fBlockInt = !(pCtx->eflags.u32 & X86_EFL_IF);
2584 bool const fBlockNmi = VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_BLOCK_NMIS);
2585 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2586
2587 if (VMCPU_FF_TEST_AND_CLEAR(pVCpu, VMCPU_FF_UPDATE_APIC))
2588 APICUpdatePendingInterrupts(pVCpu);
2589
2590 SVMEVENT Event;
2591 Event.u = 0;
2592 /** @todo SMI. SMIs take priority over NMIs. */
2593 if (VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_INTERRUPT_NMI)) /* NMI. NMIs take priority over regular interrupts . */
2594 {
2595 if (fBlockNmi)
2596 hmR0SvmSetIretIntercept(pVmcb);
2597 else if (fIntShadow)
2598 hmR0SvmSetVirtIntrIntercept(pVmcb);
2599 else
2600 {
2601 Log4(("Pending NMI\n"));
2602
2603 Event.n.u1Valid = 1;
2604 Event.n.u8Vector = X86_XCPT_NMI;
2605 Event.n.u3Type = SVM_EVENT_NMI;
2606
2607 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
2608 hmR0SvmSetIretIntercept(pVmcb);
2609 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INTERRUPT_NMI);
2610 }
2611 }
2612 else if ( VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_INTERRUPT_APIC | VMCPU_FF_INTERRUPT_PIC)
2613 && !pVCpu->hm.s.fSingleInstruction)
2614 {
2615 /*
2616 * Check if the guest can receive external interrupts (PIC/APIC). Once PDMGetInterrupt() returns
2617 * a valid interrupt we -must- deliver the interrupt. We can no longer re-request it from the APIC.
2618 */
2619 if ( !fBlockInt
2620 && !fIntShadow)
2621 {
2622 uint8_t u8Interrupt;
2623 int rc = PDMGetInterrupt(pVCpu, &u8Interrupt);
2624 if (RT_SUCCESS(rc))
2625 {
2626 Log4(("Injecting external interrupt u8Interrupt=%#x\n", u8Interrupt));
2627
2628 Event.n.u1Valid = 1;
2629 Event.n.u8Vector = u8Interrupt;
2630 Event.n.u3Type = SVM_EVENT_EXTERNAL_IRQ;
2631
2632 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
2633 }
2634 else if (rc == VERR_APIC_INTR_MASKED_BY_TPR)
2635 {
2636 /*
2637 * AMD-V has no TPR thresholding feature. We just avoid posting the interrupt.
2638 * We just avoid delivering the TPR-masked interrupt here. TPR will be updated
2639 * always via hmR0SvmLoadGuestState() -> hmR0SvmLoadGuestApicState().
2640 */
2641 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchTprMaskedIrq);
2642 }
2643 else
2644 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchGuestIrq);
2645 }
2646 else
2647 hmR0SvmSetVirtIntrIntercept(pVmcb);
2648 }
2649}
2650
2651
2652/**
2653 * Injects any pending events into the guest if the guest is in a state to
2654 * receive them.
2655 *
2656 * @param pVCpu The cross context virtual CPU structure.
2657 * @param pCtx Pointer to the guest-CPU context.
2658 */
2659static void hmR0SvmInjectPendingEvent(PVMCPU pVCpu, PCPUMCTX pCtx)
2660{
2661 Assert(!TRPMHasTrap(pVCpu));
2662 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
2663
2664 bool const fIntShadow = RT_BOOL(hmR0SvmGetGuestIntrShadow(pVCpu, pCtx));
2665 bool const fBlockInt = !(pCtx->eflags.u32 & X86_EFL_IF);
2666 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2667
2668 if (pVCpu->hm.s.Event.fPending) /* First, inject any pending HM events. */
2669 {
2670 SVMEVENT Event;
2671 Event.u = pVCpu->hm.s.Event.u64IntInfo;
2672 Assert(Event.n.u1Valid);
2673#ifdef VBOX_STRICT
2674 if (Event.n.u3Type == SVM_EVENT_EXTERNAL_IRQ)
2675 {
2676 Assert(!fBlockInt);
2677 Assert(!fIntShadow);
2678 }
2679 else if (Event.n.u3Type == SVM_EVENT_NMI)
2680 Assert(!fIntShadow);
2681#endif
2682
2683 Log4(("Injecting pending HM event.\n"));
2684 hmR0SvmInjectEventVmcb(pVCpu, pVmcb, pCtx, &Event);
2685 pVCpu->hm.s.Event.fPending = false;
2686
2687#ifdef VBOX_WITH_STATISTICS
2688 if (Event.n.u3Type == SVM_EVENT_EXTERNAL_IRQ)
2689 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectInterrupt);
2690 else
2691 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectXcpt);
2692#endif
2693 }
2694
2695 /* Update the guest interrupt shadow in the VMCB. */
2696 pVmcb->ctrl.u64IntShadow = !!fIntShadow;
2697 NOREF(fBlockInt);
2698}
2699
2700
2701/**
2702 * Reports world-switch error and dumps some useful debug info.
2703 *
2704 * @param pVM The cross context VM structure.
2705 * @param pVCpu The cross context virtual CPU structure.
2706 * @param rcVMRun The return code from VMRUN (or
2707 * VERR_SVM_INVALID_GUEST_STATE for invalid
2708 * guest-state).
2709 * @param pCtx Pointer to the guest-CPU context.
2710 */
2711static void hmR0SvmReportWorldSwitchError(PVM pVM, PVMCPU pVCpu, int rcVMRun, PCPUMCTX pCtx)
2712{
2713 NOREF(pCtx);
2714 HMSVM_ASSERT_PREEMPT_SAFE();
2715 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2716
2717 if (rcVMRun == VERR_SVM_INVALID_GUEST_STATE)
2718 {
2719 hmR0DumpRegs(pVM, pVCpu, pCtx); NOREF(pVM);
2720#ifdef VBOX_STRICT
2721 Log4(("ctrl.u64VmcbCleanBits %#RX64\n", pVmcb->ctrl.u64VmcbCleanBits));
2722 Log4(("ctrl.u16InterceptRdCRx %#x\n", pVmcb->ctrl.u16InterceptRdCRx));
2723 Log4(("ctrl.u16InterceptWrCRx %#x\n", pVmcb->ctrl.u16InterceptWrCRx));
2724 Log4(("ctrl.u16InterceptRdDRx %#x\n", pVmcb->ctrl.u16InterceptRdDRx));
2725 Log4(("ctrl.u16InterceptWrDRx %#x\n", pVmcb->ctrl.u16InterceptWrDRx));
2726 Log4(("ctrl.u32InterceptXcpt %#x\n", pVmcb->ctrl.u32InterceptXcpt));
2727 Log4(("ctrl.u64InterceptCtrl %#RX64\n", pVmcb->ctrl.u64InterceptCtrl));
2728 Log4(("ctrl.u64IOPMPhysAddr %#RX64\n", pVmcb->ctrl.u64IOPMPhysAddr));
2729 Log4(("ctrl.u64MSRPMPhysAddr %#RX64\n", pVmcb->ctrl.u64MSRPMPhysAddr));
2730 Log4(("ctrl.u64TSCOffset %#RX64\n", pVmcb->ctrl.u64TSCOffset));
2731
2732 Log4(("ctrl.TLBCtrl.u32ASID %#x\n", pVmcb->ctrl.TLBCtrl.n.u32ASID));
2733 Log4(("ctrl.TLBCtrl.u8TLBFlush %#x\n", pVmcb->ctrl.TLBCtrl.n.u8TLBFlush));
2734 Log4(("ctrl.TLBCtrl.u24Reserved %#x\n", pVmcb->ctrl.TLBCtrl.n.u24Reserved));
2735
2736 Log4(("ctrl.IntCtrl.u8VTPR %#x\n", pVmcb->ctrl.IntCtrl.n.u8VTPR));
2737 Log4(("ctrl.IntCtrl.u1VIrqPending %#x\n", pVmcb->ctrl.IntCtrl.n.u1VIrqPending));
2738 Log4(("ctrl.IntCtrl.u7Reserved %#x\n", pVmcb->ctrl.IntCtrl.n.u7Reserved));
2739 Log4(("ctrl.IntCtrl.u4VIntrPrio %#x\n", pVmcb->ctrl.IntCtrl.n.u4VIntrPrio));
2740 Log4(("ctrl.IntCtrl.u1IgnoreTPR %#x\n", pVmcb->ctrl.IntCtrl.n.u1IgnoreTPR));
2741 Log4(("ctrl.IntCtrl.u3Reserved %#x\n", pVmcb->ctrl.IntCtrl.n.u3Reserved));
2742 Log4(("ctrl.IntCtrl.u1VIntrMasking %#x\n", pVmcb->ctrl.IntCtrl.n.u1VIntrMasking));
2743 Log4(("ctrl.IntCtrl.u6Reserved %#x\n", pVmcb->ctrl.IntCtrl.n.u6Reserved));
2744 Log4(("ctrl.IntCtrl.u8VIntrVector %#x\n", pVmcb->ctrl.IntCtrl.n.u8VIntrVector));
2745 Log4(("ctrl.IntCtrl.u24Reserved %#x\n", pVmcb->ctrl.IntCtrl.n.u24Reserved));
2746
2747 Log4(("ctrl.u64IntShadow %#RX64\n", pVmcb->ctrl.u64IntShadow));
2748 Log4(("ctrl.u64ExitCode %#RX64\n", pVmcb->ctrl.u64ExitCode));
2749 Log4(("ctrl.u64ExitInfo1 %#RX64\n", pVmcb->ctrl.u64ExitInfo1));
2750 Log4(("ctrl.u64ExitInfo2 %#RX64\n", pVmcb->ctrl.u64ExitInfo2));
2751 Log4(("ctrl.ExitIntInfo.u8Vector %#x\n", pVmcb->ctrl.ExitIntInfo.n.u8Vector));
2752 Log4(("ctrl.ExitIntInfo.u3Type %#x\n", pVmcb->ctrl.ExitIntInfo.n.u3Type));
2753 Log4(("ctrl.ExitIntInfo.u1ErrorCodeValid %#x\n", pVmcb->ctrl.ExitIntInfo.n.u1ErrorCodeValid));
2754 Log4(("ctrl.ExitIntInfo.u19Reserved %#x\n", pVmcb->ctrl.ExitIntInfo.n.u19Reserved));
2755 Log4(("ctrl.ExitIntInfo.u1Valid %#x\n", pVmcb->ctrl.ExitIntInfo.n.u1Valid));
2756 Log4(("ctrl.ExitIntInfo.u32ErrorCode %#x\n", pVmcb->ctrl.ExitIntInfo.n.u32ErrorCode));
2757 Log4(("ctrl.NestedPaging %#RX64\n", pVmcb->ctrl.NestedPaging.u));
2758 Log4(("ctrl.EventInject.u8Vector %#x\n", pVmcb->ctrl.EventInject.n.u8Vector));
2759 Log4(("ctrl.EventInject.u3Type %#x\n", pVmcb->ctrl.EventInject.n.u3Type));
2760 Log4(("ctrl.EventInject.u1ErrorCodeValid %#x\n", pVmcb->ctrl.EventInject.n.u1ErrorCodeValid));
2761 Log4(("ctrl.EventInject.u19Reserved %#x\n", pVmcb->ctrl.EventInject.n.u19Reserved));
2762 Log4(("ctrl.EventInject.u1Valid %#x\n", pVmcb->ctrl.EventInject.n.u1Valid));
2763 Log4(("ctrl.EventInject.u32ErrorCode %#x\n", pVmcb->ctrl.EventInject.n.u32ErrorCode));
2764
2765 Log4(("ctrl.u64NestedPagingCR3 %#RX64\n", pVmcb->ctrl.u64NestedPagingCR3));
2766 Log4(("ctrl.u64LBRVirt %#RX64\n", pVmcb->ctrl.u64LBRVirt));
2767
2768 Log4(("guest.CS.u16Sel %RTsel\n", pVmcb->guest.CS.u16Sel));
2769 Log4(("guest.CS.u16Attr %#x\n", pVmcb->guest.CS.u16Attr));
2770 Log4(("guest.CS.u32Limit %#RX32\n", pVmcb->guest.CS.u32Limit));
2771 Log4(("guest.CS.u64Base %#RX64\n", pVmcb->guest.CS.u64Base));
2772 Log4(("guest.DS.u16Sel %#RTsel\n", pVmcb->guest.DS.u16Sel));
2773 Log4(("guest.DS.u16Attr %#x\n", pVmcb->guest.DS.u16Attr));
2774 Log4(("guest.DS.u32Limit %#RX32\n", pVmcb->guest.DS.u32Limit));
2775 Log4(("guest.DS.u64Base %#RX64\n", pVmcb->guest.DS.u64Base));
2776 Log4(("guest.ES.u16Sel %RTsel\n", pVmcb->guest.ES.u16Sel));
2777 Log4(("guest.ES.u16Attr %#x\n", pVmcb->guest.ES.u16Attr));
2778 Log4(("guest.ES.u32Limit %#RX32\n", pVmcb->guest.ES.u32Limit));
2779 Log4(("guest.ES.u64Base %#RX64\n", pVmcb->guest.ES.u64Base));
2780 Log4(("guest.FS.u16Sel %RTsel\n", pVmcb->guest.FS.u16Sel));
2781 Log4(("guest.FS.u16Attr %#x\n", pVmcb->guest.FS.u16Attr));
2782 Log4(("guest.FS.u32Limit %#RX32\n", pVmcb->guest.FS.u32Limit));
2783 Log4(("guest.FS.u64Base %#RX64\n", pVmcb->guest.FS.u64Base));
2784 Log4(("guest.GS.u16Sel %RTsel\n", pVmcb->guest.GS.u16Sel));
2785 Log4(("guest.GS.u16Attr %#x\n", pVmcb->guest.GS.u16Attr));
2786 Log4(("guest.GS.u32Limit %#RX32\n", pVmcb->guest.GS.u32Limit));
2787 Log4(("guest.GS.u64Base %#RX64\n", pVmcb->guest.GS.u64Base));
2788
2789 Log4(("guest.GDTR.u32Limit %#RX32\n", pVmcb->guest.GDTR.u32Limit));
2790 Log4(("guest.GDTR.u64Base %#RX64\n", pVmcb->guest.GDTR.u64Base));
2791
2792 Log4(("guest.LDTR.u16Sel %RTsel\n", pVmcb->guest.LDTR.u16Sel));
2793 Log4(("guest.LDTR.u16Attr %#x\n", pVmcb->guest.LDTR.u16Attr));
2794 Log4(("guest.LDTR.u32Limit %#RX32\n", pVmcb->guest.LDTR.u32Limit));
2795 Log4(("guest.LDTR.u64Base %#RX64\n", pVmcb->guest.LDTR.u64Base));
2796
2797 Log4(("guest.IDTR.u32Limit %#RX32\n", pVmcb->guest.IDTR.u32Limit));
2798 Log4(("guest.IDTR.u64Base %#RX64\n", pVmcb->guest.IDTR.u64Base));
2799
2800 Log4(("guest.TR.u16Sel %RTsel\n", pVmcb->guest.TR.u16Sel));
2801 Log4(("guest.TR.u16Attr %#x\n", pVmcb->guest.TR.u16Attr));
2802 Log4(("guest.TR.u32Limit %#RX32\n", pVmcb->guest.TR.u32Limit));
2803 Log4(("guest.TR.u64Base %#RX64\n", pVmcb->guest.TR.u64Base));
2804
2805 Log4(("guest.u8CPL %#x\n", pVmcb->guest.u8CPL));
2806 Log4(("guest.u64CR0 %#RX64\n", pVmcb->guest.u64CR0));
2807 Log4(("guest.u64CR2 %#RX64\n", pVmcb->guest.u64CR2));
2808 Log4(("guest.u64CR3 %#RX64\n", pVmcb->guest.u64CR3));
2809 Log4(("guest.u64CR4 %#RX64\n", pVmcb->guest.u64CR4));
2810 Log4(("guest.u64DR6 %#RX64\n", pVmcb->guest.u64DR6));
2811 Log4(("guest.u64DR7 %#RX64\n", pVmcb->guest.u64DR7));
2812
2813 Log4(("guest.u64RIP %#RX64\n", pVmcb->guest.u64RIP));
2814 Log4(("guest.u64RSP %#RX64\n", pVmcb->guest.u64RSP));
2815 Log4(("guest.u64RAX %#RX64\n", pVmcb->guest.u64RAX));
2816 Log4(("guest.u64RFlags %#RX64\n", pVmcb->guest.u64RFlags));
2817
2818 Log4(("guest.u64SysEnterCS %#RX64\n", pVmcb->guest.u64SysEnterCS));
2819 Log4(("guest.u64SysEnterEIP %#RX64\n", pVmcb->guest.u64SysEnterEIP));
2820 Log4(("guest.u64SysEnterESP %#RX64\n", pVmcb->guest.u64SysEnterESP));
2821
2822 Log4(("guest.u64EFER %#RX64\n", pVmcb->guest.u64EFER));
2823 Log4(("guest.u64STAR %#RX64\n", pVmcb->guest.u64STAR));
2824 Log4(("guest.u64LSTAR %#RX64\n", pVmcb->guest.u64LSTAR));
2825 Log4(("guest.u64CSTAR %#RX64\n", pVmcb->guest.u64CSTAR));
2826 Log4(("guest.u64SFMASK %#RX64\n", pVmcb->guest.u64SFMASK));
2827 Log4(("guest.u64KernelGSBase %#RX64\n", pVmcb->guest.u64KernelGSBase));
2828 Log4(("guest.u64GPAT %#RX64\n", pVmcb->guest.u64GPAT));
2829 Log4(("guest.u64DBGCTL %#RX64\n", pVmcb->guest.u64DBGCTL));
2830 Log4(("guest.u64BR_FROM %#RX64\n", pVmcb->guest.u64BR_FROM));
2831 Log4(("guest.u64BR_TO %#RX64\n", pVmcb->guest.u64BR_TO));
2832 Log4(("guest.u64LASTEXCPFROM %#RX64\n", pVmcb->guest.u64LASTEXCPFROM));
2833 Log4(("guest.u64LASTEXCPTO %#RX64\n", pVmcb->guest.u64LASTEXCPTO));
2834#endif /* VBOX_STRICT */
2835 }
2836 else
2837 Log4(("hmR0SvmReportWorldSwitchError: rcVMRun=%d\n", rcVMRun));
2838
2839 NOREF(pVmcb);
2840}
2841
2842
2843/**
2844 * Check per-VM and per-VCPU force flag actions that require us to go back to
2845 * ring-3 for one reason or another.
2846 *
2847 * @returns VBox status code (information status code included).
2848 * @retval VINF_SUCCESS if we don't have any actions that require going back to
2849 * ring-3.
2850 * @retval VINF_PGM_SYNC_CR3 if we have pending PGM CR3 sync.
2851 * @retval VINF_EM_PENDING_REQUEST if we have pending requests (like hardware
2852 * interrupts)
2853 * @retval VINF_PGM_POOL_FLUSH_PENDING if PGM is doing a pool flush and requires
2854 * all EMTs to be in ring-3.
2855 * @retval VINF_EM_RAW_TO_R3 if there is pending DMA requests.
2856 * @retval VINF_EM_NO_MEMORY PGM is out of memory, we need to return
2857 * to the EM loop.
2858 *
2859 * @param pVM The cross context VM structure.
2860 * @param pVCpu The cross context virtual CPU structure.
2861 * @param pCtx Pointer to the guest-CPU context.
2862 */
2863static int hmR0SvmCheckForceFlags(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
2864{
2865 Assert(VMMRZCallRing3IsEnabled(pVCpu));
2866
2867 /* On AMD-V we don't need to update CR3, PAE PDPES lazily. See hmR0SvmSaveGuestState(). */
2868 Assert(!VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_HM_UPDATE_CR3));
2869 Assert(!VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_HM_UPDATE_PAE_PDPES));
2870
2871 if ( VM_FF_IS_PENDING(pVM, !pVCpu->hm.s.fSingleInstruction
2872 ? VM_FF_HP_R0_PRE_HM_MASK : VM_FF_HP_R0_PRE_HM_STEP_MASK)
2873 || VMCPU_FF_IS_PENDING(pVCpu, !pVCpu->hm.s.fSingleInstruction
2874 ? VMCPU_FF_HP_R0_PRE_HM_MASK : VMCPU_FF_HP_R0_PRE_HM_STEP_MASK) )
2875 {
2876 /* Pending PGM C3 sync. */
2877 if (VMCPU_FF_IS_PENDING(pVCpu,VMCPU_FF_PGM_SYNC_CR3 | VMCPU_FF_PGM_SYNC_CR3_NON_GLOBAL))
2878 {
2879 int rc = PGMSyncCR3(pVCpu, pCtx->cr0, pCtx->cr3, pCtx->cr4, VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_PGM_SYNC_CR3));
2880 if (rc != VINF_SUCCESS)
2881 {
2882 Log4(("hmR0SvmCheckForceFlags: PGMSyncCR3 forcing us back to ring-3. rc=%d\n", rc));
2883 return rc;
2884 }
2885 }
2886
2887 /* Pending HM-to-R3 operations (critsects, timers, EMT rendezvous etc.) */
2888 /* -XXX- what was that about single stepping? */
2889 if ( VM_FF_IS_PENDING(pVM, VM_FF_HM_TO_R3_MASK)
2890 || VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_HM_TO_R3_MASK))
2891 {
2892 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHmToR3FF);
2893 int rc = RT_UNLIKELY(VM_FF_IS_PENDING(pVM, VM_FF_PGM_NO_MEMORY)) ? VINF_EM_NO_MEMORY : VINF_EM_RAW_TO_R3;
2894 Log4(("hmR0SvmCheckForceFlags: HM_TO_R3 forcing us back to ring-3. rc=%d\n", rc));
2895 return rc;
2896 }
2897
2898 /* Pending VM request packets, such as hardware interrupts. */
2899 if ( VM_FF_IS_PENDING(pVM, VM_FF_REQUEST)
2900 || VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_REQUEST))
2901 {
2902 Log4(("hmR0SvmCheckForceFlags: Pending VM request forcing us back to ring-3\n"));
2903 return VINF_EM_PENDING_REQUEST;
2904 }
2905
2906 /* Pending PGM pool flushes. */
2907 if (VM_FF_IS_PENDING(pVM, VM_FF_PGM_POOL_FLUSH_PENDING))
2908 {
2909 Log4(("hmR0SvmCheckForceFlags: PGM pool flush pending forcing us back to ring-3\n"));
2910 return VINF_PGM_POOL_FLUSH_PENDING;
2911 }
2912
2913 /* Pending DMA requests. */
2914 if (VM_FF_IS_PENDING(pVM, VM_FF_PDM_DMA))
2915 {
2916 Log4(("hmR0SvmCheckForceFlags: Pending DMA request forcing us back to ring-3\n"));
2917 return VINF_EM_RAW_TO_R3;
2918 }
2919 }
2920
2921 return VINF_SUCCESS;
2922}
2923
2924
2925/**
2926 * Does the preparations before executing guest code in AMD-V.
2927 *
2928 * This may cause longjmps to ring-3 and may even result in rescheduling to the
2929 * recompiler. We must be cautious what we do here regarding committing
2930 * guest-state information into the VMCB assuming we assuredly execute the guest
2931 * in AMD-V. If we fall back to the recompiler after updating the VMCB and
2932 * clearing the common-state (TRPM/forceflags), we must undo those changes so
2933 * that the recompiler can (and should) use them when it resumes guest
2934 * execution. Otherwise such operations must be done when we can no longer
2935 * exit to ring-3.
2936 *
2937 * @returns VBox status code (informational status codes included).
2938 * @retval VINF_SUCCESS if we can proceed with running the guest.
2939 * @retval VINF_* scheduling changes, we have to go back to ring-3.
2940 *
2941 * @param pVM The cross context VM structure.
2942 * @param pVCpu The cross context virtual CPU structure.
2943 * @param pCtx Pointer to the guest-CPU context.
2944 * @param pSvmTransient Pointer to the SVM transient structure.
2945 */
2946static int hmR0SvmPreRunGuest(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
2947{
2948 HMSVM_ASSERT_PREEMPT_SAFE();
2949
2950 /* Check force flag actions that might require us to go back to ring-3. */
2951 int rc = hmR0SvmCheckForceFlags(pVM, pVCpu, pCtx);
2952 if (rc != VINF_SUCCESS)
2953 return rc;
2954
2955 if (TRPMHasTrap(pVCpu))
2956 hmR0SvmTrpmTrapToPendingEvent(pVCpu);
2957 else if (!pVCpu->hm.s.Event.fPending)
2958 hmR0SvmEvaluatePendingEvent(pVCpu, pCtx);
2959
2960 /*
2961 * On the oldest AMD-V systems, we may not get enough information to reinject an NMI.
2962 * Just do it in software, see @bugref{8411}.
2963 * NB: If we could continue a task switch exit we wouldn't need to do this.
2964 */
2965 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending && (((pVCpu->hm.s.Event.u64IntInfo >> 8) & 7) == SVM_EVENT_NMI)))
2966 if (RT_UNLIKELY(!pVM->hm.s.svm.u32Features))
2967 return VINF_EM_RAW_INJECT_TRPM_EVENT;
2968
2969#ifdef HMSVM_SYNC_FULL_GUEST_STATE
2970 HMCPU_CF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
2971#endif
2972
2973 /* Load the guest bits that are not shared with the host in any way since we can longjmp or get preempted. */
2974 rc = hmR0SvmLoadGuestState(pVM, pVCpu, pCtx);
2975 AssertRCReturn(rc, rc);
2976 STAM_COUNTER_INC(&pVCpu->hm.s.StatLoadFull);
2977
2978 /*
2979 * If we're not intercepting TPR changes in the guest, save the guest TPR before the world-switch
2980 * so we can update it on the way back if the guest changed the TPR.
2981 */
2982 if (pVCpu->hm.s.svm.fSyncVTpr)
2983 {
2984 if (pVM->hm.s.fTPRPatchingActive)
2985 pSvmTransient->u8GuestTpr = pCtx->msrLSTAR;
2986 else
2987 {
2988 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
2989 pSvmTransient->u8GuestTpr = pVmcb->ctrl.IntCtrl.n.u8VTPR;
2990 }
2991 }
2992
2993 /*
2994 * No longjmps to ring-3 from this point on!!!
2995 * Asserts() will still longjmp to ring-3 (but won't return), which is intentional, better than a kernel panic.
2996 * This also disables flushing of the R0-logger instance (if any).
2997 */
2998 VMMRZCallRing3Disable(pVCpu);
2999
3000 /*
3001 * We disable interrupts so that we don't miss any interrupts that would flag preemption (IPI/timers etc.)
3002 * when thread-context hooks aren't used and we've been running with preemption disabled for a while.
3003 *
3004 * We need to check for force-flags that could've possible been altered since we last checked them (e.g.
3005 * by PDMGetInterrupt() leaving the PDM critical section, see @bugref{6398}).
3006 *
3007 * We also check a couple of other force-flags as a last opportunity to get the EMT back to ring-3 before
3008 * executing guest code.
3009 */
3010 pSvmTransient->fEFlags = ASMIntDisableFlags();
3011 if ( VM_FF_IS_PENDING(pVM, VM_FF_EMT_RENDEZVOUS | VM_FF_TM_VIRTUAL_SYNC)
3012 || VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_HM_TO_R3_MASK))
3013 {
3014 ASMSetFlags(pSvmTransient->fEFlags);
3015 VMMRZCallRing3Enable(pVCpu);
3016 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHmToR3FF);
3017 return VINF_EM_RAW_TO_R3;
3018 }
3019 if (RTThreadPreemptIsPending(NIL_RTTHREAD))
3020 {
3021 ASMSetFlags(pSvmTransient->fEFlags);
3022 VMMRZCallRing3Enable(pVCpu);
3023 STAM_COUNTER_INC(&pVCpu->hm.s.StatPendingHostIrq);
3024 return VINF_EM_RAW_INTERRUPT;
3025 }
3026
3027 /*
3028 * If we are injecting an NMI, we must set VMCPU_FF_BLOCK_NMIS only when we are going to execute
3029 * guest code for certain (no exits to ring-3). Otherwise, we could re-read the flag on re-entry into
3030 * AMD-V and conclude that NMI inhibition is active when we have not even delivered the NMI.
3031 *
3032 * With VT-x, this is handled by the Guest interruptibility information VMCS field which will set the
3033 * VMCS field after actually delivering the NMI which we read on VM-exit to determine the state.
3034 */
3035 if (pVCpu->hm.s.Event.fPending)
3036 {
3037 SVMEVENT Event;
3038 Event.u = pVCpu->hm.s.Event.u64IntInfo;
3039 if ( Event.n.u1Valid
3040 && Event.n.u3Type == SVM_EVENT_NMI
3041 && Event.n.u8Vector == X86_XCPT_NMI
3042 && !VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_BLOCK_NMIS))
3043 {
3044 VMCPU_FF_SET(pVCpu, VMCPU_FF_BLOCK_NMIS);
3045 }
3046 }
3047
3048 return VINF_SUCCESS;
3049}
3050
3051
3052/**
3053 * Prepares to run guest code in AMD-V and we've committed to doing so. This
3054 * means there is no backing out to ring-3 or anywhere else at this
3055 * point.
3056 *
3057 * @param pVM The cross context VM structure.
3058 * @param pVCpu The cross context virtual CPU structure.
3059 * @param pCtx Pointer to the guest-CPU context.
3060 * @param pSvmTransient Pointer to the SVM transient structure.
3061 *
3062 * @remarks Called with preemption disabled.
3063 * @remarks No-long-jump zone!!!
3064 */
3065static void hmR0SvmPreRunGuestCommitted(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
3066{
3067 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
3068 Assert(VMMR0IsLogFlushDisabled(pVCpu));
3069 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
3070
3071 VMCPU_ASSERT_STATE(pVCpu, VMCPUSTATE_STARTED_HM);
3072 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_EXEC); /* Indicate the start of guest execution. */
3073
3074 hmR0SvmInjectPendingEvent(pVCpu, pCtx);
3075
3076 if ( pVCpu->hm.s.fPreloadGuestFpu
3077 && !CPUMIsGuestFPUStateActive(pVCpu))
3078 {
3079 CPUMR0LoadGuestFPU(pVM, pVCpu); /* (Ignore rc, no need to set HM_CHANGED_HOST_CONTEXT for SVM.) */
3080 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR0);
3081 }
3082
3083 /* Load the state shared between host and guest (FPU, debug). */
3084 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
3085 if (HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_HOST_GUEST_SHARED_STATE))
3086 hmR0SvmLoadSharedState(pVCpu, pVmcb, pCtx);
3087 HMCPU_CF_CLEAR(pVCpu, HM_CHANGED_HOST_CONTEXT); /* Preemption might set this, nothing to do on AMD-V. */
3088 AssertMsg(!HMCPU_CF_VALUE(pVCpu), ("fContextUseFlags=%#RX32\n", HMCPU_CF_VALUE(pVCpu)));
3089
3090 /* Setup TSC offsetting. */
3091 RTCPUID idCurrentCpu = hmR0GetCurrentCpu()->idCpu;
3092 if ( pSvmTransient->fUpdateTscOffsetting
3093 || idCurrentCpu != pVCpu->hm.s.idLastCpu)
3094 {
3095 hmR0SvmUpdateTscOffsetting(pVM, pVCpu);
3096 pSvmTransient->fUpdateTscOffsetting = false;
3097 }
3098
3099 /* If we've migrating CPUs, mark the VMCB Clean bits as dirty. */
3100 if (idCurrentCpu != pVCpu->hm.s.idLastCpu)
3101 pVmcb->ctrl.u64VmcbCleanBits = 0;
3102
3103 /* Store status of the shared guest-host state at the time of VMRUN. */
3104#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
3105 if (CPUMIsGuestInLongModeEx(pCtx))
3106 {
3107 pSvmTransient->fWasGuestDebugStateActive = CPUMIsGuestDebugStateActivePending(pVCpu);
3108 pSvmTransient->fWasHyperDebugStateActive = CPUMIsHyperDebugStateActivePending(pVCpu);
3109 }
3110 else
3111#endif
3112 {
3113 pSvmTransient->fWasGuestDebugStateActive = CPUMIsGuestDebugStateActive(pVCpu);
3114 pSvmTransient->fWasHyperDebugStateActive = CPUMIsHyperDebugStateActive(pVCpu);
3115 }
3116 pSvmTransient->fWasGuestFPUStateActive = CPUMIsGuestFPUStateActive(pVCpu);
3117
3118 /* Flush the appropriate tagged-TLB entries. */
3119 ASMAtomicWriteBool(&pVCpu->hm.s.fCheckedTLBFlush, true); /* Used for TLB flushing, set this across the world switch. */
3120 hmR0SvmFlushTaggedTlb(pVCpu);
3121 Assert(hmR0GetCurrentCpu()->idCpu == pVCpu->hm.s.idLastCpu);
3122
3123 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatEntry, &pVCpu->hm.s.StatInGC, x);
3124
3125 TMNotifyStartOfExecution(pVCpu); /* Finally, notify TM to resume its clocks as we're about
3126 to start executing. */
3127
3128 /*
3129 * Save the current Host TSC_AUX and write the guest TSC_AUX to the host, so that
3130 * RDTSCPs (that don't cause exits) reads the guest MSR. See @bugref{3324}.
3131 *
3132 * This should be done -after- any RDTSCPs for obtaining the host timestamp (TM, STAM etc).
3133 */
3134 if ( (pVM->hm.s.cpuid.u32AMDFeatureEDX & X86_CPUID_EXT_FEATURE_EDX_RDTSCP)
3135 && !(pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_RDTSCP))
3136 {
3137 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_TSC_AUX, SVMMSREXIT_PASSTHRU_READ, SVMMSREXIT_PASSTHRU_WRITE);
3138 pVCpu->hm.s.u64HostTscAux = ASMRdMsr(MSR_K8_TSC_AUX);
3139 uint64_t u64GuestTscAux = CPUMR0GetGuestTscAux(pVCpu);
3140 if (u64GuestTscAux != pVCpu->hm.s.u64HostTscAux)
3141 ASMWrMsr(MSR_K8_TSC_AUX, u64GuestTscAux);
3142 pSvmTransient->fRestoreTscAuxMsr = true;
3143 }
3144 else
3145 {
3146 hmR0SvmSetMsrPermission(pVCpu, MSR_K8_TSC_AUX, SVMMSREXIT_INTERCEPT_READ, SVMMSREXIT_INTERCEPT_WRITE);
3147 pSvmTransient->fRestoreTscAuxMsr = false;
3148 }
3149
3150 /* If VMCB Clean bits isn't supported by the CPU, simply mark all state-bits as dirty, indicating (re)load-from-VMCB. */
3151 if (!(pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_VMCB_CLEAN))
3152 pVmcb->ctrl.u64VmcbCleanBits = 0;
3153}
3154
3155
3156/**
3157 * Wrapper for running the guest code in AMD-V.
3158 *
3159 * @returns VBox strict status code.
3160 * @param pVM The cross context VM structure.
3161 * @param pVCpu The cross context virtual CPU structure.
3162 * @param pCtx Pointer to the guest-CPU context.
3163 *
3164 * @remarks No-long-jump zone!!!
3165 */
3166DECLINLINE(int) hmR0SvmRunGuest(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
3167{
3168 /*
3169 * 64-bit Windows uses XMM registers in the kernel as the Microsoft compiler expresses floating-point operations
3170 * using SSE instructions. Some XMM registers (XMM6-XMM15) are callee-saved and thus the need for this XMM wrapper.
3171 * Refer MSDN docs. "Configuring Programs for 64-bit / x64 Software Conventions / Register Usage" for details.
3172 */
3173#ifdef VBOX_WITH_KERNEL_USING_XMM
3174 return hmR0SVMRunWrapXMM(pVCpu->hm.s.svm.HCPhysVmcbHost, pVCpu->hm.s.svm.HCPhysVmcb, pCtx, pVM, pVCpu,
3175 pVCpu->hm.s.svm.pfnVMRun);
3176#else
3177 return pVCpu->hm.s.svm.pfnVMRun(pVCpu->hm.s.svm.HCPhysVmcbHost, pVCpu->hm.s.svm.HCPhysVmcb, pCtx, pVM, pVCpu);
3178#endif
3179}
3180
3181
3182/**
3183 * Performs some essential restoration of state after running guest code in
3184 * AMD-V.
3185 *
3186 * @param pVM The cross context VM structure.
3187 * @param pVCpu The cross context virtual CPU structure.
3188 * @param pMixedCtx Pointer to the guest-CPU context. The data maybe
3189 * out-of-sync. Make sure to update the required fields
3190 * before using them.
3191 * @param pSvmTransient Pointer to the SVM transient structure.
3192 * @param rcVMRun Return code of VMRUN.
3193 *
3194 * @remarks Called with interrupts disabled.
3195 * @remarks No-long-jump zone!!! This function will however re-enable longjmps
3196 * unconditionally when it is safe to do so.
3197 */
3198static void hmR0SvmPostRunGuest(PVM pVM, PVMCPU pVCpu, PCPUMCTX pMixedCtx, PSVMTRANSIENT pSvmTransient, int rcVMRun)
3199{
3200 Assert(!VMMRZCallRing3IsEnabled(pVCpu));
3201
3202 ASMAtomicWriteBool(&pVCpu->hm.s.fCheckedTLBFlush, false); /* See HMInvalidatePageOnAllVCpus(): used for TLB flushing. */
3203 ASMAtomicIncU32(&pVCpu->hm.s.cWorldSwitchExits); /* Initialized in vmR3CreateUVM(): used for EMT poking. */
3204
3205 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
3206 pVmcb->ctrl.u64VmcbCleanBits = HMSVM_VMCB_CLEAN_ALL; /* Mark the VMCB-state cache as unmodified by VMM. */
3207
3208 /* TSC read must be done early for maximum accuracy. */
3209 if (!(pVmcb->ctrl.u64InterceptCtrl & SVM_CTRL_INTERCEPT_RDTSC))
3210 TMCpuTickSetLastSeen(pVCpu, ASMReadTSC() + pVmcb->ctrl.u64TSCOffset);
3211
3212 if (pSvmTransient->fRestoreTscAuxMsr)
3213 {
3214 uint64_t u64GuestTscAuxMsr = ASMRdMsr(MSR_K8_TSC_AUX);
3215 CPUMR0SetGuestTscAux(pVCpu, u64GuestTscAuxMsr);
3216 if (u64GuestTscAuxMsr != pVCpu->hm.s.u64HostTscAux)
3217 ASMWrMsr(MSR_K8_TSC_AUX, pVCpu->hm.s.u64HostTscAux);
3218 }
3219
3220 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatInGC, &pVCpu->hm.s.StatExit1, x);
3221 TMNotifyEndOfExecution(pVCpu); /* Notify TM that the guest is no longer running. */
3222 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_HM);
3223
3224 Assert(!(ASMGetFlags() & X86_EFL_IF));
3225 ASMSetFlags(pSvmTransient->fEFlags); /* Enable interrupts. */
3226 VMMRZCallRing3Enable(pVCpu); /* It is now safe to do longjmps to ring-3!!! */
3227
3228 /* If VMRUN failed, we can bail out early. This does -not- cover SVM_EXIT_INVALID. */
3229 if (RT_UNLIKELY(rcVMRun != VINF_SUCCESS))
3230 {
3231 Log4(("VMRUN failure: rcVMRun=%Rrc\n", rcVMRun));
3232 return;
3233 }
3234
3235 pSvmTransient->u64ExitCode = pVmcb->ctrl.u64ExitCode; /* Save the #VMEXIT reason. */
3236 HMCPU_EXIT_HISTORY_ADD(pVCpu, pVmcb->ctrl.u64ExitCode); /* Update the #VMEXIT history array. */
3237 pSvmTransient->fVectoringDoublePF = false; /* Vectoring double page-fault needs to be determined later. */
3238 pSvmTransient->fVectoringPF = false; /* Vectoring page-fault needs to be determined later. */
3239
3240 hmR0SvmSaveGuestState(pVCpu, pMixedCtx); /* Save the guest state from the VMCB to the guest-CPU context. */
3241
3242 if (RT_LIKELY(pSvmTransient->u64ExitCode != SVM_EXIT_INVALID))
3243 {
3244 if (pVCpu->hm.s.svm.fSyncVTpr)
3245 {
3246 /* TPR patching (for 32-bit guests) uses LSTAR MSR for holding the TPR value, otherwise uses the VTPR. */
3247 if ( pVM->hm.s.fTPRPatchingActive
3248 && (pMixedCtx->msrLSTAR & 0xff) != pSvmTransient->u8GuestTpr)
3249 {
3250 int rc = APICSetTpr(pVCpu, pMixedCtx->msrLSTAR & 0xff);
3251 AssertRC(rc);
3252 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
3253 }
3254 else if (pSvmTransient->u8GuestTpr != pVmcb->ctrl.IntCtrl.n.u8VTPR)
3255 {
3256 int rc = APICSetTpr(pVCpu, pVmcb->ctrl.IntCtrl.n.u8VTPR << 4);
3257 AssertRC(rc);
3258 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
3259 }
3260 }
3261 }
3262}
3263
3264
3265/**
3266 * Runs the guest code using AMD-V.
3267 *
3268 * @returns VBox status code.
3269 * @param pVM The cross context VM structure.
3270 * @param pVCpu The cross context virtual CPU structure.
3271 * @param pCtx Pointer to the guest-CPU context.
3272 */
3273static int hmR0SvmRunGuestCodeNormal(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
3274{
3275 SVMTRANSIENT SvmTransient;
3276 SvmTransient.fUpdateTscOffsetting = true;
3277 uint32_t cLoops = 0;
3278 int rc = VERR_INTERNAL_ERROR_5;
3279
3280 for (;; cLoops++)
3281 {
3282 Assert(!HMR0SuspendPending());
3283 HMSVM_ASSERT_CPU_SAFE();
3284
3285 /* Preparatory work for running guest code, this may force us to return
3286 to ring-3. This bugger disables interrupts on VINF_SUCCESS! */
3287 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatEntry, x);
3288 rc = hmR0SvmPreRunGuest(pVM, pVCpu, pCtx, &SvmTransient);
3289 if (rc != VINF_SUCCESS)
3290 break;
3291
3292 /*
3293 * No longjmps to ring-3 from this point on!!!
3294 * Asserts() will still longjmp to ring-3 (but won't return), which is intentional, better than a kernel panic.
3295 * This also disables flushing of the R0-logger instance (if any).
3296 */
3297 hmR0SvmPreRunGuestCommitted(pVM, pVCpu, pCtx, &SvmTransient);
3298 rc = hmR0SvmRunGuest(pVM, pVCpu, pCtx);
3299
3300 /* Restore any residual host-state and save any bits shared between host
3301 and guest into the guest-CPU state. Re-enables interrupts! */
3302 hmR0SvmPostRunGuest(pVM, pVCpu, pCtx, &SvmTransient, rc);
3303
3304 if (RT_UNLIKELY( rc != VINF_SUCCESS /* Check for VMRUN errors. */
3305 || SvmTransient.u64ExitCode == SVM_EXIT_INVALID)) /* Check for invalid guest-state errors. */
3306 {
3307 if (rc == VINF_SUCCESS)
3308 rc = VERR_SVM_INVALID_GUEST_STATE;
3309 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExit1, x);
3310 hmR0SvmReportWorldSwitchError(pVM, pVCpu, rc, pCtx);
3311 break;
3312 }
3313
3314 /* Handle the #VMEXIT. */
3315 HMSVM_EXITCODE_STAM_COUNTER_INC(SvmTransient.u64ExitCode);
3316 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatExit1, &pVCpu->hm.s.StatExit2, x);
3317 VBOXVMM_R0_HMSVM_VMEXIT(pVCpu, pCtx, SvmTransient.u64ExitCode, (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb);
3318 rc = hmR0SvmHandleExit(pVCpu, pCtx, &SvmTransient);
3319 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExit2, x);
3320 if (rc != VINF_SUCCESS)
3321 break;
3322 if (cLoops > pVM->hm.s.cMaxResumeLoops)
3323 {
3324 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchMaxResumeLoops);
3325 rc = VINF_EM_RAW_INTERRUPT;
3326 break;
3327 }
3328 }
3329
3330 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatEntry, x);
3331 return rc;
3332}
3333
3334
3335/**
3336 * Runs the guest code using AMD-V in single step mode.
3337 *
3338 * @returns VBox status code.
3339 * @param pVM The cross context VM structure.
3340 * @param pVCpu The cross context virtual CPU structure.
3341 * @param pCtx Pointer to the guest-CPU context.
3342 */
3343static int hmR0SvmRunGuestCodeStep(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
3344{
3345 SVMTRANSIENT SvmTransient;
3346 SvmTransient.fUpdateTscOffsetting = true;
3347 uint32_t cLoops = 0;
3348 int rc = VERR_INTERNAL_ERROR_5;
3349 uint16_t uCsStart = pCtx->cs.Sel;
3350 uint64_t uRipStart = pCtx->rip;
3351
3352 for (;; cLoops++)
3353 {
3354 Assert(!HMR0SuspendPending());
3355 AssertMsg(pVCpu->hm.s.idEnteredCpu == RTMpCpuId(),
3356 ("Illegal migration! Entered on CPU %u Current %u cLoops=%u\n", (unsigned)pVCpu->hm.s.idEnteredCpu,
3357 (unsigned)RTMpCpuId(), cLoops));
3358
3359 /* Preparatory work for running guest code, this may force us to return
3360 to ring-3. This bugger disables interrupts on VINF_SUCCESS! */
3361 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatEntry, x);
3362 rc = hmR0SvmPreRunGuest(pVM, pVCpu, pCtx, &SvmTransient);
3363 if (rc != VINF_SUCCESS)
3364 break;
3365
3366 /*
3367 * No longjmps to ring-3 from this point on!!!
3368 * Asserts() will still longjmp to ring-3 (but won't return), which is intentional, better than a kernel panic.
3369 * This also disables flushing of the R0-logger instance (if any).
3370 */
3371 VMMRZCallRing3Disable(pVCpu);
3372 VMMRZCallRing3RemoveNotification(pVCpu);
3373 hmR0SvmPreRunGuestCommitted(pVM, pVCpu, pCtx, &SvmTransient);
3374
3375 rc = hmR0SvmRunGuest(pVM, pVCpu, pCtx);
3376
3377 /*
3378 * Restore any residual host-state and save any bits shared between host and guest into the guest-CPU state.
3379 * This will also re-enable longjmps to ring-3 when it has reached a safe point!!!
3380 */
3381 hmR0SvmPostRunGuest(pVM, pVCpu, pCtx, &SvmTransient, rc);
3382 if (RT_UNLIKELY( rc != VINF_SUCCESS /* Check for VMRUN errors. */
3383 || SvmTransient.u64ExitCode == SVM_EXIT_INVALID)) /* Check for invalid guest-state errors. */
3384 {
3385 if (rc == VINF_SUCCESS)
3386 rc = VERR_SVM_INVALID_GUEST_STATE;
3387 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExit1, x);
3388 hmR0SvmReportWorldSwitchError(pVM, pVCpu, rc, pCtx);
3389 return rc;
3390 }
3391
3392 /* Handle the #VMEXIT. */
3393 HMSVM_EXITCODE_STAM_COUNTER_INC(SvmTransient.u64ExitCode);
3394 STAM_PROFILE_ADV_STOP_START(&pVCpu->hm.s.StatExit1, &pVCpu->hm.s.StatExit2, x);
3395 VBOXVMM_R0_HMSVM_VMEXIT(pVCpu, pCtx, SvmTransient.u64ExitCode, (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb);
3396 rc = hmR0SvmHandleExit(pVCpu, pCtx, &SvmTransient);
3397 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatExit2, x);
3398 if (rc != VINF_SUCCESS)
3399 break;
3400 if (cLoops > pVM->hm.s.cMaxResumeLoops)
3401 {
3402 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchMaxResumeLoops);
3403 rc = VINF_EM_RAW_INTERRUPT;
3404 break;
3405 }
3406
3407 /*
3408 * Did the RIP change, if so, consider it a single step.
3409 * Otherwise, make sure one of the TFs gets set.
3410 */
3411 if ( pCtx->rip != uRipStart
3412 || pCtx->cs.Sel != uCsStart)
3413 {
3414 rc = VINF_EM_DBG_STEPPED;
3415 break;
3416 }
3417 pVCpu->hm.s.fContextUseFlags |= HM_CHANGED_GUEST_DEBUG;
3418 }
3419
3420 /*
3421 * Clear the X86_EFL_TF if necessary.
3422 */
3423 if (pVCpu->hm.s.fClearTrapFlag)
3424 {
3425 pVCpu->hm.s.fClearTrapFlag = false;
3426 pCtx->eflags.Bits.u1TF = 0;
3427 }
3428
3429 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatEntry, x);
3430 return rc;
3431}
3432
3433
3434/**
3435 * Runs the guest code using AMD-V.
3436 *
3437 * @returns Strict VBox status code.
3438 * @param pVM The cross context VM structure.
3439 * @param pVCpu The cross context virtual CPU structure.
3440 * @param pCtx Pointer to the guest-CPU context.
3441 */
3442VMMR0DECL(VBOXSTRICTRC) SVMR0RunGuestCode(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
3443{
3444 Assert(VMMRZCallRing3IsEnabled(pVCpu));
3445 HMSVM_ASSERT_PREEMPT_SAFE();
3446 VMMRZCallRing3SetNotification(pVCpu, hmR0SvmCallRing3Callback, pCtx);
3447
3448 int rc;
3449 if (!pVCpu->hm.s.fSingleInstruction)
3450 rc = hmR0SvmRunGuestCodeNormal(pVM, pVCpu, pCtx);
3451 else
3452 rc = hmR0SvmRunGuestCodeStep(pVM, pVCpu, pCtx);
3453
3454 if (rc == VERR_EM_INTERPRETER)
3455 rc = VINF_EM_RAW_EMULATE_INSTR;
3456 else if (rc == VINF_EM_RESET)
3457 rc = VINF_EM_TRIPLE_FAULT;
3458
3459 /* Prepare to return to ring-3. This will remove longjmp notifications. */
3460 hmR0SvmExitToRing3(pVM, pVCpu, pCtx, rc);
3461 Assert(!VMMRZCallRing3IsNotificationSet(pVCpu));
3462 return rc;
3463}
3464
3465
3466/**
3467 * Handles a \#VMEXIT (for all EXITCODE values except SVM_EXIT_INVALID).
3468 *
3469 * @returns VBox status code (informational status codes included).
3470 * @param pVCpu The cross context virtual CPU structure.
3471 * @param pCtx Pointer to the guest-CPU context.
3472 * @param pSvmTransient Pointer to the SVM transient structure.
3473 */
3474DECLINLINE(int) hmR0SvmHandleExit(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
3475{
3476 Assert(pSvmTransient->u64ExitCode != SVM_EXIT_INVALID);
3477 Assert(pSvmTransient->u64ExitCode <= SVM_EXIT_MAX);
3478
3479 /*
3480 * The ordering of the case labels is based on most-frequently-occurring #VMEXITs for most guests under
3481 * normal workloads (for some definition of "normal").
3482 */
3483 uint32_t u32ExitCode = pSvmTransient->u64ExitCode;
3484 switch (pSvmTransient->u64ExitCode)
3485 {
3486 case SVM_EXIT_NPF:
3487 return hmR0SvmExitNestedPF(pVCpu, pCtx, pSvmTransient);
3488
3489 case SVM_EXIT_IOIO:
3490 return hmR0SvmExitIOInstr(pVCpu, pCtx, pSvmTransient);
3491
3492 case SVM_EXIT_RDTSC:
3493 return hmR0SvmExitRdtsc(pVCpu, pCtx, pSvmTransient);
3494
3495 case SVM_EXIT_RDTSCP:
3496 return hmR0SvmExitRdtscp(pVCpu, pCtx, pSvmTransient);
3497
3498 case SVM_EXIT_CPUID:
3499 return hmR0SvmExitCpuid(pVCpu, pCtx, pSvmTransient);
3500
3501 case SVM_EXIT_EXCEPTION_14: /* X86_XCPT_PF */
3502 return hmR0SvmExitXcptPF(pVCpu, pCtx, pSvmTransient);
3503
3504 case SVM_EXIT_EXCEPTION_7: /* X86_XCPT_NM */
3505 return hmR0SvmExitXcptNM(pVCpu, pCtx, pSvmTransient);
3506
3507 case SVM_EXIT_EXCEPTION_6: /* X86_XCPT_UD */
3508 return hmR0SvmExitXcptUD(pVCpu, pCtx, pSvmTransient);
3509
3510 case SVM_EXIT_EXCEPTION_16: /* X86_XCPT_MF */
3511 return hmR0SvmExitXcptMF(pVCpu, pCtx, pSvmTransient);
3512
3513 case SVM_EXIT_EXCEPTION_1: /* X86_XCPT_DB */
3514 return hmR0SvmExitXcptDB(pVCpu, pCtx, pSvmTransient);
3515
3516 case SVM_EXIT_EXCEPTION_17: /* X86_XCPT_AC */
3517 return hmR0SvmExitXcptAC(pVCpu, pCtx, pSvmTransient);
3518
3519 case SVM_EXIT_EXCEPTION_3: /* X86_XCPT_BP */
3520 return hmR0SvmExitXcptBP(pVCpu, pCtx, pSvmTransient);
3521
3522 case SVM_EXIT_MONITOR:
3523 return hmR0SvmExitMonitor(pVCpu, pCtx, pSvmTransient);
3524
3525 case SVM_EXIT_MWAIT:
3526 return hmR0SvmExitMwait(pVCpu, pCtx, pSvmTransient);
3527
3528 case SVM_EXIT_HLT:
3529 return hmR0SvmExitHlt(pVCpu, pCtx, pSvmTransient);
3530
3531 case SVM_EXIT_READ_CR0:
3532 case SVM_EXIT_READ_CR3:
3533 case SVM_EXIT_READ_CR4:
3534 return hmR0SvmExitReadCRx(pVCpu, pCtx, pSvmTransient);
3535
3536 case SVM_EXIT_WRITE_CR0:
3537 case SVM_EXIT_WRITE_CR3:
3538 case SVM_EXIT_WRITE_CR4:
3539 case SVM_EXIT_WRITE_CR8:
3540 return hmR0SvmExitWriteCRx(pVCpu, pCtx, pSvmTransient);
3541
3542 case SVM_EXIT_PAUSE:
3543 return hmR0SvmExitPause(pVCpu, pCtx, pSvmTransient);
3544
3545 case SVM_EXIT_VMMCALL:
3546 return hmR0SvmExitVmmCall(pVCpu, pCtx, pSvmTransient);
3547
3548 case SVM_EXIT_VINTR:
3549 return hmR0SvmExitVIntr(pVCpu, pCtx, pSvmTransient);
3550
3551 case SVM_EXIT_INTR:
3552 case SVM_EXIT_FERR_FREEZE:
3553 case SVM_EXIT_NMI:
3554 return hmR0SvmExitIntr(pVCpu, pCtx, pSvmTransient);
3555
3556 case SVM_EXIT_MSR:
3557 return hmR0SvmExitMsr(pVCpu, pCtx, pSvmTransient);
3558
3559 case SVM_EXIT_INVLPG:
3560 return hmR0SvmExitInvlpg(pVCpu, pCtx, pSvmTransient);
3561
3562 case SVM_EXIT_WBINVD:
3563 return hmR0SvmExitWbinvd(pVCpu, pCtx, pSvmTransient);
3564
3565 case SVM_EXIT_INVD:
3566 return hmR0SvmExitInvd(pVCpu, pCtx, pSvmTransient);
3567
3568 case SVM_EXIT_RDPMC:
3569 return hmR0SvmExitRdpmc(pVCpu, pCtx, pSvmTransient);
3570
3571 default:
3572 {
3573 switch (pSvmTransient->u64ExitCode)
3574 {
3575 case SVM_EXIT_READ_DR0: case SVM_EXIT_READ_DR1: case SVM_EXIT_READ_DR2: case SVM_EXIT_READ_DR3:
3576 case SVM_EXIT_READ_DR6: case SVM_EXIT_READ_DR7: case SVM_EXIT_READ_DR8: case SVM_EXIT_READ_DR9:
3577 case SVM_EXIT_READ_DR10: case SVM_EXIT_READ_DR11: case SVM_EXIT_READ_DR12: case SVM_EXIT_READ_DR13:
3578 case SVM_EXIT_READ_DR14: case SVM_EXIT_READ_DR15:
3579 return hmR0SvmExitReadDRx(pVCpu, pCtx, pSvmTransient);
3580
3581 case SVM_EXIT_WRITE_DR0: case SVM_EXIT_WRITE_DR1: case SVM_EXIT_WRITE_DR2: case SVM_EXIT_WRITE_DR3:
3582 case SVM_EXIT_WRITE_DR6: case SVM_EXIT_WRITE_DR7: case SVM_EXIT_WRITE_DR8: case SVM_EXIT_WRITE_DR9:
3583 case SVM_EXIT_WRITE_DR10: case SVM_EXIT_WRITE_DR11: case SVM_EXIT_WRITE_DR12: case SVM_EXIT_WRITE_DR13:
3584 case SVM_EXIT_WRITE_DR14: case SVM_EXIT_WRITE_DR15:
3585 return hmR0SvmExitWriteDRx(pVCpu, pCtx, pSvmTransient);
3586
3587 case SVM_EXIT_XSETBV:
3588 return hmR0SvmExitXsetbv(pVCpu, pCtx, pSvmTransient);
3589
3590 case SVM_EXIT_TASK_SWITCH:
3591 return hmR0SvmExitTaskSwitch(pVCpu, pCtx, pSvmTransient);
3592
3593 case SVM_EXIT_IRET:
3594 return hmR0SvmExitIret(pVCpu, pCtx, pSvmTransient);
3595
3596 case SVM_EXIT_SHUTDOWN:
3597 return hmR0SvmExitShutdown(pVCpu, pCtx, pSvmTransient);
3598
3599 case SVM_EXIT_SMI:
3600 case SVM_EXIT_INIT:
3601 {
3602 /*
3603 * We don't intercept NMIs. As for INIT signals, it really shouldn't ever happen here. If it ever does,
3604 * we want to know about it so log the exit code and bail.
3605 */
3606 AssertMsgFailed(("hmR0SvmHandleExit: Unexpected exit %#RX32\n", (uint32_t)pSvmTransient->u64ExitCode));
3607 pVCpu->hm.s.u32HMError = (uint32_t)pSvmTransient->u64ExitCode;
3608 return VERR_SVM_UNEXPECTED_EXIT;
3609 }
3610
3611#ifdef VBOX_WITH_NESTED_HWVIRT
3612 case SVM_EXIT_CLGI: return hmR0SvmExitClgi(pVCpu, pCtx, pSvmTransient);
3613 case SVM_EXIT_STGI: return hmR0SvmExitStgi(pVCpu, pCtx, pSvmTransient);
3614 case SVM_EXIT_VMLOAD: return hmR0SvmExitVmload(pVCpu, pCtx, pSvmTransient);
3615 case SVM_EXIT_VMSAVE: return hmR0SvmExitVmsave(pVCpu, pCtx, pSvmTransient);
3616 case SVM_EXIT_INVLPGA: return hmR0SvmExitInvlpga(pVCpu, pCtx, pSvmTransient);
3617#else
3618 case SVM_EXIT_CLGI:
3619 case SVM_EXIT_STGI:
3620 case SVM_EXIT_VMLOAD:
3621 case SVM_EXIT_VMSAVE:
3622 case SVM_EXIT_INVLPGA:
3623#endif
3624 case SVM_EXIT_RSM:
3625 case SVM_EXIT_VMRUN:
3626 case SVM_EXIT_SKINIT:
3627 return hmR0SvmExitSetPendingXcptUD(pVCpu, pCtx, pSvmTransient);
3628
3629#ifdef HMSVM_ALWAYS_TRAP_ALL_XCPTS
3630 case SVM_EXIT_EXCEPTION_0: /* X86_XCPT_DE */
3631 /* SVM_EXIT_EXCEPTION_1: */ /* X86_XCPT_DB - Handled above. */
3632 case SVM_EXIT_EXCEPTION_2: /* X86_XCPT_NMI */
3633 /* SVM_EXIT_EXCEPTION_3: */ /* X86_XCPT_BP - Handled above. */
3634 case SVM_EXIT_EXCEPTION_4: /* X86_XCPT_OF */
3635 case SVM_EXIT_EXCEPTION_5: /* X86_XCPT_BR */
3636 /* SVM_EXIT_EXCEPTION_6: */ /* X86_XCPT_UD - Handled above. */
3637 /* SVM_EXIT_EXCEPTION_7: */ /* X86_XCPT_NM - Handled above. */
3638 case SVM_EXIT_EXCEPTION_8: /* X86_XCPT_DF */
3639 case SVM_EXIT_EXCEPTION_9: /* X86_XCPT_CO_SEG_OVERRUN */
3640 case SVM_EXIT_EXCEPTION_10: /* X86_XCPT_TS */
3641 case SVM_EXIT_EXCEPTION_11: /* X86_XCPT_NP */
3642 case SVM_EXIT_EXCEPTION_12: /* X86_XCPT_SS */
3643 case SVM_EXIT_EXCEPTION_13: /* X86_XCPT_GP */
3644 /* SVM_EXIT_EXCEPTION_14: */ /* X86_XCPT_PF - Handled above. */
3645 case SVM_EXIT_EXCEPTION_15: /* Reserved. */
3646 /* SVM_EXIT_EXCEPTION_16: */ /* X86_XCPT_MF - Handled above. */
3647 /* SVM_EXIT_EXCEPTION_17: */ /* X86_XCPT_AC - Handled above. */
3648 case SVM_EXIT_EXCEPTION_18: /* X86_XCPT_MC */
3649 case SVM_EXIT_EXCEPTION_19: /* X86_XCPT_XF */
3650 case SVM_EXIT_EXCEPTION_20: case SVM_EXIT_EXCEPTION_21: case SVM_EXIT_EXCEPTION_22:
3651 case SVM_EXIT_EXCEPTION_23: case SVM_EXIT_EXCEPTION_24: case SVM_EXIT_EXCEPTION_25:
3652 case SVM_EXIT_EXCEPTION_26: case SVM_EXIT_EXCEPTION_27: case SVM_EXIT_EXCEPTION_28:
3653 case SVM_EXIT_EXCEPTION_29: case SVM_EXIT_EXCEPTION_30: case SVM_EXIT_EXCEPTION_31:
3654 {
3655 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
3656 SVMEVENT Event;
3657 Event.u = 0;
3658 Event.n.u1Valid = 1;
3659 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3660 Event.n.u8Vector = pSvmTransient->u64ExitCode - SVM_EXIT_EXCEPTION_0;
3661
3662 switch (Event.n.u8Vector)
3663 {
3664 case X86_XCPT_DE:
3665 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestDE);
3666 break;
3667
3668 case X86_XCPT_NP:
3669 Event.n.u1ErrorCodeValid = 1;
3670 Event.n.u32ErrorCode = pVmcb->ctrl.u64ExitInfo1;
3671 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestNP);
3672 break;
3673
3674 case X86_XCPT_SS:
3675 Event.n.u1ErrorCodeValid = 1;
3676 Event.n.u32ErrorCode = pVmcb->ctrl.u64ExitInfo1;
3677 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestSS);
3678 break;
3679
3680 case X86_XCPT_GP:
3681 Event.n.u1ErrorCodeValid = 1;
3682 Event.n.u32ErrorCode = pVmcb->ctrl.u64ExitInfo1;
3683 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestGP);
3684 break;
3685
3686 default:
3687 AssertMsgFailed(("hmR0SvmHandleExit: Unexpected exit caused by exception %#x\n", Event.n.u8Vector));
3688 pVCpu->hm.s.u32HMError = Event.n.u8Vector;
3689 return VERR_SVM_UNEXPECTED_XCPT_EXIT;
3690 }
3691
3692 Log4(("#Xcpt: Vector=%#x at CS:RIP=%04x:%RGv\n", Event.n.u8Vector, pCtx->cs.Sel, (RTGCPTR)pCtx->rip));
3693 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3694 return VINF_SUCCESS;
3695 }
3696#endif /* HMSVM_ALWAYS_TRAP_ALL_XCPTS */
3697
3698 default:
3699 {
3700 AssertMsgFailed(("hmR0SvmHandleExit: Unknown exit code %#x\n", u32ExitCode));
3701 pVCpu->hm.s.u32HMError = u32ExitCode;
3702 return VERR_SVM_UNKNOWN_EXIT;
3703 }
3704 }
3705 }
3706 }
3707 /* not reached */
3708}
3709
3710
3711#ifdef DEBUG
3712/* Is there some generic IPRT define for this that are not in Runtime/internal/\* ?? */
3713# define HMSVM_ASSERT_PREEMPT_CPUID_VAR() \
3714 RTCPUID const idAssertCpu = RTThreadPreemptIsEnabled(NIL_RTTHREAD) ? NIL_RTCPUID : RTMpCpuId()
3715
3716# define HMSVM_ASSERT_PREEMPT_CPUID() \
3717 do \
3718 { \
3719 RTCPUID const idAssertCpuNow = RTThreadPreemptIsEnabled(NIL_RTTHREAD) ? NIL_RTCPUID : RTMpCpuId(); \
3720 AssertMsg(idAssertCpu == idAssertCpuNow, ("SVM %#x, %#x\n", idAssertCpu, idAssertCpuNow)); \
3721 } while (0)
3722
3723# define HMSVM_VALIDATE_EXIT_HANDLER_PARAMS() \
3724 do { \
3725 AssertPtr(pVCpu); \
3726 AssertPtr(pCtx); \
3727 AssertPtr(pSvmTransient); \
3728 Assert(ASMIntAreEnabled()); \
3729 HMSVM_ASSERT_PREEMPT_SAFE(); \
3730 HMSVM_ASSERT_PREEMPT_CPUID_VAR(); \
3731 Log4Func(("vcpu[%u] -v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-v-\n", (uint32_t)pVCpu->idCpu)); \
3732 HMSVM_ASSERT_PREEMPT_SAFE(); \
3733 if (VMMR0IsLogFlushDisabled(pVCpu)) \
3734 HMSVM_ASSERT_PREEMPT_CPUID(); \
3735 } while (0)
3736#else /* Release builds */
3737# define HMSVM_VALIDATE_EXIT_HANDLER_PARAMS() do { NOREF(pVCpu); NOREF(pCtx); NOREF(pSvmTransient); } while (0)
3738#endif
3739
3740
3741/**
3742 * Worker for hmR0SvmInterpretInvlpg().
3743 *
3744 * @return VBox status code.
3745 * @param pVCpu The cross context virtual CPU structure.
3746 * @param pCpu Pointer to the disassembler state.
3747 * @param pCtx The guest CPU context.
3748 */
3749static int hmR0SvmInterpretInvlPgEx(PVMCPU pVCpu, PDISCPUSTATE pCpu, PCPUMCTX pCtx)
3750{
3751 DISQPVPARAMVAL Param1;
3752 RTGCPTR GCPtrPage;
3753
3754 int rc = DISQueryParamVal(CPUMCTX2CORE(pCtx), pCpu, &pCpu->Param1, &Param1, DISQPVWHICH_SRC);
3755 if (RT_FAILURE(rc))
3756 return VERR_EM_INTERPRETER;
3757
3758 if ( Param1.type == DISQPV_TYPE_IMMEDIATE
3759 || Param1.type == DISQPV_TYPE_ADDRESS)
3760 {
3761 if (!(Param1.flags & (DISQPV_FLAG_32 | DISQPV_FLAG_64)))
3762 return VERR_EM_INTERPRETER;
3763
3764 GCPtrPage = Param1.val.val64;
3765 VBOXSTRICTRC rc2 = EMInterpretInvlpg(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx), GCPtrPage);
3766 rc = VBOXSTRICTRC_VAL(rc2);
3767 }
3768 else
3769 {
3770 Log4(("hmR0SvmInterpretInvlPgEx invalid parameter type %#x\n", Param1.type));
3771 rc = VERR_EM_INTERPRETER;
3772 }
3773
3774 return rc;
3775}
3776
3777
3778/**
3779 * Interprets INVLPG.
3780 *
3781 * @returns VBox status code.
3782 * @retval VINF_* Scheduling instructions.
3783 * @retval VERR_EM_INTERPRETER Something we can't cope with.
3784 * @retval VERR_* Fatal errors.
3785 *
3786 * @param pVM The cross context VM structure.
3787 * @param pVCpu The cross context virtual CPU structure.
3788 * @param pCtx The guest CPU context.
3789 *
3790 * @remarks Updates the RIP if the instruction was executed successfully.
3791 */
3792static int hmR0SvmInterpretInvlpg(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
3793{
3794 /* Only allow 32 & 64 bit code. */
3795 if (CPUMGetGuestCodeBits(pVCpu) != 16)
3796 {
3797 PDISSTATE pDis = &pVCpu->hm.s.DisState;
3798 int rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, NULL /* pcbInstr */);
3799 if ( RT_SUCCESS(rc)
3800 && pDis->pCurInstr->uOpcode == OP_INVLPG)
3801 {
3802 rc = hmR0SvmInterpretInvlPgEx(pVCpu, pDis, pCtx);
3803 if (RT_SUCCESS(rc))
3804 pCtx->rip += pDis->cbInstr;
3805 return rc;
3806 }
3807 else
3808 Log4(("hmR0SvmInterpretInvlpg: EMInterpretDisasCurrent returned %Rrc uOpCode=%#x\n", rc, pDis->pCurInstr->uOpcode));
3809 }
3810 return VERR_EM_INTERPRETER;
3811}
3812
3813
3814/**
3815 * Sets an invalid-opcode (\#UD) exception as pending-for-injection into the VM.
3816 *
3817 * @param pVCpu The cross context virtual CPU structure.
3818 */
3819DECLINLINE(void) hmR0SvmSetPendingXcptUD(PVMCPU pVCpu)
3820{
3821 SVMEVENT Event;
3822 Event.u = 0;
3823 Event.n.u1Valid = 1;
3824 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3825 Event.n.u8Vector = X86_XCPT_UD;
3826 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3827}
3828
3829
3830/**
3831 * Sets a debug (\#DB) exception as pending-for-injection into the VM.
3832 *
3833 * @param pVCpu The cross context virtual CPU structure.
3834 */
3835DECLINLINE(void) hmR0SvmSetPendingXcptDB(PVMCPU pVCpu)
3836{
3837 SVMEVENT Event;
3838 Event.u = 0;
3839 Event.n.u1Valid = 1;
3840 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3841 Event.n.u8Vector = X86_XCPT_DB;
3842 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3843}
3844
3845
3846/**
3847 * Sets a page fault (\#PF) exception as pending-for-injection into the VM.
3848 *
3849 * @param pVCpu The cross context virtual CPU structure.
3850 * @param pCtx Pointer to the guest-CPU context.
3851 * @param u32ErrCode The error-code for the page-fault.
3852 * @param uFaultAddress The page fault address (CR2).
3853 *
3854 * @remarks This updates the guest CR2 with @a uFaultAddress!
3855 */
3856DECLINLINE(void) hmR0SvmSetPendingXcptPF(PVMCPU pVCpu, PCPUMCTX pCtx, uint32_t u32ErrCode, RTGCUINTPTR uFaultAddress)
3857{
3858 SVMEVENT Event;
3859 Event.u = 0;
3860 Event.n.u1Valid = 1;
3861 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3862 Event.n.u8Vector = X86_XCPT_PF;
3863 Event.n.u1ErrorCodeValid = 1;
3864 Event.n.u32ErrorCode = u32ErrCode;
3865
3866 /* Update CR2 of the guest. */
3867 if (pCtx->cr2 != uFaultAddress)
3868 {
3869 pCtx->cr2 = uFaultAddress;
3870 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR2);
3871 }
3872
3873 hmR0SvmSetPendingEvent(pVCpu, &Event, uFaultAddress);
3874}
3875
3876
3877/**
3878 * Sets a device-not-available (\#NM) exception as pending-for-injection into
3879 * the VM.
3880 *
3881 * @param pVCpu The cross context virtual CPU structure.
3882 */
3883DECLINLINE(void) hmR0SvmSetPendingXcptNM(PVMCPU pVCpu)
3884{
3885 SVMEVENT Event;
3886 Event.u = 0;
3887 Event.n.u1Valid = 1;
3888 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3889 Event.n.u8Vector = X86_XCPT_NM;
3890 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3891}
3892
3893
3894/**
3895 * Sets a math-fault (\#MF) exception as pending-for-injection into the VM.
3896 *
3897 * @param pVCpu The cross context virtual CPU structure.
3898 */
3899DECLINLINE(void) hmR0SvmSetPendingXcptMF(PVMCPU pVCpu)
3900{
3901 SVMEVENT Event;
3902 Event.u = 0;
3903 Event.n.u1Valid = 1;
3904 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3905 Event.n.u8Vector = X86_XCPT_MF;
3906 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3907}
3908
3909
3910/**
3911 * Sets a double fault (\#DF) exception as pending-for-injection into the VM.
3912 *
3913 * @param pVCpu The cross context virtual CPU structure.
3914 */
3915DECLINLINE(void) hmR0SvmSetPendingXcptDF(PVMCPU pVCpu)
3916{
3917 SVMEVENT Event;
3918 Event.u = 0;
3919 Event.n.u1Valid = 1;
3920 Event.n.u3Type = SVM_EVENT_EXCEPTION;
3921 Event.n.u8Vector = X86_XCPT_DF;
3922 Event.n.u1ErrorCodeValid = 1;
3923 Event.n.u32ErrorCode = 0;
3924 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
3925}
3926
3927
3928/**
3929 * Determines if an exception is a contributory exception.
3930 *
3931 * Contributory exceptions are ones which can cause double-faults unless the
3932 * original exception was a benign exception. Page-fault is intentionally not
3933 * included here as it's a conditional contributory exception.
3934 *
3935 * @returns true if the exception is contributory, false otherwise.
3936 * @param uVector The exception vector.
3937 */
3938DECLINLINE(bool) hmR0SvmIsContributoryXcpt(const uint32_t uVector)
3939{
3940 switch (uVector)
3941 {
3942 case X86_XCPT_GP:
3943 case X86_XCPT_SS:
3944 case X86_XCPT_NP:
3945 case X86_XCPT_TS:
3946 case X86_XCPT_DE:
3947 return true;
3948 default:
3949 break;
3950 }
3951 return false;
3952}
3953
3954
3955/**
3956 * Handle a condition that occurred while delivering an event through the guest
3957 * IDT.
3958 *
3959 * @returns VBox status code (informational error codes included).
3960 * @retval VINF_SUCCESS if we should continue handling the \#VMEXIT.
3961 * @retval VINF_HM_DOUBLE_FAULT if a \#DF condition was detected and we ought to
3962 * continue execution of the guest which will delivery the \#DF.
3963 * @retval VINF_EM_RESET if we detected a triple-fault condition.
3964 * @retval VERR_EM_GUEST_CPU_HANG if we detected a guest CPU hang.
3965 *
3966 * @param pVCpu The cross context virtual CPU structure.
3967 * @param pCtx Pointer to the guest-CPU context.
3968 * @param pSvmTransient Pointer to the SVM transient structure.
3969 *
3970 * @remarks No-long-jump zone!!!
3971 */
3972static int hmR0SvmCheckExitDueToEventDelivery(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
3973{
3974 int rc = VINF_SUCCESS;
3975 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
3976
3977 Log4(("EXITINTINFO: Pending vectoring event %#RX64 Valid=%RTbool ErrValid=%RTbool Err=%#RX32 Type=%u Vector=%u\n",
3978 pVmcb->ctrl.ExitIntInfo.u, !!pVmcb->ctrl.ExitIntInfo.n.u1Valid, !!pVmcb->ctrl.ExitIntInfo.n.u1ErrorCodeValid,
3979 pVmcb->ctrl.ExitIntInfo.n.u32ErrorCode, pVmcb->ctrl.ExitIntInfo.n.u3Type, pVmcb->ctrl.ExitIntInfo.n.u8Vector));
3980
3981 /* See AMD spec. 15.7.3 "EXITINFO Pseudo-Code". The EXITINTINFO (if valid) contains the prior exception (IDT vector)
3982 * that was trying to be delivered to the guest which caused a #VMEXIT which was intercepted (Exit vector). */
3983 if (pVmcb->ctrl.ExitIntInfo.n.u1Valid)
3984 {
3985 uint8_t uIdtVector = pVmcb->ctrl.ExitIntInfo.n.u8Vector;
3986
3987 typedef enum
3988 {
3989 SVMREFLECTXCPT_XCPT, /* Reflect the exception to the guest or for further evaluation by VMM. */
3990 SVMREFLECTXCPT_DF, /* Reflect the exception as a double-fault to the guest. */
3991 SVMREFLECTXCPT_TF, /* Indicate a triple faulted state to the VMM. */
3992 SVMREFLECTXCPT_HANG, /* Indicate bad VM trying to deadlock the CPU. */
3993 SVMREFLECTXCPT_NONE /* Nothing to reflect. */
3994 } SVMREFLECTXCPT;
3995
3996 SVMREFLECTXCPT enmReflect = SVMREFLECTXCPT_NONE;
3997 bool fReflectingNmi = false;
3998 if (pVmcb->ctrl.ExitIntInfo.n.u3Type == SVM_EVENT_EXCEPTION)
3999 {
4000 if (pSvmTransient->u64ExitCode - SVM_EXIT_EXCEPTION_0 <= SVM_EXIT_EXCEPTION_31)
4001 {
4002 uint8_t uExitVector = (uint8_t)(pSvmTransient->u64ExitCode - SVM_EXIT_EXCEPTION_0);
4003
4004#ifdef VBOX_STRICT
4005 if ( hmR0SvmIsContributoryXcpt(uIdtVector)
4006 && uExitVector == X86_XCPT_PF)
4007 {
4008 Log4(("IDT: Contributory #PF idCpu=%u uCR2=%#RX64\n", pVCpu->idCpu, pCtx->cr2));
4009 }
4010#endif
4011
4012 if ( uIdtVector == X86_XCPT_BP
4013 || uIdtVector == X86_XCPT_OF)
4014 {
4015 /* Ignore INT3/INTO, just re-execute. See @bugref{8357}. */
4016 }
4017 else if ( uExitVector == X86_XCPT_PF
4018 && uIdtVector == X86_XCPT_PF)
4019 {
4020 pSvmTransient->fVectoringDoublePF = true;
4021 Log4(("IDT: Vectoring double #PF uCR2=%#RX64\n", pCtx->cr2));
4022 }
4023 else if ( uExitVector == X86_XCPT_AC
4024 && uIdtVector == X86_XCPT_AC)
4025 {
4026 enmReflect = SVMREFLECTXCPT_HANG;
4027 Log4(("IDT: Nested #AC - Bad guest\n"));
4028 }
4029 else if ( (pVmcb->ctrl.u32InterceptXcpt & HMSVM_CONTRIBUTORY_XCPT_MASK)
4030 && hmR0SvmIsContributoryXcpt(uExitVector)
4031 && ( hmR0SvmIsContributoryXcpt(uIdtVector)
4032 || uIdtVector == X86_XCPT_PF))
4033 {
4034 enmReflect = SVMREFLECTXCPT_DF;
4035 Log4(("IDT: Pending vectoring #DF %#RX64 uIdtVector=%#x uExitVector=%#x\n", pVCpu->hm.s.Event.u64IntInfo,
4036 uIdtVector, uExitVector));
4037 }
4038 else if (uIdtVector == X86_XCPT_DF)
4039 {
4040 enmReflect = SVMREFLECTXCPT_TF;
4041 Log4(("IDT: Pending vectoring triple-fault %#RX64 uIdtVector=%#x uExitVector=%#x\n",
4042 pVCpu->hm.s.Event.u64IntInfo, uIdtVector, uExitVector));
4043 }
4044 else
4045 enmReflect = SVMREFLECTXCPT_XCPT;
4046 }
4047 else
4048 {
4049 /*
4050 * If event delivery caused an #VMEXIT that is not an exception (e.g. #NPF) then reflect the original
4051 * exception to the guest after handling the #VMEXIT.
4052 */
4053 enmReflect = SVMREFLECTXCPT_XCPT;
4054 }
4055 }
4056 else if ( pVmcb->ctrl.ExitIntInfo.n.u3Type == SVM_EVENT_EXTERNAL_IRQ
4057 || pVmcb->ctrl.ExitIntInfo.n.u3Type == SVM_EVENT_NMI)
4058 {
4059 enmReflect = SVMREFLECTXCPT_XCPT;
4060 fReflectingNmi = RT_BOOL(pVmcb->ctrl.ExitIntInfo.n.u3Type == SVM_EVENT_NMI);
4061
4062 if (pSvmTransient->u64ExitCode - SVM_EXIT_EXCEPTION_0 <= SVM_EXIT_EXCEPTION_31)
4063 {
4064 uint8_t uExitVector = (uint8_t)(pSvmTransient->u64ExitCode - SVM_EXIT_EXCEPTION_0);
4065 if (uExitVector == X86_XCPT_PF)
4066 {
4067 pSvmTransient->fVectoringPF = true;
4068 Log4(("IDT: Vectoring #PF due to Ext-Int/NMI. uCR2=%#RX64\n", pCtx->cr2));
4069 }
4070 }
4071 }
4072 /* else: Ignore software interrupts (INT n) as they reoccur when restarting the instruction. */
4073
4074 switch (enmReflect)
4075 {
4076 case SVMREFLECTXCPT_XCPT:
4077 {
4078 /* If we are re-injecting the NMI, clear NMI blocking. */
4079 if (fReflectingNmi)
4080 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_BLOCK_NMIS);
4081
4082 Assert(pVmcb->ctrl.ExitIntInfo.n.u3Type != SVM_EVENT_SOFTWARE_INT);
4083 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingReflect);
4084 hmR0SvmSetPendingEvent(pVCpu, &pVmcb->ctrl.ExitIntInfo, 0 /* GCPtrFaultAddress */);
4085
4086 /* If uExitVector is #PF, CR2 value will be updated from the VMCB if it's a guest #PF. See hmR0SvmExitXcptPF(). */
4087 Log4(("IDT: Pending vectoring event %#RX64 ErrValid=%RTbool Err=%#RX32\n", pVmcb->ctrl.ExitIntInfo.u,
4088 !!pVmcb->ctrl.ExitIntInfo.n.u1ErrorCodeValid, pVmcb->ctrl.ExitIntInfo.n.u32ErrorCode));
4089 break;
4090 }
4091
4092 case SVMREFLECTXCPT_DF:
4093 {
4094 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingReflect);
4095 hmR0SvmSetPendingXcptDF(pVCpu);
4096 rc = VINF_HM_DOUBLE_FAULT;
4097 break;
4098 }
4099
4100 case SVMREFLECTXCPT_TF:
4101 {
4102 rc = VINF_EM_RESET;
4103 break;
4104 }
4105
4106 case SVMREFLECTXCPT_HANG:
4107 {
4108 rc = VERR_EM_GUEST_CPU_HANG;
4109 break;
4110 }
4111
4112 default:
4113 Assert(rc == VINF_SUCCESS);
4114 break;
4115 }
4116 }
4117 Assert(rc == VINF_SUCCESS || rc == VINF_HM_DOUBLE_FAULT || rc == VINF_EM_RESET || rc == VERR_EM_GUEST_CPU_HANG);
4118 NOREF(pCtx);
4119 return rc;
4120}
4121
4122
4123/**
4124 * Updates interrupt shadow for the current RIP.
4125 */
4126#define HMSVM_UPDATE_INTR_SHADOW(pVCpu, pCtx) \
4127 do { \
4128 /* Update interrupt shadow. */ \
4129 if ( VMCPU_FF_IS_PENDING(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS) \
4130 && pCtx->rip != EMGetInhibitInterruptsPC(pVCpu)) \
4131 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_INHIBIT_INTERRUPTS); \
4132 } while (0)
4133
4134
4135/**
4136 * Advances the guest RIP making use of the CPU's NRIP_SAVE feature if
4137 * supported, otherwise advances the RIP by the number of bytes specified in
4138 * @a cb.
4139 *
4140 * @param pVCpu The cross context virtual CPU structure.
4141 * @param pCtx Pointer to the guest-CPU context.
4142 * @param cb RIP increment value in bytes.
4143 *
4144 * @remarks Use this function only from \#VMEXIT's where the NRIP value is valid
4145 * when NRIP_SAVE is supported by the CPU, otherwise use
4146 * hmR0SvmAdvanceRipDumb!
4147 */
4148DECLINLINE(void) hmR0SvmAdvanceRipHwAssist(PVMCPU pVCpu, PCPUMCTX pCtx, uint32_t cb)
4149{
4150 if (pVCpu->CTX_SUFF(pVM)->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_NRIP_SAVE)
4151 {
4152 PCSVMVMCB pVmcb = (PCSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4153 Assert(pVmcb->ctrl.u64NextRIP);
4154 AssertRelease(pVmcb->ctrl.u64NextRIP - pCtx->rip == cb); /* temporary, remove later */
4155 pCtx->rip = pVmcb->ctrl.u64NextRIP;
4156 }
4157 else
4158 pCtx->rip += cb;
4159
4160 HMSVM_UPDATE_INTR_SHADOW(pVCpu, pCtx);
4161}
4162
4163/* Currently only used by nested hw.virt instructions, so ifdef'd as such, otherwise compilers start whining. */
4164#ifdef VBOX_WITH_NESTED_HWVIRT
4165/**
4166 * Gets the length of the current instruction if the CPU supports the NRIP_SAVE
4167 * feature. Otherwise, returns the value in @a cbLikely.
4168 *
4169 * @param pVCpu The cross context virtual CPU structure.
4170 * @param pCtx Pointer to the guest-CPU context.
4171 * @param cbLikely The likely instruction length.
4172 */
4173DECLINLINE(uint8_t) hmR0SvmGetInstrLengthHwAssist(PVMCPU pVCpu, PCPUMCTX pCtx, uint8_t cbLikely)
4174{
4175 Assert(cbLikely <= 15); /* See Intel spec. 2.3.11 "AVX Instruction Length" */
4176 if (pVCpu->CTX_SUFF(pVM)->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_NRIP_SAVE)
4177 {
4178 PCSVMVMCB pVmcb = (PCSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4179 uint8_t const cbInstr = pVmcb->ctrl.u64NextRIP - pCtx->rip;
4180 Assert(cbInstr == cbLikely);
4181 return cbInstr;
4182 }
4183 return cbLikely;
4184}
4185#endif
4186
4187/**
4188 * Advances the guest RIP by the number of bytes specified in @a cb. This does
4189 * not make use of any hardware features to determine the instruction length.
4190 *
4191 * @param pVCpu The cross context virtual CPU structure.
4192 * @param pCtx Pointer to the guest-CPU context.
4193 * @param cb RIP increment value in bytes.
4194 */
4195DECLINLINE(void) hmR0SvmAdvanceRipDumb(PVMCPU pVCpu, PCPUMCTX pCtx, uint32_t cb)
4196{
4197 pCtx->rip += cb;
4198 HMSVM_UPDATE_INTR_SHADOW(pVCpu, pCtx);
4199}
4200#undef HMSVM_UPDATE_INTR_SHADOW
4201
4202
4203/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
4204/* -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=- #VMEXIT handlers -=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=- */
4205/* -=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=--=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-= */
4206
4207/** @name \#VMEXIT handlers.
4208 * @{
4209 */
4210
4211/**
4212 * \#VMEXIT handler for external interrupts, NMIs, FPU assertion freeze and INIT
4213 * signals (SVM_EXIT_INTR, SVM_EXIT_NMI, SVM_EXIT_FERR_FREEZE, SVM_EXIT_INIT).
4214 */
4215HMSVM_EXIT_DECL hmR0SvmExitIntr(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4216{
4217 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4218
4219 if (pSvmTransient->u64ExitCode == SVM_EXIT_NMI)
4220 STAM_REL_COUNTER_INC(&pVCpu->hm.s.StatExitHostNmiInGC);
4221 else if (pSvmTransient->u64ExitCode == SVM_EXIT_INTR)
4222 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitExtInt);
4223
4224 /*
4225 * AMD-V has no preemption timer and the generic periodic preemption timer has no way to signal -before- the timer
4226 * fires if the current interrupt is our own timer or a some other host interrupt. We also cannot examine what
4227 * interrupt it is until the host actually take the interrupt.
4228 *
4229 * Going back to executing guest code here unconditionally causes random scheduling problems (observed on an
4230 * AMD Phenom 9850 Quad-Core on Windows 64-bit host).
4231 */
4232 return VINF_EM_RAW_INTERRUPT;
4233}
4234
4235
4236/**
4237 * \#VMEXIT handler for WBINVD (SVM_EXIT_WBINVD). Conditional \#VMEXIT.
4238 */
4239HMSVM_EXIT_DECL hmR0SvmExitWbinvd(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4240{
4241 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4242
4243 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4244 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitWbinvd);
4245 int rc = VINF_SUCCESS;
4246 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4247 return rc;
4248}
4249
4250
4251/**
4252 * \#VMEXIT handler for INVD (SVM_EXIT_INVD). Unconditional \#VMEXIT.
4253 */
4254HMSVM_EXIT_DECL hmR0SvmExitInvd(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4255{
4256 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4257
4258 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4259 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitInvd);
4260 int rc = VINF_SUCCESS;
4261 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4262 return rc;
4263}
4264
4265
4266/**
4267 * \#VMEXIT handler for INVD (SVM_EXIT_CPUID). Conditional \#VMEXIT.
4268 */
4269HMSVM_EXIT_DECL hmR0SvmExitCpuid(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4270{
4271 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4272 PVM pVM = pVCpu->CTX_SUFF(pVM);
4273 int rc = EMInterpretCpuId(pVM, pVCpu, CPUMCTX2CORE(pCtx));
4274 if (RT_LIKELY(rc == VINF_SUCCESS))
4275 {
4276 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4277 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4278 }
4279 else
4280 {
4281 AssertMsgFailed(("hmR0SvmExitCpuid: EMInterpretCpuId failed with %Rrc\n", rc));
4282 rc = VERR_EM_INTERPRETER;
4283 }
4284 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCpuid);
4285 return rc;
4286}
4287
4288
4289/**
4290 * \#VMEXIT handler for RDTSC (SVM_EXIT_RDTSC). Conditional \#VMEXIT.
4291 */
4292HMSVM_EXIT_DECL hmR0SvmExitRdtsc(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4293{
4294 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4295 PVM pVM = pVCpu->CTX_SUFF(pVM);
4296 int rc = EMInterpretRdtsc(pVM, pVCpu, CPUMCTX2CORE(pCtx));
4297 if (RT_LIKELY(rc == VINF_SUCCESS))
4298 {
4299 pSvmTransient->fUpdateTscOffsetting = true;
4300 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4301 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4302 }
4303 else
4304 {
4305 AssertMsgFailed(("hmR0SvmExitRdtsc: EMInterpretRdtsc failed with %Rrc\n", rc));
4306 rc = VERR_EM_INTERPRETER;
4307 }
4308 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitRdtsc);
4309 return rc;
4310}
4311
4312
4313/**
4314 * \#VMEXIT handler for RDTSCP (SVM_EXIT_RDTSCP). Conditional \#VMEXIT.
4315 */
4316HMSVM_EXIT_DECL hmR0SvmExitRdtscp(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4317{
4318 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4319 int rc = EMInterpretRdtscp(pVCpu->CTX_SUFF(pVM), pVCpu, pCtx);
4320 if (RT_LIKELY(rc == VINF_SUCCESS))
4321 {
4322 pSvmTransient->fUpdateTscOffsetting = true;
4323 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 3);
4324 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4325 }
4326 else
4327 {
4328 AssertMsgFailed(("hmR0SvmExitRdtsc: EMInterpretRdtscp failed with %Rrc\n", rc));
4329 rc = VERR_EM_INTERPRETER;
4330 }
4331 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitRdtscp);
4332 return rc;
4333}
4334
4335
4336/**
4337 * \#VMEXIT handler for RDPMC (SVM_EXIT_RDPMC). Conditional \#VMEXIT.
4338 */
4339HMSVM_EXIT_DECL hmR0SvmExitRdpmc(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4340{
4341 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4342 int rc = EMInterpretRdpmc(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx));
4343 if (RT_LIKELY(rc == VINF_SUCCESS))
4344 {
4345 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4346 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4347 }
4348 else
4349 {
4350 AssertMsgFailed(("hmR0SvmExitRdpmc: EMInterpretRdpmc failed with %Rrc\n", rc));
4351 rc = VERR_EM_INTERPRETER;
4352 }
4353 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitRdpmc);
4354 return rc;
4355}
4356
4357
4358/**
4359 * \#VMEXIT handler for INVLPG (SVM_EXIT_INVLPG). Conditional \#VMEXIT.
4360 */
4361HMSVM_EXIT_DECL hmR0SvmExitInvlpg(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4362{
4363 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4364 PVM pVM = pVCpu->CTX_SUFF(pVM);
4365 Assert(!pVM->hm.s.fNestedPaging);
4366
4367 /** @todo Decode Assist. */
4368 int rc = hmR0SvmInterpretInvlpg(pVM, pVCpu, pCtx); /* Updates RIP if successful. */
4369 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitInvlpg);
4370 Assert(rc == VINF_SUCCESS || rc == VERR_EM_INTERPRETER);
4371 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4372 return rc;
4373}
4374
4375
4376/**
4377 * \#VMEXIT handler for HLT (SVM_EXIT_HLT). Conditional \#VMEXIT.
4378 */
4379HMSVM_EXIT_DECL hmR0SvmExitHlt(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4380{
4381 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4382
4383 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 1);
4384 int rc = EMShouldContinueAfterHalt(pVCpu, pCtx) ? VINF_SUCCESS : VINF_EM_HALT;
4385 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4386 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitHlt);
4387 if (rc != VINF_SUCCESS)
4388 STAM_COUNTER_INC(&pVCpu->hm.s.StatSwitchHltToR3);
4389 return rc;
4390}
4391
4392
4393/**
4394 * \#VMEXIT handler for MONITOR (SVM_EXIT_MONITOR). Conditional \#VMEXIT.
4395 */
4396HMSVM_EXIT_DECL hmR0SvmExitMonitor(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4397{
4398 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4399 int rc = EMInterpretMonitor(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx));
4400 if (RT_LIKELY(rc == VINF_SUCCESS))
4401 {
4402 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 3);
4403 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4404 }
4405 else
4406 {
4407 AssertMsg(rc == VERR_EM_INTERPRETER, ("hmR0SvmExitMonitor: EMInterpretMonitor failed with %Rrc\n", rc));
4408 rc = VERR_EM_INTERPRETER;
4409 }
4410 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitMonitor);
4411 return rc;
4412}
4413
4414
4415/**
4416 * \#VMEXIT handler for MWAIT (SVM_EXIT_MWAIT). Conditional \#VMEXIT.
4417 */
4418HMSVM_EXIT_DECL hmR0SvmExitMwait(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4419{
4420 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4421 VBOXSTRICTRC rc2 = EMInterpretMWait(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx));
4422 int rc = VBOXSTRICTRC_VAL(rc2);
4423 if ( rc == VINF_EM_HALT
4424 || rc == VINF_SUCCESS)
4425 {
4426 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 3);
4427
4428 if ( rc == VINF_EM_HALT
4429 && EMMonitorWaitShouldContinue(pVCpu, pCtx))
4430 {
4431 rc = VINF_SUCCESS;
4432 }
4433 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4434 }
4435 else
4436 {
4437 AssertMsg(rc == VERR_EM_INTERPRETER, ("hmR0SvmExitMwait: EMInterpretMWait failed with %Rrc\n", rc));
4438 rc = VERR_EM_INTERPRETER;
4439 }
4440 AssertMsg(rc == VINF_SUCCESS || rc == VINF_EM_HALT || rc == VERR_EM_INTERPRETER,
4441 ("hmR0SvmExitMwait: EMInterpretMWait failed rc=%Rrc\n", rc));
4442 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitMwait);
4443 return rc;
4444}
4445
4446
4447/**
4448 * \#VMEXIT handler for shutdown (triple-fault) (SVM_EXIT_SHUTDOWN). Conditional
4449 * \#VMEXIT.
4450 */
4451HMSVM_EXIT_DECL hmR0SvmExitShutdown(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4452{
4453 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4454 return VINF_EM_RESET;
4455}
4456
4457
4458/**
4459 * \#VMEXIT handler for CRx reads (SVM_EXIT_READ_CR*). Conditional \#VMEXIT.
4460 */
4461HMSVM_EXIT_DECL hmR0SvmExitReadCRx(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4462{
4463 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4464
4465 Log4(("hmR0SvmExitReadCRx: CS:RIP=%04x:%#RX64\n", pCtx->cs.Sel, pCtx->rip));
4466
4467 /** @todo Decode Assist. */
4468 VBOXSTRICTRC rc2 = EMInterpretInstruction(pVCpu, CPUMCTX2CORE(pCtx), 0 /* pvFault */);
4469 int rc = VBOXSTRICTRC_VAL(rc2);
4470 AssertMsg(rc == VINF_SUCCESS || rc == VERR_EM_INTERPRETER || rc == VINF_PGM_CHANGE_MODE || rc == VINF_PGM_SYNC_CR3,
4471 ("hmR0SvmExitReadCRx: EMInterpretInstruction failed rc=%Rrc\n", rc));
4472 Assert((pSvmTransient->u64ExitCode - SVM_EXIT_READ_CR0) <= 15);
4473 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitCRxRead[pSvmTransient->u64ExitCode - SVM_EXIT_READ_CR0]);
4474 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4475 return rc;
4476}
4477
4478
4479/**
4480 * \#VMEXIT handler for CRx writes (SVM_EXIT_WRITE_CR*). Conditional \#VMEXIT.
4481 */
4482HMSVM_EXIT_DECL hmR0SvmExitWriteCRx(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4483{
4484 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4485
4486 /** @todo Decode Assist. */
4487 VBOXSTRICTRC rcStrict = IEMExecOneBypassEx(pVCpu, CPUMCTX2CORE(pCtx), NULL);
4488 if (RT_UNLIKELY( rcStrict == VERR_IEM_ASPECT_NOT_IMPLEMENTED
4489 || rcStrict == VERR_IEM_INSTR_NOT_IMPLEMENTED))
4490 rcStrict = VERR_EM_INTERPRETER;
4491 if (rcStrict == VINF_SUCCESS)
4492 {
4493 /* RIP has been updated by EMInterpretInstruction(). */
4494 Assert((pSvmTransient->u64ExitCode - SVM_EXIT_WRITE_CR0) <= 15);
4495 switch (pSvmTransient->u64ExitCode - SVM_EXIT_WRITE_CR0)
4496 {
4497 case 0: /* CR0. */
4498 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR0);
4499 break;
4500
4501 case 3: /* CR3. */
4502 Assert(!pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging);
4503 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR3);
4504 break;
4505
4506 case 4: /* CR4. */
4507 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR4);
4508 break;
4509
4510 case 8: /* CR8 (TPR). */
4511 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
4512 break;
4513
4514 default:
4515 AssertMsgFailed(("hmR0SvmExitWriteCRx: Invalid/Unexpected Write-CRx exit. u64ExitCode=%#RX64 %#x\n",
4516 pSvmTransient->u64ExitCode, pSvmTransient->u64ExitCode - SVM_EXIT_WRITE_CR0));
4517 break;
4518 }
4519 HMSVM_CHECK_SINGLE_STEP(pVCpu, rcStrict);
4520 }
4521 else
4522 Assert(rcStrict == VERR_EM_INTERPRETER || rcStrict == VINF_PGM_CHANGE_MODE || rcStrict == VINF_PGM_SYNC_CR3);
4523 return VBOXSTRICTRC_TODO(rcStrict);
4524}
4525
4526
4527/**
4528 * \#VMEXIT handler for instructions that result in a \#UD exception delivered
4529 * to the guest.
4530 */
4531HMSVM_EXIT_DECL hmR0SvmExitSetPendingXcptUD(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4532{
4533 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4534 hmR0SvmSetPendingXcptUD(pVCpu);
4535 return VINF_SUCCESS;
4536}
4537
4538
4539/**
4540 * \#VMEXIT handler for MSR read and writes (SVM_EXIT_MSR). Conditional
4541 * \#VMEXIT.
4542 */
4543HMSVM_EXIT_DECL hmR0SvmExitMsr(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4544{
4545 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4546 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4547 PVM pVM = pVCpu->CTX_SUFF(pVM);
4548
4549 int rc;
4550 if (pVmcb->ctrl.u64ExitInfo1 == SVM_EXIT1_MSR_WRITE)
4551 {
4552 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitWrmsr);
4553
4554 /* Handle TPR patching; intercepted LSTAR write. */
4555 if ( pVM->hm.s.fTPRPatchingActive
4556 && pCtx->ecx == MSR_K8_LSTAR)
4557 {
4558 if ((pCtx->eax & 0xff) != pSvmTransient->u8GuestTpr)
4559 {
4560 /* Our patch code uses LSTAR for TPR caching for 32-bit guests. */
4561 int rc2 = APICSetTpr(pVCpu, pCtx->eax & 0xff);
4562 AssertRC(rc2);
4563 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
4564 }
4565 rc = VINF_SUCCESS;
4566 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 2);
4567 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4568 return rc;
4569 }
4570
4571 if (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_NRIP_SAVE)
4572 {
4573 rc = EMInterpretWrmsr(pVM, pVCpu, CPUMCTX2CORE(pCtx));
4574 if (RT_LIKELY(rc == VINF_SUCCESS))
4575 {
4576 pCtx->rip = pVmcb->ctrl.u64NextRIP;
4577 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4578 }
4579 else
4580 AssertMsg( rc == VERR_EM_INTERPRETER
4581 || rc == VINF_CPUM_R3_MSR_WRITE, ("hmR0SvmExitMsr: EMInterpretWrmsr failed rc=%Rrc\n", rc));
4582 }
4583 else
4584 {
4585 rc = VBOXSTRICTRC_TODO(EMInterpretInstruction(pVCpu, CPUMCTX2CORE(pCtx), 0 /* pvFault */));
4586 if (RT_LIKELY(rc == VINF_SUCCESS))
4587 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc); /* RIP updated by EMInterpretInstruction(). */
4588 else
4589 AssertMsg( rc == VERR_EM_INTERPRETER
4590 || rc == VINF_CPUM_R3_MSR_WRITE, ("hmR0SvmExitMsr: WrMsr. EMInterpretInstruction failed rc=%Rrc\n", rc));
4591 }
4592
4593 if (rc == VINF_SUCCESS)
4594 {
4595 /* If this is an X2APIC WRMSR access, update the APIC state as well. */
4596 if ( pCtx->ecx >= MSR_IA32_X2APIC_START
4597 && pCtx->ecx <= MSR_IA32_X2APIC_END)
4598 {
4599 /*
4600 * We've already saved the APIC related guest-state (TPR) in hmR0SvmPostRunGuest(). When full APIC register
4601 * virtualization is implemented we'll have to make sure APIC state is saved from the VMCB before
4602 * EMInterpretWrmsr() changes it.
4603 */
4604 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
4605 }
4606 else if (pCtx->ecx == MSR_K6_EFER)
4607 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_EFER_MSR);
4608 else if (pCtx->ecx == MSR_IA32_TSC)
4609 pSvmTransient->fUpdateTscOffsetting = true;
4610 }
4611 }
4612 else
4613 {
4614 /* MSR Read access. */
4615 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitRdmsr);
4616 Assert(pVmcb->ctrl.u64ExitInfo1 == SVM_EXIT1_MSR_READ);
4617
4618 if (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_NRIP_SAVE)
4619 {
4620 rc = EMInterpretRdmsr(pVM, pVCpu, CPUMCTX2CORE(pCtx));
4621 if (RT_LIKELY(rc == VINF_SUCCESS))
4622 {
4623 pCtx->rip = pVmcb->ctrl.u64NextRIP;
4624 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4625 }
4626 else
4627 AssertMsg( rc == VERR_EM_INTERPRETER
4628 || rc == VINF_CPUM_R3_MSR_READ, ("hmR0SvmExitMsr: EMInterpretRdmsr failed rc=%Rrc\n", rc));
4629 }
4630 else
4631 {
4632 rc = VBOXSTRICTRC_TODO(EMInterpretInstruction(pVCpu, CPUMCTX2CORE(pCtx), 0));
4633 if (RT_UNLIKELY(rc != VINF_SUCCESS))
4634 {
4635 AssertMsg( rc == VERR_EM_INTERPRETER
4636 || rc == VINF_CPUM_R3_MSR_READ, ("hmR0SvmExitMsr: RdMsr. EMInterpretInstruction failed rc=%Rrc\n", rc));
4637 }
4638 /* RIP updated by EMInterpretInstruction(). */
4639 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4640 }
4641 }
4642
4643 /* RIP has been updated by EMInterpret[Rd|Wr]msr(). */
4644 return rc;
4645}
4646
4647
4648/**
4649 * \#VMEXIT handler for DRx read (SVM_EXIT_READ_DRx). Conditional \#VMEXIT.
4650 */
4651HMSVM_EXIT_DECL hmR0SvmExitReadDRx(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4652{
4653 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4654 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxRead);
4655
4656 /* We should -not- get this #VMEXIT if the guest's debug registers were active. */
4657 if (pSvmTransient->fWasGuestDebugStateActive)
4658 {
4659 AssertMsgFailed(("hmR0SvmHandleExit: Unexpected exit %#RX32\n", (uint32_t)pSvmTransient->u64ExitCode));
4660 pVCpu->hm.s.u32HMError = (uint32_t)pSvmTransient->u64ExitCode;
4661 return VERR_SVM_UNEXPECTED_EXIT;
4662 }
4663
4664 /*
4665 * Lazy DR0-3 loading.
4666 */
4667 if (!pSvmTransient->fWasHyperDebugStateActive)
4668 {
4669 Assert(!DBGFIsStepping(pVCpu)); Assert(!pVCpu->hm.s.fSingleInstruction);
4670 Log5(("hmR0SvmExitReadDRx: Lazy loading guest debug registers\n"));
4671
4672 /* Don't intercept DRx read and writes. */
4673 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4674 pVmcb->ctrl.u16InterceptRdDRx = 0;
4675 pVmcb->ctrl.u16InterceptWrDRx = 0;
4676 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_INTERCEPTS;
4677
4678 /* We're playing with the host CPU state here, make sure we don't preempt or longjmp. */
4679 VMMRZCallRing3Disable(pVCpu);
4680 HM_DISABLE_PREEMPT();
4681
4682 /* Save the host & load the guest debug state, restart execution of the MOV DRx instruction. */
4683 CPUMR0LoadGuestDebugState(pVCpu, false /* include DR6 */);
4684 Assert(CPUMIsGuestDebugStateActive(pVCpu) || HC_ARCH_BITS == 32);
4685
4686 HM_RESTORE_PREEMPT();
4687 VMMRZCallRing3Enable(pVCpu);
4688
4689 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxContextSwitch);
4690 return VINF_SUCCESS;
4691 }
4692
4693 /*
4694 * Interpret the read/writing of DRx.
4695 */
4696 /** @todo Decode assist. */
4697 VBOXSTRICTRC rc = EMInterpretInstruction(pVCpu, CPUMCTX2CORE(pCtx), 0 /* pvFault */);
4698 Log5(("hmR0SvmExitReadDRx: Emulated DRx access: rc=%Rrc\n", VBOXSTRICTRC_VAL(rc)));
4699 if (RT_LIKELY(rc == VINF_SUCCESS))
4700 {
4701 /* Not necessary for read accesses but whatever doesn't hurt for now, will be fixed with decode assist. */
4702 /** @todo CPUM should set this flag! */
4703 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_DEBUG);
4704 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
4705 }
4706 else
4707 Assert(rc == VERR_EM_INTERPRETER);
4708 return VBOXSTRICTRC_TODO(rc);
4709}
4710
4711
4712/**
4713 * \#VMEXIT handler for DRx write (SVM_EXIT_WRITE_DRx). Conditional \#VMEXIT.
4714 */
4715HMSVM_EXIT_DECL hmR0SvmExitWriteDRx(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4716{
4717 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4718 /* For now it's the same since we interpret the instruction anyway. Will change when using of Decode Assist is implemented. */
4719 int rc = hmR0SvmExitReadDRx(pVCpu, pCtx, pSvmTransient);
4720 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitDRxWrite);
4721 STAM_COUNTER_DEC(&pVCpu->hm.s.StatExitDRxRead);
4722 return rc;
4723}
4724
4725
4726/**
4727 * \#VMEXIT handler for XCRx write (SVM_EXIT_XSETBV). Conditional \#VMEXIT.
4728 */
4729HMSVM_EXIT_DECL hmR0SvmExitXsetbv(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4730{
4731 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4732
4733 /** @todo decode assists... */
4734 VBOXSTRICTRC rcStrict = IEMExecOne(pVCpu);
4735 if (rcStrict == VINF_IEM_RAISED_XCPT)
4736 HMCPU_CF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
4737
4738 pVCpu->hm.s.fLoadSaveGuestXcr0 = (pCtx->cr4 & X86_CR4_OSXSAVE) && pCtx->aXcr[0] != ASMGetXcr0();
4739 Log4(("hmR0SvmExitXsetbv: New XCR0=%#RX64 fLoadSaveGuestXcr0=%d (cr4=%RX64) rcStrict=%Rrc\n",
4740 pCtx->aXcr[0], pVCpu->hm.s.fLoadSaveGuestXcr0, pCtx->cr4, VBOXSTRICTRC_VAL(rcStrict)));
4741
4742 HMSVM_CHECK_SINGLE_STEP(pVCpu, rcStrict);
4743 return VBOXSTRICTRC_TODO(rcStrict);
4744}
4745
4746
4747/**
4748 * \#VMEXIT handler for I/O instructions (SVM_EXIT_IOIO). Conditional \#VMEXIT.
4749 */
4750HMSVM_EXIT_DECL hmR0SvmExitIOInstr(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4751{
4752 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4753
4754 /* I/O operation lookup arrays. */
4755 static uint32_t const s_aIOSize[8] = { 0, 1, 2, 0, 4, 0, 0, 0 }; /* Size of the I/O accesses in bytes. */
4756 static uint32_t const s_aIOOpAnd[8] = { 0, 0xff, 0xffff, 0, 0xffffffff, 0, 0, 0 }; /* AND masks for saving
4757 the result (in AL/AX/EAX). */
4758 Log4(("hmR0SvmExitIOInstr: CS:RIP=%04x:%#RX64\n", pCtx->cs.Sel, pCtx->rip));
4759
4760 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4761 PVM pVM = pVCpu->CTX_SUFF(pVM);
4762
4763 /* Refer AMD spec. 15.10.2 "IN and OUT Behaviour" and Figure 15-2. "EXITINFO1 for IOIO Intercept" for the format. */
4764 SVMIOIOEXITINFO IoExitInfo;
4765 IoExitInfo.u = (uint32_t)pVmcb->ctrl.u64ExitInfo1;
4766 uint32_t uIOWidth = (IoExitInfo.u >> 4) & 0x7;
4767 uint32_t cbValue = s_aIOSize[uIOWidth];
4768 uint32_t uAndVal = s_aIOOpAnd[uIOWidth];
4769
4770 if (RT_UNLIKELY(!cbValue))
4771 {
4772 AssertMsgFailed(("hmR0SvmExitIOInstr: Invalid IO operation. uIOWidth=%u\n", uIOWidth));
4773 return VERR_EM_INTERPRETER;
4774 }
4775
4776 VBOXSTRICTRC rcStrict;
4777 bool fUpdateRipAlready = false;
4778 if (IoExitInfo.n.u1STR)
4779 {
4780#ifdef VBOX_WITH_2ND_IEM_STEP
4781 /* INS/OUTS - I/O String instruction. */
4782 /** @todo Huh? why can't we use the segment prefix information given by AMD-V
4783 * in EXITINFO1? Investigate once this thing is up and running. */
4784 Log4(("CS:RIP=%04x:%08RX64 %#06x/%u %c str\n", pCtx->cs.Sel, pCtx->rip, IoExitInfo.n.u16Port, cbValue,
4785 IoExitInfo.n.u1Type == SVM_IOIO_WRITE ? 'w' : 'r'));
4786 AssertReturn(pCtx->dx == IoExitInfo.n.u16Port, VERR_SVM_IPE_2);
4787 static IEMMODE const s_aenmAddrMode[8] =
4788 {
4789 (IEMMODE)-1, IEMMODE_16BIT, IEMMODE_32BIT, (IEMMODE)-1, IEMMODE_64BIT, (IEMMODE)-1, (IEMMODE)-1, (IEMMODE)-1
4790 };
4791 IEMMODE enmAddrMode = s_aenmAddrMode[(IoExitInfo.u >> 7) & 0x7];
4792 if (enmAddrMode != (IEMMODE)-1)
4793 {
4794 uint64_t cbInstr = pVmcb->ctrl.u64ExitInfo2 - pCtx->rip;
4795 if (cbInstr <= 15 && cbInstr >= 1)
4796 {
4797 Assert(cbInstr >= 1U + IoExitInfo.n.u1REP);
4798 if (IoExitInfo.n.u1Type == SVM_IOIO_WRITE)
4799 {
4800 /* Don't know exactly how to detect whether u3SEG is valid, currently
4801 only enabling it for Bulldozer and later with NRIP. OS/2 broke on
4802 2384 Opterons when only checking NRIP. */
4803 if ( (pVM->hm.s.svm.u32Features & X86_CPUID_SVM_FEATURE_EDX_NRIP_SAVE)
4804 && pVM->cpum.ro.GuestFeatures.enmMicroarch >= kCpumMicroarch_AMD_15h_First)
4805 {
4806 AssertMsg(IoExitInfo.n.u3SEG == X86_SREG_DS || cbInstr > 1U + IoExitInfo.n.u1REP,
4807 ("u32Seg=%d cbInstr=%d u1REP=%d", IoExitInfo.n.u3SEG, cbInstr, IoExitInfo.n.u1REP));
4808 rcStrict = IEMExecStringIoWrite(pVCpu, cbValue, enmAddrMode, IoExitInfo.n.u1REP, (uint8_t)cbInstr,
4809 IoExitInfo.n.u3SEG, true /*fIoChecked*/);
4810 }
4811 else if (cbInstr == 1U + IoExitInfo.n.u1REP)
4812 rcStrict = IEMExecStringIoWrite(pVCpu, cbValue, enmAddrMode, IoExitInfo.n.u1REP, (uint8_t)cbInstr,
4813 X86_SREG_DS, true /*fIoChecked*/);
4814 else
4815 rcStrict = IEMExecOne(pVCpu);
4816 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOStringWrite);
4817 }
4818 else
4819 {
4820 AssertMsg(IoExitInfo.n.u3SEG == X86_SREG_ES /*=0*/, ("%#x\n", IoExitInfo.n.u3SEG));
4821 rcStrict = IEMExecStringIoRead(pVCpu, cbValue, enmAddrMode, IoExitInfo.n.u1REP, (uint8_t)cbInstr,
4822 true /*fIoChecked*/);
4823 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOStringRead);
4824 }
4825 }
4826 else
4827 {
4828 AssertMsgFailed(("rip=%RX64 nrip=%#RX64 cbInstr=%#RX64\n", pCtx->rip, pVmcb->ctrl.u64ExitInfo2, cbInstr));
4829 rcStrict = IEMExecOne(pVCpu);
4830 }
4831 }
4832 else
4833 {
4834 AssertMsgFailed(("IoExitInfo=%RX64\n", IoExitInfo.u));
4835 rcStrict = IEMExecOne(pVCpu);
4836 }
4837 fUpdateRipAlready = true;
4838
4839#else
4840 /* INS/OUTS - I/O String instruction. */
4841 PDISCPUSTATE pDis = &pVCpu->hm.s.DisState;
4842
4843 /** @todo Huh? why can't we use the segment prefix information given by AMD-V
4844 * in EXITINFO1? Investigate once this thing is up and running. */
4845
4846 rcStrict = EMInterpretDisasCurrent(pVM, pVCpu, pDis, NULL);
4847 if (rcStrict == VINF_SUCCESS)
4848 {
4849 if (IoExitInfo.n.u1Type == SVM_IOIO_WRITE)
4850 {
4851 rcStrict = IOMInterpretOUTSEx(pVM, pVCpu, CPUMCTX2CORE(pCtx), IoExitInfo.n.u16Port, pDis->fPrefix,
4852 (DISCPUMODE)pDis->uAddrMode, cbValue);
4853 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOStringWrite);
4854 }
4855 else
4856 {
4857 rcStrict = IOMInterpretINSEx(pVM, pVCpu, CPUMCTX2CORE(pCtx), IoExitInfo.n.u16Port, pDis->fPrefix,
4858 (DISCPUMODE)pDis->uAddrMode, cbValue);
4859 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOStringRead);
4860 }
4861 }
4862 else
4863 rcStrict = VINF_EM_RAW_EMULATE_INSTR;
4864#endif
4865 }
4866 else
4867 {
4868 /* IN/OUT - I/O instruction. */
4869 Assert(!IoExitInfo.n.u1REP);
4870
4871 if (IoExitInfo.n.u1Type == SVM_IOIO_WRITE)
4872 {
4873 rcStrict = IOMIOPortWrite(pVM, pVCpu, IoExitInfo.n.u16Port, pCtx->eax & uAndVal, cbValue);
4874 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIOWrite);
4875 }
4876 else
4877 {
4878 uint32_t u32Val = 0;
4879 rcStrict = IOMIOPortRead(pVM, pVCpu, IoExitInfo.n.u16Port, &u32Val, cbValue);
4880 if (IOM_SUCCESS(rcStrict))
4881 {
4882 /* Save result of I/O IN instr. in AL/AX/EAX. */
4883 /** @todo r=bird: 32-bit op size should clear high bits of rax! */
4884 pCtx->eax = (pCtx->eax & ~uAndVal) | (u32Val & uAndVal);
4885 }
4886 else if (rcStrict == VINF_IOM_R3_IOPORT_READ)
4887 HMR0SavePendingIOPortRead(pVCpu, pCtx->rip, pVmcb->ctrl.u64ExitInfo2, IoExitInfo.n.u16Port, uAndVal, cbValue);
4888
4889 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIORead);
4890 }
4891 }
4892
4893 if (IOM_SUCCESS(rcStrict))
4894 {
4895 /* AMD-V saves the RIP of the instruction following the IO instruction in EXITINFO2. */
4896 if (!fUpdateRipAlready)
4897 pCtx->rip = pVmcb->ctrl.u64ExitInfo2;
4898
4899 /*
4900 * If any I/O breakpoints are armed, we need to check if one triggered
4901 * and take appropriate action.
4902 * Note that the I/O breakpoint type is undefined if CR4.DE is 0.
4903 */
4904 /** @todo Optimize away the DBGFBpIsHwIoArmed call by having DBGF tell the
4905 * execution engines about whether hyper BPs and such are pending. */
4906 uint32_t const uDr7 = pCtx->dr[7];
4907 if (RT_UNLIKELY( ( (uDr7 & X86_DR7_ENABLED_MASK)
4908 && X86_DR7_ANY_RW_IO(uDr7)
4909 && (pCtx->cr4 & X86_CR4_DE))
4910 || DBGFBpIsHwIoArmed(pVM)))
4911 {
4912 /* We're playing with the host CPU state here, make sure we don't preempt or longjmp. */
4913 VMMRZCallRing3Disable(pVCpu);
4914 HM_DISABLE_PREEMPT();
4915
4916 STAM_COUNTER_INC(&pVCpu->hm.s.StatDRxIoCheck);
4917 CPUMR0DebugStateMaybeSaveGuest(pVCpu, false /*fDr6*/);
4918
4919 VBOXSTRICTRC rcStrict2 = DBGFBpCheckIo(pVM, pVCpu, pCtx, IoExitInfo.n.u16Port, cbValue);
4920 if (rcStrict2 == VINF_EM_RAW_GUEST_TRAP)
4921 {
4922 /* Raise #DB. */
4923 pVmcb->guest.u64DR6 = pCtx->dr[6];
4924 pVmcb->guest.u64DR7 = pCtx->dr[7];
4925 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DRX;
4926 hmR0SvmSetPendingXcptDB(pVCpu);
4927 }
4928 /* rcStrict is VINF_SUCCESS, VINF_IOM_R3_IOPORT_COMMIT_WRITE, or in [VINF_EM_FIRST..VINF_EM_LAST],
4929 however we can ditch VINF_IOM_R3_IOPORT_COMMIT_WRITE as it has VMCPU_FF_IOM as backup. */
4930 else if ( rcStrict2 != VINF_SUCCESS
4931 && (rcStrict == VINF_SUCCESS || rcStrict2 < rcStrict))
4932 rcStrict = rcStrict2;
4933 AssertCompile(VINF_EM_LAST < VINF_IOM_R3_IOPORT_COMMIT_WRITE);
4934
4935 HM_RESTORE_PREEMPT();
4936 VMMRZCallRing3Enable(pVCpu);
4937 }
4938
4939 HMSVM_CHECK_SINGLE_STEP(pVCpu, rcStrict);
4940 }
4941
4942#ifdef VBOX_STRICT
4943 if (rcStrict == VINF_IOM_R3_IOPORT_READ)
4944 Assert(IoExitInfo.n.u1Type == SVM_IOIO_READ);
4945 else if (rcStrict == VINF_IOM_R3_IOPORT_WRITE || rcStrict == VINF_IOM_R3_IOPORT_COMMIT_WRITE)
4946 Assert(IoExitInfo.n.u1Type == SVM_IOIO_WRITE);
4947 else
4948 {
4949 /** @todo r=bird: This is missing a bunch of VINF_EM_FIRST..VINF_EM_LAST
4950 * statuses, that the VMM device and some others may return. See
4951 * IOM_SUCCESS() for guidance. */
4952 AssertMsg( RT_FAILURE(rcStrict)
4953 || rcStrict == VINF_SUCCESS
4954 || rcStrict == VINF_EM_RAW_EMULATE_INSTR
4955 || rcStrict == VINF_EM_DBG_BREAKPOINT
4956 || rcStrict == VINF_EM_RAW_GUEST_TRAP
4957 || rcStrict == VINF_EM_RAW_TO_R3
4958 || rcStrict == VINF_TRPM_XCPT_DISPATCHED, ("%Rrc\n", VBOXSTRICTRC_VAL(rcStrict)));
4959 }
4960#endif
4961 return VBOXSTRICTRC_TODO(rcStrict);
4962}
4963
4964
4965/**
4966 * \#VMEXIT handler for Nested Page-faults (SVM_EXIT_NPF). Conditional \#VMEXIT.
4967 */
4968HMSVM_EXIT_DECL hmR0SvmExitNestedPF(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
4969{
4970 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
4971 PVM pVM = pVCpu->CTX_SUFF(pVM);
4972 Assert(pVM->hm.s.fNestedPaging);
4973
4974 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
4975
4976 /* See AMD spec. 15.25.6 "Nested versus Guest Page Faults, Fault Ordering" for VMCB details for #NPF. */
4977 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
4978 uint32_t u32ErrCode = pVmcb->ctrl.u64ExitInfo1;
4979 RTGCPHYS GCPhysFaultAddr = pVmcb->ctrl.u64ExitInfo2;
4980
4981 Log4(("#NPF at CS:RIP=%04x:%#RX64 faultaddr=%RGp errcode=%#x \n", pCtx->cs.Sel, pCtx->rip, GCPhysFaultAddr, u32ErrCode));
4982
4983#ifdef VBOX_HM_WITH_GUEST_PATCHING
4984 /* TPR patching for 32-bit guests, using the reserved bit in the page tables for MMIO regions. */
4985 if ( pVM->hm.s.fTprPatchingAllowed
4986 && (GCPhysFaultAddr & PAGE_OFFSET_MASK) == XAPIC_OFF_TPR
4987 && ( !(u32ErrCode & X86_TRAP_PF_P) /* Not present */
4988 || (u32ErrCode & (X86_TRAP_PF_P | X86_TRAP_PF_RSVD)) == (X86_TRAP_PF_P | X86_TRAP_PF_RSVD)) /* MMIO page. */
4989 && !CPUMIsGuestInLongModeEx(pCtx)
4990 && !CPUMGetGuestCPL(pVCpu)
4991 && pVM->hm.s.cPatches < RT_ELEMENTS(pVM->hm.s.aPatches))
4992 {
4993 RTGCPHYS GCPhysApicBase = APICGetBaseMsrNoCheck(pVCpu);
4994 GCPhysApicBase &= PAGE_BASE_GC_MASK;
4995
4996 if (GCPhysFaultAddr == GCPhysApicBase + XAPIC_OFF_TPR)
4997 {
4998 /* Only attempt to patch the instruction once. */
4999 PHMTPRPATCH pPatch = (PHMTPRPATCH)RTAvloU32Get(&pVM->hm.s.PatchTree, (AVLOU32KEY)pCtx->eip);
5000 if (!pPatch)
5001 return VINF_EM_HM_PATCH_TPR_INSTR;
5002 }
5003 }
5004#endif
5005
5006 /*
5007 * Determine the nested paging mode.
5008 */
5009 PGMMODE enmNestedPagingMode;
5010#if HC_ARCH_BITS == 32
5011 if (CPUMIsGuestInLongModeEx(pCtx))
5012 enmNestedPagingMode = PGMMODE_AMD64_NX;
5013 else
5014#endif
5015 enmNestedPagingMode = PGMGetHostMode(pVM);
5016
5017 /*
5018 * MMIO optimization using the reserved (RSVD) bit in the guest page tables for MMIO pages.
5019 */
5020 int rc;
5021 Assert((u32ErrCode & (X86_TRAP_PF_RSVD | X86_TRAP_PF_P)) != X86_TRAP_PF_RSVD);
5022 if ((u32ErrCode & (X86_TRAP_PF_RSVD | X86_TRAP_PF_P)) == (X86_TRAP_PF_RSVD | X86_TRAP_PF_P))
5023 {
5024 /* If event delivery causes an MMIO #NPF, go back to instruction emulation as
5025 otherwise injecting the original pending event would most likely cause the same MMIO #NPF. */
5026 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending))
5027 return VERR_EM_INTERPRETER;
5028
5029 VBOXSTRICTRC rc2 = PGMR0Trap0eHandlerNPMisconfig(pVM, pVCpu, enmNestedPagingMode, CPUMCTX2CORE(pCtx), GCPhysFaultAddr,
5030 u32ErrCode);
5031 rc = VBOXSTRICTRC_VAL(rc2);
5032
5033 /*
5034 * If we succeed, resume guest execution.
5035 * If we fail in interpreting the instruction because we couldn't get the guest physical address
5036 * of the page containing the instruction via the guest's page tables (we would invalidate the guest page
5037 * in the host TLB), resume execution which would cause a guest page fault to let the guest handle this
5038 * weird case. See @bugref{6043}.
5039 */
5040 if ( rc == VINF_SUCCESS
5041 || rc == VERR_PAGE_TABLE_NOT_PRESENT
5042 || rc == VERR_PAGE_NOT_PRESENT)
5043 {
5044 /* Successfully handled MMIO operation. */
5045 HMCPU_CF_SET(pVCpu, HM_CHANGED_SVM_GUEST_APIC_STATE);
5046 rc = VINF_SUCCESS;
5047 }
5048 return rc;
5049 }
5050
5051 TRPMAssertXcptPF(pVCpu, GCPhysFaultAddr, u32ErrCode);
5052 rc = PGMR0Trap0eHandlerNestedPaging(pVM, pVCpu, enmNestedPagingMode, u32ErrCode, CPUMCTX2CORE(pCtx), GCPhysFaultAddr);
5053 TRPMResetTrap(pVCpu);
5054
5055 Log4(("#NPF: PGMR0Trap0eHandlerNestedPaging returned %Rrc CS:RIP=%04x:%#RX64\n", rc, pCtx->cs.Sel, pCtx->rip));
5056
5057 /*
5058 * Same case as PGMR0Trap0eHandlerNPMisconfig(). See comment above, @bugref{6043}.
5059 */
5060 if ( rc == VINF_SUCCESS
5061 || rc == VERR_PAGE_TABLE_NOT_PRESENT
5062 || rc == VERR_PAGE_NOT_PRESENT)
5063 {
5064 /* We've successfully synced our shadow page tables. */
5065 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowPF);
5066 rc = VINF_SUCCESS;
5067 }
5068
5069 return rc;
5070}
5071
5072
5073/**
5074 * \#VMEXIT handler for virtual interrupt (SVM_EXIT_VINTR). Conditional
5075 * \#VMEXIT.
5076 */
5077HMSVM_EXIT_DECL hmR0SvmExitVIntr(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5078{
5079 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5080
5081 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
5082 pVmcb->ctrl.IntCtrl.n.u1VIrqPending = 0; /* No virtual interrupts pending, we'll inject the current one/NMI before reentry. */
5083 pVmcb->ctrl.IntCtrl.n.u8VIntrVector = 0;
5084
5085 /* Indicate that we no longer need to #VMEXIT when the guest is ready to receive interrupts/NMIs, it is now ready. */
5086 pVmcb->ctrl.u64InterceptCtrl &= ~SVM_CTRL_INTERCEPT_VINTR;
5087 pVmcb->ctrl.u64VmcbCleanBits &= ~(HMSVM_VMCB_CLEAN_INTERCEPTS | HMSVM_VMCB_CLEAN_TPR);
5088
5089 /* Deliver the pending interrupt/NMI via hmR0SvmEvaluatePendingEvent() and resume guest execution. */
5090 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitIntWindow);
5091 return VINF_SUCCESS;
5092}
5093
5094
5095/**
5096 * \#VMEXIT handler for task switches (SVM_EXIT_TASK_SWITCH). Conditional
5097 * \#VMEXIT.
5098 */
5099HMSVM_EXIT_DECL hmR0SvmExitTaskSwitch(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5100{
5101 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5102
5103 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
5104
5105#ifndef HMSVM_ALWAYS_TRAP_TASK_SWITCH
5106 Assert(!pVCpu->CTX_SUFF(pVM)->hm.s.fNestedPaging);
5107#endif
5108
5109 /* Check if this task-switch occurred while delivering an event through the guest IDT. */
5110 if (pVCpu->hm.s.Event.fPending) /* Can happen with exceptions/NMI. See @bugref{8411}. */
5111 {
5112 /*
5113 * AMD-V provides us with the exception which caused the TS; we collect
5114 * the information in the call to hmR0SvmCheckExitDueToEventDelivery.
5115 */
5116 Log4(("hmR0SvmExitTaskSwitch: TS occurred during event delivery.\n"));
5117 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitTaskSwitch);
5118 return VINF_EM_RAW_INJECT_TRPM_EVENT;
5119 }
5120
5121 /** @todo Emulate task switch someday, currently just going back to ring-3 for
5122 * emulation. */
5123 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitTaskSwitch);
5124 return VERR_EM_INTERPRETER;
5125}
5126
5127
5128/**
5129 * \#VMEXIT handler for VMMCALL (SVM_EXIT_VMMCALL). Conditional \#VMEXIT.
5130 */
5131HMSVM_EXIT_DECL hmR0SvmExitVmmCall(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5132{
5133 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5134 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitVmcall);
5135
5136 bool fRipUpdated;
5137 VBOXSTRICTRC rcStrict = HMSvmVmmcall(pVCpu, pCtx, &fRipUpdated);
5138 if (RT_SUCCESS(rcStrict))
5139 {
5140 if (!fRipUpdated)
5141 hmR0SvmAdvanceRipHwAssist(pVCpu, pCtx, 3 /* cbInstr */);
5142
5143 /* If the hypercall or TPR patching changes anything other than guest's general-purpose registers,
5144 we would need to reload the guest changed bits here before VM-entry. */
5145 return VBOXSTRICTRC_VAL(rcStrict);
5146 }
5147
5148 hmR0SvmSetPendingXcptUD(pVCpu);
5149 return VINF_SUCCESS;
5150}
5151
5152
5153/**
5154 * \#VMEXIT handler for VMMCALL (SVM_EXIT_VMMCALL). Conditional \#VMEXIT.
5155 */
5156HMSVM_EXIT_DECL hmR0SvmExitPause(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5157{
5158 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5159 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitPause);
5160 return VINF_EM_RAW_INTERRUPT;
5161}
5162
5163
5164/**
5165 * \#VMEXIT handler for IRET (SVM_EXIT_IRET). Conditional \#VMEXIT.
5166 */
5167HMSVM_EXIT_DECL hmR0SvmExitIret(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5168{
5169 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5170
5171 /* Clear NMI blocking. */
5172 VMCPU_FF_CLEAR(pVCpu, VMCPU_FF_BLOCK_NMIS);
5173
5174 /* Indicate that we no longer need to #VMEXIT when the guest is ready to receive NMIs, it is now ready. */
5175 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
5176 hmR0SvmClearIretIntercept(pVmcb);
5177
5178 /* Deliver the pending NMI via hmR0SvmEvaluatePendingEvent() and resume guest execution. */
5179 return VINF_SUCCESS;
5180}
5181
5182
5183/**
5184 * \#VMEXIT handler for page-fault exceptions (SVM_EXIT_EXCEPTION_14).
5185 * Conditional \#VMEXIT.
5186 */
5187HMSVM_EXIT_DECL hmR0SvmExitXcptPF(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5188{
5189 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5190
5191 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
5192
5193 /* See AMD spec. 15.12.15 "#PF (Page Fault)". */
5194 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
5195 uint32_t u32ErrCode = pVmcb->ctrl.u64ExitInfo1;
5196 RTGCUINTPTR uFaultAddress = pVmcb->ctrl.u64ExitInfo2;
5197 PVM pVM = pVCpu->CTX_SUFF(pVM);
5198
5199#if defined(HMSVM_ALWAYS_TRAP_ALL_XCPTS) || defined(HMSVM_ALWAYS_TRAP_PF)
5200 if (pVM->hm.s.fNestedPaging)
5201 {
5202 pVCpu->hm.s.Event.fPending = false; /* In case it's a contributory or vectoring #PF. */
5203 if (!pSvmTransient->fVectoringDoublePF)
5204 {
5205 /* A genuine guest #PF, reflect it to the guest. */
5206 hmR0SvmSetPendingXcptPF(pVCpu, pCtx, u32ErrCode, uFaultAddress);
5207 Log4(("#PF: Guest page fault at %04X:%RGv FaultAddr=%RGv ErrCode=%#x\n", pCtx->cs.Sel, (RTGCPTR)pCtx->rip,
5208 uFaultAddress, u32ErrCode));
5209 }
5210 else
5211 {
5212 /* A guest page-fault occurred during delivery of a page-fault. Inject #DF. */
5213 hmR0SvmSetPendingXcptDF(pVCpu);
5214 Log4(("Pending #DF due to vectoring #PF. NP\n"));
5215 }
5216 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestPF);
5217 return VINF_SUCCESS;
5218 }
5219#endif
5220
5221 Assert(!pVM->hm.s.fNestedPaging);
5222
5223#ifdef VBOX_HM_WITH_GUEST_PATCHING
5224 /* Shortcut for APIC TPR reads and writes; only applicable to 32-bit guests. */
5225 if ( pVM->hm.s.fTprPatchingAllowed
5226 && (uFaultAddress & 0xfff) == XAPIC_OFF_TPR
5227 && !(u32ErrCode & X86_TRAP_PF_P) /* Not present. */
5228 && !CPUMIsGuestInLongModeEx(pCtx)
5229 && !CPUMGetGuestCPL(pVCpu)
5230 && pVM->hm.s.cPatches < RT_ELEMENTS(pVM->hm.s.aPatches))
5231 {
5232 RTGCPHYS GCPhysApicBase;
5233 GCPhysApicBase = APICGetBaseMsrNoCheck(pVCpu);
5234 GCPhysApicBase &= PAGE_BASE_GC_MASK;
5235
5236 /* Check if the page at the fault-address is the APIC base. */
5237 RTGCPHYS GCPhysPage;
5238 int rc2 = PGMGstGetPage(pVCpu, (RTGCPTR)uFaultAddress, NULL /* pfFlags */, &GCPhysPage);
5239 if ( rc2 == VINF_SUCCESS
5240 && GCPhysPage == GCPhysApicBase)
5241 {
5242 /* Only attempt to patch the instruction once. */
5243 PHMTPRPATCH pPatch = (PHMTPRPATCH)RTAvloU32Get(&pVM->hm.s.PatchTree, (AVLOU32KEY)pCtx->eip);
5244 if (!pPatch)
5245 return VINF_EM_HM_PATCH_TPR_INSTR;
5246 }
5247 }
5248#endif
5249
5250 Log4(("#PF: uFaultAddress=%#RX64 CS:RIP=%#04x:%#RX64 u32ErrCode %#RX32 cr3=%#RX64\n", uFaultAddress, pCtx->cs.Sel,
5251 pCtx->rip, u32ErrCode, pCtx->cr3));
5252
5253 /* If it's a vectoring #PF, emulate injecting the original event injection as PGMTrap0eHandler() is incapable
5254 of differentiating between instruction emulation and event injection that caused a #PF. See @bugref{6607}. */
5255 if (pSvmTransient->fVectoringPF)
5256 {
5257 Assert(pVCpu->hm.s.Event.fPending);
5258 return VINF_EM_RAW_INJECT_TRPM_EVENT;
5259 }
5260
5261 TRPMAssertXcptPF(pVCpu, uFaultAddress, u32ErrCode);
5262 int rc = PGMTrap0eHandler(pVCpu, u32ErrCode, CPUMCTX2CORE(pCtx), (RTGCPTR)uFaultAddress);
5263
5264 Log4(("#PF rc=%Rrc\n", rc));
5265
5266 if (rc == VINF_SUCCESS)
5267 {
5268 /* Successfully synced shadow pages tables or emulated an MMIO instruction. */
5269 TRPMResetTrap(pVCpu);
5270 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowPF);
5271 HMCPU_CF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
5272 return rc;
5273 }
5274 else if (rc == VINF_EM_RAW_GUEST_TRAP)
5275 {
5276 pVCpu->hm.s.Event.fPending = false; /* In case it's a contributory or vectoring #PF. */
5277
5278 if (!pSvmTransient->fVectoringDoublePF)
5279 {
5280 /* It's a guest page fault and needs to be reflected to the guest. */
5281 u32ErrCode = TRPMGetErrorCode(pVCpu); /* The error code might have been changed. */
5282 TRPMResetTrap(pVCpu);
5283 hmR0SvmSetPendingXcptPF(pVCpu, pCtx, u32ErrCode, uFaultAddress);
5284 }
5285 else
5286 {
5287 /* A guest page-fault occurred during delivery of a page-fault. Inject #DF. */
5288 TRPMResetTrap(pVCpu);
5289 hmR0SvmSetPendingXcptDF(pVCpu);
5290 Log4(("#PF: Pending #DF due to vectoring #PF\n"));
5291 }
5292
5293 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestPF);
5294 return VINF_SUCCESS;
5295 }
5296
5297 TRPMResetTrap(pVCpu);
5298 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowPFEM);
5299 return rc;
5300}
5301
5302
5303/**
5304 * \#VMEXIT handler for device-not-available exceptions (SVM_EXIT_EXCEPTION_7).
5305 * Conditional \#VMEXIT.
5306 */
5307HMSVM_EXIT_DECL hmR0SvmExitXcptNM(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5308{
5309 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5310
5311 /* Paranoia; Ensure we cannot be called as a result of event delivery. */
5312 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb; NOREF(pVmcb);
5313 Assert(!pVmcb->ctrl.ExitIntInfo.n.u1Valid);
5314
5315 /* We're playing with the host CPU state here, make sure we don't preempt or longjmp. */
5316 VMMRZCallRing3Disable(pVCpu);
5317 HM_DISABLE_PREEMPT();
5318
5319 int rc;
5320 /* If the guest FPU was active at the time of the #NM exit, then it's a guest fault. */
5321 if (pSvmTransient->fWasGuestFPUStateActive)
5322 {
5323 rc = VINF_EM_RAW_GUEST_TRAP;
5324 Assert(CPUMIsGuestFPUStateActive(pVCpu) || HMCPU_CF_IS_PENDING(pVCpu, HM_CHANGED_GUEST_CR0));
5325 }
5326 else
5327 {
5328#ifndef HMSVM_ALWAYS_TRAP_ALL_XCPTS
5329 Assert(!pSvmTransient->fWasGuestFPUStateActive);
5330#endif
5331 rc = CPUMR0Trap07Handler(pVCpu->CTX_SUFF(pVM), pVCpu); /* (No need to set HM_CHANGED_HOST_CONTEXT for SVM.) */
5332 Assert( rc == VINF_EM_RAW_GUEST_TRAP
5333 || ((rc == VINF_SUCCESS || rc == VINF_CPUM_HOST_CR0_MODIFIED) && CPUMIsGuestFPUStateActive(pVCpu)));
5334 }
5335
5336 HM_RESTORE_PREEMPT();
5337 VMMRZCallRing3Enable(pVCpu);
5338
5339 if (rc == VINF_SUCCESS || rc == VINF_CPUM_HOST_CR0_MODIFIED)
5340 {
5341 /* Guest FPU state was activated, we'll want to change CR0 FPU intercepts before the next VM-reentry. */
5342 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_CR0);
5343 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitShadowNM);
5344 pVCpu->hm.s.fPreloadGuestFpu = true;
5345 }
5346 else
5347 {
5348 /* Forward #NM to the guest. */
5349 Assert(rc == VINF_EM_RAW_GUEST_TRAP);
5350 hmR0SvmSetPendingXcptNM(pVCpu);
5351 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestNM);
5352 }
5353 return VINF_SUCCESS;
5354}
5355
5356
5357/**
5358 * \#VMEXIT handler for undefined opcode (SVM_EXIT_EXCEPTION_6).
5359 * Conditional \#VMEXIT.
5360 */
5361HMSVM_EXIT_DECL hmR0SvmExitXcptUD(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5362{
5363 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5364
5365 /* Paranoia; Ensure we cannot be called as a result of event delivery. */
5366 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb; NOREF(pVmcb);
5367 Assert(!pVmcb->ctrl.ExitIntInfo.n.u1Valid);
5368
5369 int rc = VERR_SVM_UNEXPECTED_XCPT_EXIT;
5370 if (pVCpu->hm.s.fGIMTrapXcptUD)
5371 {
5372 uint8_t cbInstr = 0;
5373 VBOXSTRICTRC rcStrict = GIMXcptUD(pVCpu, pCtx, NULL /* pDis */, &cbInstr);
5374 if (rcStrict == VINF_SUCCESS)
5375 {
5376 /* #UD #VMEXIT does not have valid NRIP information, manually advance RIP. See @bugref{7270#c170}. */
5377 hmR0SvmAdvanceRipDumb(pVCpu, pCtx, cbInstr);
5378 rc = VINF_SUCCESS;
5379 HMSVM_CHECK_SINGLE_STEP(pVCpu, rc);
5380 }
5381 else if (rcStrict == VINF_GIM_HYPERCALL_CONTINUING)
5382 rc = VINF_SUCCESS;
5383 else if (rcStrict == VINF_GIM_R3_HYPERCALL)
5384 rc = VINF_GIM_R3_HYPERCALL;
5385 else
5386 Assert(RT_FAILURE(VBOXSTRICTRC_VAL(rcStrict)));
5387 }
5388
5389 /* If the GIM #UD exception handler didn't succeed for some reason or wasn't needed, raise #UD. */
5390 if (RT_FAILURE(rc))
5391 {
5392 hmR0SvmSetPendingXcptUD(pVCpu);
5393 rc = VINF_SUCCESS;
5394 }
5395
5396 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestUD);
5397 return rc;
5398}
5399
5400
5401/**
5402 * \#VMEXIT handler for math-fault exceptions (SVM_EXIT_EXCEPTION_16).
5403 * Conditional \#VMEXIT.
5404 */
5405HMSVM_EXIT_DECL hmR0SvmExitXcptMF(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5406{
5407 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5408
5409 /* Paranoia; Ensure we cannot be called as a result of event delivery. */
5410 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb; NOREF(pVmcb);
5411 Assert(!pVmcb->ctrl.ExitIntInfo.n.u1Valid);
5412
5413 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestMF);
5414
5415 if (!(pCtx->cr0 & X86_CR0_NE))
5416 {
5417 PVM pVM = pVCpu->CTX_SUFF(pVM);
5418 PDISSTATE pDis = &pVCpu->hm.s.DisState;
5419 unsigned cbOp;
5420 int rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, &cbOp);
5421 if (RT_SUCCESS(rc))
5422 {
5423 /* Convert a #MF into a FERR -> IRQ 13. See @bugref{6117}. */
5424 rc = PDMIsaSetIrq(pVCpu->CTX_SUFF(pVM), 13, 1, 0 /* uTagSrc */);
5425 if (RT_SUCCESS(rc))
5426 pCtx->rip += cbOp;
5427 }
5428 else
5429 Log4(("hmR0SvmExitXcptMF: EMInterpretDisasCurrent returned %Rrc uOpCode=%#x\n", rc, pDis->pCurInstr->uOpcode));
5430 return rc;
5431 }
5432
5433 hmR0SvmSetPendingXcptMF(pVCpu);
5434 return VINF_SUCCESS;
5435}
5436
5437
5438/**
5439 * \#VMEXIT handler for debug exceptions (SVM_EXIT_EXCEPTION_1). Conditional
5440 * \#VMEXIT.
5441 */
5442HMSVM_EXIT_DECL hmR0SvmExitXcptDB(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5443{
5444 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5445
5446 /* If this #DB is the result of delivering an event, go back to the interpreter. */
5447 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
5448 if (RT_UNLIKELY(pVCpu->hm.s.Event.fPending))
5449 {
5450 STAM_COUNTER_INC(&pVCpu->hm.s.StatInjectPendingInterpret);
5451 return VERR_EM_INTERPRETER;
5452 }
5453
5454 STAM_COUNTER_INC(&pVCpu->hm.s.StatExitGuestDB);
5455
5456 /* This can be a fault-type #DB (instruction breakpoint) or a trap-type #DB (data breakpoint). However, for both cases
5457 DR6 and DR7 are updated to what the exception handler expects. See AMD spec. 15.12.2 "#DB (Debug)". */
5458 PSVMVMCB pVmcb = (PSVMVMCB)pVCpu->hm.s.svm.pvVmcb;
5459 PVM pVM = pVCpu->CTX_SUFF(pVM);
5460 int rc = DBGFRZTrap01Handler(pVM, pVCpu, CPUMCTX2CORE(pCtx), pVmcb->guest.u64DR6, pVCpu->hm.s.fSingleInstruction);
5461 if (rc == VINF_EM_RAW_GUEST_TRAP)
5462 {
5463 Log5(("hmR0SvmExitXcptDB: DR6=%#RX64 -> guest trap\n", pVmcb->guest.u64DR6));
5464 if (CPUMIsHyperDebugStateActive(pVCpu))
5465 CPUMSetGuestDR6(pVCpu, CPUMGetGuestDR6(pVCpu) | pVmcb->guest.u64DR6);
5466
5467 /* Reflect the exception back to the guest. */
5468 hmR0SvmSetPendingXcptDB(pVCpu);
5469 rc = VINF_SUCCESS;
5470 }
5471
5472 /*
5473 * Update DR6.
5474 */
5475 if (CPUMIsHyperDebugStateActive(pVCpu))
5476 {
5477 Log5(("hmR0SvmExitXcptDB: DR6=%#RX64 -> %Rrc\n", pVmcb->guest.u64DR6, rc));
5478 pVmcb->guest.u64DR6 = X86_DR6_INIT_VAL;
5479 pVmcb->ctrl.u64VmcbCleanBits &= ~HMSVM_VMCB_CLEAN_DRX;
5480 }
5481 else
5482 {
5483 AssertMsg(rc == VINF_SUCCESS, ("rc=%Rrc\n", rc));
5484 Assert(!pVCpu->hm.s.fSingleInstruction && !DBGFIsStepping(pVCpu));
5485 }
5486
5487 return rc;
5488}
5489
5490
5491/**
5492 * \#VMEXIT handler for alignment check exceptions (SVM_EXIT_EXCEPTION_17).
5493 * Conditional \#VMEXIT.
5494 */
5495HMSVM_EXIT_DECL hmR0SvmExitXcptAC(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5496{
5497 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5498
5499 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
5500
5501 SVMEVENT Event;
5502 Event.u = 0;
5503 Event.n.u1Valid = 1;
5504 Event.n.u3Type = SVM_EVENT_EXCEPTION;
5505 Event.n.u8Vector = X86_XCPT_AC;
5506 Event.n.u1ErrorCodeValid = 1;
5507 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
5508 return VINF_SUCCESS;
5509}
5510
5511
5512/**
5513 * \#VMEXIT handler for breakpoint exceptions (SVM_EXIT_EXCEPTION_3).
5514 * Conditional \#VMEXIT.
5515 */
5516HMSVM_EXIT_DECL hmR0SvmExitXcptBP(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5517{
5518 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5519
5520 HMSVM_CHECK_EXIT_DUE_TO_EVENT_DELIVERY();
5521
5522 int rc = DBGFRZTrap03Handler(pVCpu->CTX_SUFF(pVM), pVCpu, CPUMCTX2CORE(pCtx));
5523 if (rc == VINF_EM_RAW_GUEST_TRAP)
5524 {
5525 SVMEVENT Event;
5526 Event.u = 0;
5527 Event.n.u1Valid = 1;
5528 Event.n.u3Type = SVM_EVENT_EXCEPTION;
5529 Event.n.u8Vector = X86_XCPT_BP;
5530 Event.n.u1ErrorCodeValid = 0;
5531 hmR0SvmSetPendingEvent(pVCpu, &Event, 0 /* GCPtrFaultAddress */);
5532 }
5533
5534 Assert(rc == VINF_SUCCESS || rc == VINF_EM_RAW_GUEST_TRAP || rc == VINF_EM_DBG_BREAKPOINT);
5535 return rc;
5536}
5537
5538
5539#ifdef VBOX_WITH_NESTED_HWVIRT
5540/**
5541 * \#VMEXIT handler for CLGI (SVM_EXIT_CLGI). Conditional \#VMEXIT.
5542 */
5543HMSVM_EXIT_DECL hmR0SvmExitClgi(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5544{
5545 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5546 /** @todo Stat. */
5547 /* STAM_COUNTER_INC(&pVCpu->hm.s.StatExitClgi); */
5548 uint8_t const cbInstr = hmR0SvmGetInstrLengthHwAssist(pVCpu, pCtx, 3);
5549 VBOXSTRICTRC rcStrict = IEMExecDecodedClgi(pVCpu, cbInstr);
5550 return VBOXSTRICTRC_VAL(rcStrict);
5551}
5552
5553
5554/**
5555 * \#VMEXIT handler for STGI (SVM_EXIT_STGI). Conditional \#VMEXIT.
5556 */
5557HMSVM_EXIT_DECL hmR0SvmExitStgi(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5558{
5559 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5560 /** @todo Stat. */
5561 /* STAM_COUNTER_INC(&pVCpu->hm.s.StatExitStgi); */
5562 uint8_t const cbInstr = hmR0SvmGetInstrLengthHwAssist(pVCpu, pCtx, 3);
5563 VBOXSTRICTRC rcStrict = IEMExecDecodedStgi(pVCpu, cbInstr);
5564 return VBOXSTRICTRC_VAL(rcStrict);
5565}
5566
5567
5568/**
5569 * \#VMEXIT handler for VMLOAD (SVM_EXIT_VMLOAD). Conditional \#VMEXIT.
5570 */
5571HMSVM_EXIT_DECL hmR0SvmExitVmload(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5572{
5573 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5574 /** @todo Stat. */
5575 /* STAM_COUNTER_INC(&pVCpu->hm.s.StatExitVmload); */
5576 uint8_t const cbInstr = hmR0SvmGetInstrLengthHwAssist(pVCpu, pCtx, 3);
5577 VBOXSTRICTRC rcStrict = IEMExecDecodedVmload(pVCpu, cbInstr);
5578 return VBOXSTRICTRC_VAL(rcStrict);
5579}
5580
5581
5582/**
5583 * \#VMEXIT handler for VMSAVE (SVM_EXIT_VMSAVE). Conditional \#VMEXIT.
5584 */
5585HMSVM_EXIT_DECL hmR0SvmExitVmsave(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5586{
5587 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5588 /** @todo Stat. */
5589 /* STAM_COUNTER_INC(&pVCpu->hm.s.StatExitVmsave); */
5590 uint8_t const cbInstr = hmR0SvmGetInstrLengthHwAssist(pVCpu, pCtx, 3);
5591 VBOXSTRICTRC rcStrict = IEMExecDecodedVmsave(pVCpu, cbInstr);
5592 return VBOXSTRICTRC_VAL(rcStrict);
5593}
5594
5595
5596/**
5597 * \#VMEXIT handler for INVLPGA (SVM_EXIT_INVLPGA). Conditional \#VMEXIT.
5598 */
5599HMSVM_EXIT_DECL hmR0SvmExitInvlpga(PVMCPU pVCpu, PCPUMCTX pCtx, PSVMTRANSIENT pSvmTransient)
5600{
5601 HMSVM_VALIDATE_EXIT_HANDLER_PARAMS();
5602 /** @todo Stat. */
5603 /* STAM_COUNTER_INC(&pVCpu->hm.s.StatExitInvlpga); */
5604 uint8_t const cbInstr = hmR0SvmGetInstrLengthHwAssist(pVCpu, pCtx, 3);
5605 VBOXSTRICTRC rcStrict = IEMExecDecodedInvlpga(pVCpu, cbInstr);
5606 return VBOXSTRICTRC_VAL(rcStrict);
5607}
5608#endif /* VBOX_WITH_NESTED_HWVIRT */
5609
5610
5611/** @} */
5612
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette