VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR3/HM.cpp@ 48565

Last change on this file since 48565 was 48565, checked in by vboxsync, 11 years ago

VMM/HM: Added total VM-exits STAM.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 138.2 KB
Line 
1/* $Id: HM.cpp 48565 2013-09-19 22:16:00Z vboxsync $ */
2/** @file
3 * HM - Intel/AMD VM Hardware Support Manager.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#define LOG_GROUP LOG_GROUP_HM
23#include <VBox/vmm/cpum.h>
24#include <VBox/vmm/stam.h>
25#include <VBox/vmm/mm.h>
26#include <VBox/vmm/pdmapi.h>
27#include <VBox/vmm/pgm.h>
28#include <VBox/vmm/ssm.h>
29#include <VBox/vmm/trpm.h>
30#include <VBox/vmm/dbgf.h>
31#include <VBox/vmm/iom.h>
32#include <VBox/vmm/patm.h>
33#include <VBox/vmm/csam.h>
34#include <VBox/vmm/selm.h>
35#ifdef VBOX_WITH_REM
36# include <VBox/vmm/rem.h>
37#endif
38#include <VBox/vmm/hm_vmx.h>
39#include <VBox/vmm/hm_svm.h>
40#include "HMInternal.h"
41#include <VBox/vmm/vm.h>
42#include <VBox/vmm/uvm.h>
43#include <VBox/err.h>
44#include <VBox/param.h>
45
46#include <iprt/assert.h>
47#include <VBox/log.h>
48#include <iprt/asm.h>
49#include <iprt/asm-amd64-x86.h>
50#include <iprt/string.h>
51#include <iprt/env.h>
52#include <iprt/thread.h>
53
54
55/*******************************************************************************
56* Global Variables *
57*******************************************************************************/
#ifdef VBOX_WITH_STATISTICS
/*
 * Builds one description string of the form "<symbol> - <number> - <text>".
 * The symbol and the number are only stringized, so the number is purely
 * informational: the slot an entry occupies is decided by its position in the
 * initializer list, not by the number written here.
 */
# define EXIT_REASON(def, val, str) #def " - " #val " - " str
/* Filler for table slots that have no description. */
# define EXIT_REASON_NIL() NULL
/** Exit reason descriptions for VT-x, used to describe statistics. */
static const char * const g_apszVTxExitReasons[MAX_EXITREASON_STAT] =
{
    EXIT_REASON(VMX_EXIT_XCPT_OR_NMI            ,  0, "Exception or non-maskable interrupt (NMI)."),
    EXIT_REASON(VMX_EXIT_EXT_INT                ,  1, "External interrupt."),
    EXIT_REASON(VMX_EXIT_TRIPLE_FAULT           ,  2, "Triple fault."),
    EXIT_REASON(VMX_EXIT_INIT_SIGNAL            ,  3, "INIT signal."),
    EXIT_REASON(VMX_EXIT_SIPI                   ,  4, "Start-up IPI (SIPI)."),
    EXIT_REASON(VMX_EXIT_IO_SMI_IRQ             ,  5, "I/O system-management interrupt (SMI)."),
    EXIT_REASON(VMX_EXIT_SMI_IRQ                ,  6, "Other SMI."),
    EXIT_REASON(VMX_EXIT_INT_WINDOW             ,  7, "Interrupt window."),
    EXIT_REASON_NIL(),                          /* slot 8 */
    EXIT_REASON(VMX_EXIT_TASK_SWITCH            ,  9, "Task switch."),
    EXIT_REASON(VMX_EXIT_CPUID                  , 10, "Guest attempted to execute CPUID."),
    EXIT_REASON_NIL(),                          /* slot 11 */
    EXIT_REASON(VMX_EXIT_HLT                    , 12, "Guest attempted to execute HLT."),
    EXIT_REASON(VMX_EXIT_INVD                   , 13, "Guest attempted to execute INVD."),
    EXIT_REASON(VMX_EXIT_INVLPG                 , 14, "Guest attempted to execute INVLPG."),
    EXIT_REASON(VMX_EXIT_RDPMC                  , 15, "Guest attempted to execute RDPMC."),
    EXIT_REASON(VMX_EXIT_RDTSC                  , 16, "Guest attempted to execute RDTSC."),
    EXIT_REASON(VMX_EXIT_RSM                    , 17, "Guest attempted to execute RSM in SMM."),
    EXIT_REASON(VMX_EXIT_VMCALL                 , 18, "Guest attempted to execute VMCALL."),
    EXIT_REASON(VMX_EXIT_VMCLEAR                , 19, "Guest attempted to execute VMCLEAR."),
    EXIT_REASON(VMX_EXIT_VMLAUNCH               , 20, "Guest attempted to execute VMLAUNCH."),
    EXIT_REASON(VMX_EXIT_VMPTRLD                , 21, "Guest attempted to execute VMPTRLD."),
    EXIT_REASON(VMX_EXIT_VMPTRST                , 22, "Guest attempted to execute VMPTRST."),
    EXIT_REASON(VMX_EXIT_VMREAD                 , 23, "Guest attempted to execute VMREAD."),
    EXIT_REASON(VMX_EXIT_VMRESUME               , 24, "Guest attempted to execute VMRESUME."),
    EXIT_REASON(VMX_EXIT_VMWRITE                , 25, "Guest attempted to execute VMWRITE."),
    EXIT_REASON(VMX_EXIT_VMXOFF                 , 26, "Guest attempted to execute VMXOFF."),
    EXIT_REASON(VMX_EXIT_VMXON                  , 27, "Guest attempted to execute VMXON."),
    EXIT_REASON(VMX_EXIT_MOV_CRX                , 28, "Control-register accesses."),
    EXIT_REASON(VMX_EXIT_MOV_DRX                , 29, "Debug-register accesses."),
    EXIT_REASON(VMX_EXIT_PORT_IO                , 30, "I/O instruction."),
    EXIT_REASON(VMX_EXIT_RDMSR                  , 31, "Guest attempted to execute RDMSR."),
    EXIT_REASON(VMX_EXIT_WRMSR                  , 32, "Guest attempted to execute WRMSR."),
    EXIT_REASON(VMX_EXIT_ERR_INVALID_GUEST_STATE, 33, "VM-entry failure due to invalid guest state."),
    EXIT_REASON(VMX_EXIT_ERR_MSR_LOAD           , 34, "VM-entry failure due to MSR loading."),
    EXIT_REASON_NIL(),                          /* slot 35 */
    EXIT_REASON(VMX_EXIT_MWAIT                  , 36, "Guest executed MWAIT."),
    EXIT_REASON(VMX_EXIT_MTF                    , 37, "Monitor Trap Flag."),
    EXIT_REASON_NIL(),                          /* slot 38 */
    EXIT_REASON(VMX_EXIT_MONITOR                , 39, "Guest attempted to execute MONITOR."),
    EXIT_REASON(VMX_EXIT_PAUSE                  , 40, "Guest attempted to execute PAUSE."),
    EXIT_REASON(VMX_EXIT_ERR_MACHINE_CHECK      , 41, "VM-entry failure due to machine-check."),
    EXIT_REASON_NIL(),                          /* slot 42 */
    EXIT_REASON(VMX_EXIT_TPR_BELOW_THRESHOLD    , 43, "TPR below threshold. Guest attempted to execute MOV to CR8."),
    EXIT_REASON(VMX_EXIT_APIC_ACCESS            , 44, "APIC access. Guest attempted to access memory at a physical address on the APIC-access page."),
    EXIT_REASON_NIL(),                          /* slot 45 */
    EXIT_REASON(VMX_EXIT_XDTR_ACCESS            , 46, "Access to GDTR or IDTR. Guest attempted to execute LGDT, LIDT, SGDT, or SIDT."),
    EXIT_REASON(VMX_EXIT_TR_ACCESS              , 47, "Access to LDTR or TR. Guest attempted to execute LLDT, LTR, SLDT, or STR."),
    EXIT_REASON(VMX_EXIT_EPT_VIOLATION          , 48, "EPT violation. An attempt to access memory with a guest-physical address was disallowed by the configuration of the EPT paging structures."),
    EXIT_REASON(VMX_EXIT_EPT_MISCONFIG          , 49, "EPT misconfiguration. An attempt to access memory with a guest-physical address encountered a misconfigured EPT paging-structure entry."),
    EXIT_REASON(VMX_EXIT_INVEPT                 , 50, "Guest attempted to execute INVEPT."),
    EXIT_REASON(VMX_EXIT_RDTSCP                 , 51, "Guest attempted to execute RDTSCP."),
    EXIT_REASON(VMX_EXIT_PREEMPT_TIMER          , 52, "VMX-preemption timer expired."),
    EXIT_REASON(VMX_EXIT_INVVPID                , 53, "Guest attempted to execute INVVPID."),
    EXIT_REASON(VMX_EXIT_WBINVD                 , 54, "Guest attempted to execute WBINVD."),
    EXIT_REASON(VMX_EXIT_XSETBV                 , 55, "Guest attempted to execute XSETBV."),
    EXIT_REASON_NIL(),                          /* slot 56 */
    EXIT_REASON(VMX_EXIT_RDRAND                 , 57, "Guest attempted to execute RDRAND."),
    EXIT_REASON(VMX_EXIT_INVPCID                , 58, "Guest attempted to execute INVPCID."),
    EXIT_REASON(VMX_EXIT_VMFUNC                 , 59, "Guest attempted to execute VMFUNC.")
};
/** Exit reason descriptions for AMD-V, used to describe statistics. */
static const char * const g_apszAmdVExitReasons[MAX_EXITREASON_STAT] =
{
    EXIT_REASON(SVM_EXIT_READ_CR0       ,   0, "Read CR0."),
    EXIT_REASON(SVM_EXIT_READ_CR1       ,   1, "Read CR1."),
    EXIT_REASON(SVM_EXIT_READ_CR2       ,   2, "Read CR2."),
    EXIT_REASON(SVM_EXIT_READ_CR3       ,   3, "Read CR3."),
    EXIT_REASON(SVM_EXIT_READ_CR4       ,   4, "Read CR4."),
    EXIT_REASON(SVM_EXIT_READ_CR5       ,   5, "Read CR5."),
    EXIT_REASON(SVM_EXIT_READ_CR6       ,   6, "Read CR6."),
    EXIT_REASON(SVM_EXIT_READ_CR7       ,   7, "Read CR7."),
    EXIT_REASON(SVM_EXIT_READ_CR8       ,   8, "Read CR8."),
    EXIT_REASON(SVM_EXIT_READ_CR9       ,   9, "Read CR9."),
    EXIT_REASON(SVM_EXIT_READ_CR10      ,  10, "Read CR10."),
    EXIT_REASON(SVM_EXIT_READ_CR11      ,  11, "Read CR11."),
    EXIT_REASON(SVM_EXIT_READ_CR12      ,  12, "Read CR12."),
    EXIT_REASON(SVM_EXIT_READ_CR13      ,  13, "Read CR13."),
    EXIT_REASON(SVM_EXIT_READ_CR14      ,  14, "Read CR14."),
    EXIT_REASON(SVM_EXIT_READ_CR15      ,  15, "Read CR15."),
    EXIT_REASON(SVM_EXIT_WRITE_CR0      ,  16, "Write CR0."),
    EXIT_REASON(SVM_EXIT_WRITE_CR1      ,  17, "Write CR1."),
    EXIT_REASON(SVM_EXIT_WRITE_CR2      ,  18, "Write CR2."),
    EXIT_REASON(SVM_EXIT_WRITE_CR3      ,  19, "Write CR3."),
    EXIT_REASON(SVM_EXIT_WRITE_CR4      ,  20, "Write CR4."),
    EXIT_REASON(SVM_EXIT_WRITE_CR5      ,  21, "Write CR5."),
    EXIT_REASON(SVM_EXIT_WRITE_CR6      ,  22, "Write CR6."),
    EXIT_REASON(SVM_EXIT_WRITE_CR7      ,  23, "Write CR7."),
    EXIT_REASON(SVM_EXIT_WRITE_CR8      ,  24, "Write CR8."),
    EXIT_REASON(SVM_EXIT_WRITE_CR9      ,  25, "Write CR9."),
    EXIT_REASON(SVM_EXIT_WRITE_CR10     ,  26, "Write CR10."),
    EXIT_REASON(SVM_EXIT_WRITE_CR11     ,  27, "Write CR11."),
    EXIT_REASON(SVM_EXIT_WRITE_CR12     ,  28, "Write CR12."),
    EXIT_REASON(SVM_EXIT_WRITE_CR13     ,  29, "Write CR13."),
    EXIT_REASON(SVM_EXIT_WRITE_CR14     ,  30, "Write CR14."),
    EXIT_REASON(SVM_EXIT_WRITE_CR15     ,  31, "Write CR15."),
    EXIT_REASON(SVM_EXIT_READ_DR0       ,  32, "Read DR0."),
    EXIT_REASON(SVM_EXIT_READ_DR1       ,  33, "Read DR1."),
    EXIT_REASON(SVM_EXIT_READ_DR2       ,  34, "Read DR2."),
    EXIT_REASON(SVM_EXIT_READ_DR3       ,  35, "Read DR3."),
    EXIT_REASON(SVM_EXIT_READ_DR4       ,  36, "Read DR4."),
    EXIT_REASON(SVM_EXIT_READ_DR5       ,  37, "Read DR5."),
    EXIT_REASON(SVM_EXIT_READ_DR6       ,  38, "Read DR6."),
    EXIT_REASON(SVM_EXIT_READ_DR7       ,  39, "Read DR7."),
    EXIT_REASON(SVM_EXIT_READ_DR8       ,  40, "Read DR8."),
    EXIT_REASON(SVM_EXIT_READ_DR9       ,  41, "Read DR9."),
    EXIT_REASON(SVM_EXIT_READ_DR10      ,  42, "Read DR10."),
    EXIT_REASON(SVM_EXIT_READ_DR11      ,  43, "Read DR11"),
    EXIT_REASON(SVM_EXIT_READ_DR12      ,  44, "Read DR12."),
    EXIT_REASON(SVM_EXIT_READ_DR13      ,  45, "Read DR13."),
    EXIT_REASON(SVM_EXIT_READ_DR14      ,  46, "Read DR14."),
    EXIT_REASON(SVM_EXIT_READ_DR15      ,  47, "Read DR15."),
    EXIT_REASON(SVM_EXIT_WRITE_DR0      ,  48, "Write DR0."),
    EXIT_REASON(SVM_EXIT_WRITE_DR1      ,  49, "Write DR1."),
    EXIT_REASON(SVM_EXIT_WRITE_DR2      ,  50, "Write DR2."),
    EXIT_REASON(SVM_EXIT_WRITE_DR3      ,  51, "Write DR3."),
    EXIT_REASON(SVM_EXIT_WRITE_DR4      ,  52, "Write DR4."),
    EXIT_REASON(SVM_EXIT_WRITE_DR5      ,  53, "Write DR5."),
    EXIT_REASON(SVM_EXIT_WRITE_DR6      ,  54, "Write DR6."),
    EXIT_REASON(SVM_EXIT_WRITE_DR7      ,  55, "Write DR7."),
    EXIT_REASON(SVM_EXIT_WRITE_DR8      ,  56, "Write DR8."),
    EXIT_REASON(SVM_EXIT_WRITE_DR9      ,  57, "Write DR9."),
    EXIT_REASON(SVM_EXIT_WRITE_DR10     ,  58, "Write DR10."),
    EXIT_REASON(SVM_EXIT_WRITE_DR11     ,  59, "Write DR11."),
    EXIT_REASON(SVM_EXIT_WRITE_DR12     ,  60, "Write DR12."),
    EXIT_REASON(SVM_EXIT_WRITE_DR13     ,  61, "Write DR13."),
    EXIT_REASON(SVM_EXIT_WRITE_DR14     ,  62, "Write DR14."),
    EXIT_REASON(SVM_EXIT_WRITE_DR15     ,  63, "Write DR15."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_0    ,  64, "Exception Vector 0 (#DE)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1    ,  65, "Exception Vector 1 (#DB)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_2    ,  66, "Exception Vector 2 (#NMI)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_3    ,  67, "Exception Vector 3 (#BP)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_4    ,  68, "Exception Vector 4 (#OF)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_5    ,  69, "Exception Vector 5 (#BR)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_6    ,  70, "Exception Vector 6 (#UD)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_7    ,  71, "Exception Vector 7 (#NM)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_8    ,  72, "Exception Vector 8 (#DF)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_9    ,  73, "Exception Vector 9 (#CO_SEG_OVERRUN)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_A    ,  74, "Exception Vector 10 (#TS)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_B    ,  75, "Exception Vector 11 (#NP)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_C    ,  76, "Exception Vector 12 (#SS)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_D    ,  77, "Exception Vector 13 (#GP)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_E    ,  78, "Exception Vector 14 (#PF)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_F    ,  79, "Exception Vector 15 (0x0f)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_10   ,  80, "Exception Vector 16 (#MF)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_11   ,  81, "Exception Vector 17 (#AC)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_12   ,  82, "Exception Vector 18 (#MC)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_13   ,  83, "Exception Vector 19 (#XF)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_14   ,  84, "Exception Vector 20 (0x14)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_15   ,  85, "Exception Vector 21 (0x15)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_16   ,  86, "Exception Vector 22 (0x16)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_17   ,  87, "Exception Vector 23 (0x17)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_18   ,  88, "Exception Vector 24 (0x18)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_19   ,  89, "Exception Vector 25 (0x19)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1A   ,  90, "Exception Vector 26 (0x1A)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1B   ,  91, "Exception Vector 27 (0x1B)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1C   ,  92, "Exception Vector 28 (0x1C)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1D   ,  93, "Exception Vector 29 (0x1D)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1E   ,  94, "Exception Vector 30 (0x1E)."),
    EXIT_REASON(SVM_EXIT_EXCEPTION_1F   ,  95, "Exception Vector 31 (0x1F)."),
    EXIT_REASON(SVM_EXIT_INTR           ,  96, "Physical maskable interrupt (host)."),
    EXIT_REASON(SVM_EXIT_NMI            ,  97, "Physical non-maskable interrupt (host)."),
    EXIT_REASON(SVM_EXIT_SMI            ,  98, "System management interrupt (host)."),
    EXIT_REASON(SVM_EXIT_INIT           ,  99, "Physical INIT signal (host)."),
    EXIT_REASON(SVM_EXIT_VINTR          , 100, "Virtual interrupt-window exit."),
    EXIT_REASON(SVM_EXIT_CR0_SEL_WRITE  , 101, "Write to CR0 that changed any bits other than CR0.TS or CR0.MP."),
    EXIT_REASON(SVM_EXIT_IDTR_READ      , 102, "Read IDTR"),
    EXIT_REASON(SVM_EXIT_GDTR_READ      , 103, "Read GDTR"),
    EXIT_REASON(SVM_EXIT_LDTR_READ      , 104, "Read LDTR."),
    EXIT_REASON(SVM_EXIT_TR_READ        , 105, "Read TR."),
    /* The four descriptor-table write intercepts each carry their own symbol. */
    EXIT_REASON(SVM_EXIT_IDTR_WRITE     , 106, "Write IDTR."),
    EXIT_REASON(SVM_EXIT_GDTR_WRITE     , 107, "Write GDTR."),
    EXIT_REASON(SVM_EXIT_LDTR_WRITE     , 108, "Write LDTR."),
    EXIT_REASON(SVM_EXIT_TR_WRITE       , 109, "Write TR."),
    EXIT_REASON(SVM_EXIT_RDTSC          , 110, "RDTSC instruction."),
    EXIT_REASON(SVM_EXIT_RDPMC          , 111, "RDPMC instruction."),
    EXIT_REASON(SVM_EXIT_PUSHF          , 112, "PUSHF instruction."),
    EXIT_REASON(SVM_EXIT_POPF           , 113, "POPF instruction."),
    EXIT_REASON(SVM_EXIT_CPUID          , 114, "CPUID instruction."),
    EXIT_REASON(SVM_EXIT_RSM            , 115, "RSM instruction."),
    EXIT_REASON(SVM_EXIT_IRET           , 116, "IRET instruction."),
    EXIT_REASON(SVM_EXIT_SWINT          , 117, "Software interrupt (INTn instructions)."),
    EXIT_REASON(SVM_EXIT_INVD           , 118, "INVD instruction."),
    EXIT_REASON(SVM_EXIT_PAUSE          , 119, "PAUSE instruction."),
    EXIT_REASON(SVM_EXIT_HLT            , 120, "HLT instruction."),
    EXIT_REASON(SVM_EXIT_INVLPG         , 121, "INVLPG instruction."),
    EXIT_REASON(SVM_EXIT_INVLPGA        , 122, "INVLPGA instruction."),
    EXIT_REASON(SVM_EXIT_IOIO           , 123, "IN/OUT accessing protected port."),
    EXIT_REASON(SVM_EXIT_MSR            , 124, "RDMSR or WRMSR access to protected MSR."),
    EXIT_REASON(SVM_EXIT_TASK_SWITCH    , 125, "Task switch."),
    EXIT_REASON(SVM_EXIT_FERR_FREEZE    , 126, "Legacy FPU handling enabled; processor is frozen in an x87/mmx instruction waiting for an interrupt"),
    EXIT_REASON(SVM_EXIT_SHUTDOWN       , 127, "Shutdown."),
    EXIT_REASON(SVM_EXIT_VMRUN          , 128, "VMRUN instruction."),
    EXIT_REASON(SVM_EXIT_VMMCALL        , 129, "VMMCALL instruction."),
    EXIT_REASON(SVM_EXIT_VMLOAD         , 130, "VMLOAD instruction."),
    EXIT_REASON(SVM_EXIT_VMSAVE         , 131, "VMSAVE instruction."),
    EXIT_REASON(SVM_EXIT_STGI           , 132, "STGI instruction."),
    EXIT_REASON(SVM_EXIT_CLGI           , 133, "CLGI instruction."),
    EXIT_REASON(SVM_EXIT_SKINIT         , 134, "SKINIT instruction."),
    EXIT_REASON(SVM_EXIT_RDTSCP         , 135, "RDTSCP instruction."),
    EXIT_REASON(SVM_EXIT_ICEBP          , 136, "ICEBP instruction."),
    EXIT_REASON(SVM_EXIT_WBINVD         , 137, "WBINVD instruction."),
    EXIT_REASON(SVM_EXIT_MONITOR        , 138, "MONITOR instruction."),
    EXIT_REASON(SVM_EXIT_MWAIT          , 139, "MWAIT instruction."),
    EXIT_REASON(SVM_EXIT_MWAIT_ARMED    , 140, "MWAIT instruction when armed."),
    /* NOTE(review): labelled 1024, yet this entry occupies array slot 141 (it
       directly follows slot 140) - confirm how the consumers index it. */
    EXIT_REASON(SVM_EXIT_NPF            ,1024, "Nested paging fault."),
    EXIT_REASON_NIL()
};
# undef EXIT_REASON
# undef EXIT_REASON_NIL
#endif /* VBOX_WITH_STATISTICS */
275
/*
 * Writes the status of one feature flag to the release log, based on two
 * bit masks:
 *   - flag present in 'allowed1':  the flag name alone is logged;
 *   - flag absent from 'allowed1': "<flag> *must* be cleared" is logged;
 *   - flag present in 'disallowed0': "<flag> *must* be set" is logged as well.
 * 'featflag' is stringized for the message and evaluated twice.
 */
#define HMVMX_REPORT_FEATURE(allowed1, disallowed0, featflag) \
    do \
    { \
        if (!((allowed1) & (featflag))) \
        { \
            LogRel(("HM: " #featflag " *must* be cleared\n")); \
        } \
        else \
        { \
            LogRel(("HM: " #featflag "\n")); \
        } \
        if (((disallowed0) & (featflag)) != 0) \
        { \
            LogRel(("HM: " #featflag " *must* be set\n")); \
        } \
    } while (0)
285
/*
 * Writes one line to the release log for a feature flag: the bare flag name
 * when the flag is present in 'allowed1', otherwise "<flag> not supported".
 * 'featflag' is stringized for the message.
 */
#define HMVMX_REPORT_ALLOWED_FEATURE(allowed1, featflag) \
    do \
    { \
        if (!((allowed1) & (featflag))) \
        { \
            LogRel(("HM: " #featflag " not supported\n")); \
        } \
        else \
        { \
            LogRel(("HM: " #featflag "\n")); \
        } \
    } while (0)
293
/*
 * Writes the (stringized) capability name to the release log when the
 * capability bit is present in 'msrcaps'; logs nothing otherwise.
 */
#define HMVMX_REPORT_CAPABILITY(msrcaps, cap) \
    do \
    { \
        if (((msrcaps) & (cap)) != 0) \
        { \
            LogRel(("HM: " #cap "\n")); \
        } \
    } while (0)
299
300
301/*******************************************************************************
302* Internal Functions *
303*******************************************************************************/
304static DECLCALLBACK(int) hmR3Save(PVM pVM, PSSMHANDLE pSSM);
305static DECLCALLBACK(int) hmR3Load(PVM pVM, PSSMHANDLE pSSM, uint32_t uVersion, uint32_t uPass);
306static int hmR3InitCPU(PVM pVM);
307static int hmR3InitFinalizeR0(PVM pVM);
308static int hmR3InitFinalizeR0Intel(PVM pVM);
309static int hmR3InitFinalizeR0Amd(PVM pVM);
310static int hmR3TermCPU(PVM pVM);
311
312
313
314/**
315 * Initializes the HM.
316 *
317 * This reads the config and check whether VT-x or AMD-V hardware is available
318 * if configured to use it. This is one of the very first components to be
319 * initialized after CFGM, so that we can fall back to raw-mode early in the
320 * initialization process.
321 *
322 * Note that a lot of the set up work is done in ring-0 and thus postponed till
323 * the ring-3 and ring-0 callback to HMR3InitCompleted.
324 *
325 * @returns VBox status code.
326 * @param pVM Pointer to the VM.
327 *
328 * @remarks Be careful with what we call here, since most of the VMM components
329 * are uninitialized.
330 */
331VMMR3_INT_DECL(int) HMR3Init(PVM pVM)
332{
333 LogFlow(("HMR3Init\n"));
334
335 /*
336 * Assert alignment and sizes.
337 */
338 AssertCompileMemberAlignment(VM, hm.s, 32);
339 AssertCompile(sizeof(pVM->hm.s) <= sizeof(pVM->hm.padding));
340
341 /*
342 * Register the saved state data unit.
343 */
344 int rc = SSMR3RegisterInternal(pVM, "HWACCM", 0, HM_SSM_VERSION, sizeof(HM),
345 NULL, NULL, NULL,
346 NULL, hmR3Save, NULL,
347 NULL, hmR3Load, NULL);
348 if (RT_FAILURE(rc))
349 return rc;
350
351 /*
352 * Misc initialisation.
353 */
354 //pVM->hm.s.vmx.fSupported = false;
355 //pVM->hm.s.svm.fSupported = false;
356 //pVM->hm.s.vmx.fEnabled = false;
357 //pVM->hm.s.svm.fEnabled = false;
358 //pVM->hm.s.fNestedPaging = false;
359
360
361 /*
362 * Read configuration.
363 */
364 PCFGMNODE pCfgHM = CFGMR3GetChild(CFGMR3GetRoot(pVM), "HM/");
365
366 /** @cfgm{/HM/HMForced, bool, false}
367 * Forces hardware virtualization, no falling back on raw-mode. HM must be
368 * enabled, i.e. /HMEnabled must be true. */
369 bool fHMForced;
370#ifdef VBOX_WITH_RAW_MODE
371 rc = CFGMR3QueryBoolDef(pCfgHM, "HMForced", &fHMForced, false);
372 AssertRCReturn(rc, rc);
373 AssertLogRelMsgReturn(!fHMForced || pVM->fHMEnabled, ("Configuration error: HM forced but not enabled!\n"),
374 VERR_INVALID_PARAMETER);
375# if defined(RT_OS_DARWIN)
376 if (pVM->fHMEnabled)
377 fHMForced = true;
378# endif
379 AssertLogRelMsgReturn(pVM->cCpus == 1 || pVM->fHMEnabled, ("Configuration error: SMP requires HM to be enabled!\n"),
380 VERR_INVALID_PARAMETER);
381 if (pVM->cCpus > 1)
382 fHMForced = true;
383#else /* !VBOX_WITH_RAW_MODE */
384 AssertRelease(pVM->fHMEnabled);
385 fHMForced = true;
386#endif /* !VBOX_WITH_RAW_MODE */
387
388 /** @cfgm{/HM/EnableNestedPaging, bool, false}
389 * Enables nested paging (aka extended page tables). */
390 rc = CFGMR3QueryBoolDef(pCfgHM, "EnableNestedPaging", &pVM->hm.s.fAllowNestedPaging, false);
391 AssertRCReturn(rc, rc);
392
393 /** @cfgm{/HM/EnableUX, bool, true}
394 * Enables the VT-x unrestricted execution feature. */
395 rc = CFGMR3QueryBoolDef(pCfgHM, "EnableUX", &pVM->hm.s.vmx.fAllowUnrestricted, true);
396 AssertRCReturn(rc, rc);
397
398 /** @cfgm{/HM/EnableLargePages, bool, false}
399 * Enables using large pages (2 MB) for guest memory, thus saving on (nested)
400 * page table walking and maybe better TLB hit rate in some cases. */
401 rc = CFGMR3QueryBoolDef(pCfgHM, "EnableLargePages", &pVM->hm.s.fLargePages, false);
402 AssertRCReturn(rc, rc);
403
404 /** @cfgm{/HM/EnableVPID, bool, false}
405 * Enables the VT-x VPID feature. */
406 rc = CFGMR3QueryBoolDef(pCfgHM, "EnableVPID", &pVM->hm.s.vmx.fAllowVpid, false);
407 AssertRCReturn(rc, rc);
408
409 /** @cfgm{/HM/TPRPatchingEnabled, bool, false}
410 * Enables TPR patching for 32-bit windows guests with IO-APIC. */
411 rc = CFGMR3QueryBoolDef(pCfgHM, "TPRPatchingEnabled", &pVM->hm.s.fTRPPatchingAllowed, false);
412 AssertRCReturn(rc, rc);
413
414 /** @cfgm{/HM/64bitEnabled, bool, 32-bit:false, 64-bit:true}
415 * Enables AMD64 cpu features.
416 * On 32-bit hosts this isn't default and require host CPU support. 64-bit hosts
417 * already have the support. */
418#ifdef VBOX_ENABLE_64_BITS_GUESTS
419 rc = CFGMR3QueryBoolDef(pCfgHM, "64bitEnabled", &pVM->hm.s.fAllow64BitGuests, HC_ARCH_BITS == 64);
420 AssertLogRelRCReturn(rc, rc);
421#else
422 pVM->hm.s.fAllow64BitGuests = false;
423#endif
424
425 /** @cfgm{/HM/Exclusive, bool}
426 * Determines the init method for AMD-V and VT-x. If set to true, HM will do a
427 * global init for each host CPU. If false, we do local init each time we wish
428 * to execute guest code.
429 *
430 * Default is false for Mac OS X and Windows due to the higher risk of conflicts
431 * with other hypervisors.
432 */
433 rc = CFGMR3QueryBoolDef(pCfgHM, "Exclusive", &pVM->hm.s.fGlobalInit,
434#if defined(RT_OS_DARWIN) || defined(RT_OS_WINDOWS)
435 false
436#else
437 true
438#endif
439 );
440 AssertLogRelRCReturn(rc, rc);
441
442 /** @cfgm{/HM/MaxResumeLoops, uint32_t}
443 * The number of times to resume guest execution before we forcibly return to
444 * ring-3. The return value of RTThreadPreemptIsPendingTrusty in ring-0
445 * determines the default value. */
446 rc = CFGMR3QueryU32Def(pCfgHM, "MaxResumeLoops", &pVM->hm.s.cMaxResumeLoops, 0 /* set by R0 later */);
447 AssertLogRelRCReturn(rc, rc);
448
449 /*
450 * Check if VT-x or AMD-v support according to the users wishes.
451 */
452 /** @todo SUPR3QueryVTCaps won't catch VERR_VMX_IN_VMX_ROOT_MODE or
453 * VERR_SVM_IN_USE. */
454 if (pVM->fHMEnabled)
455 {
456 uint32_t fCaps;
457 rc = SUPR3QueryVTCaps(&fCaps);
458 if (RT_SUCCESS(rc))
459 {
460 if (fCaps & SUPVTCAPS_AMD_V)
461 LogRel(("HMR3Init: AMD-V%s\n", fCaps & SUPVTCAPS_NESTED_PAGING ? " w/ nested paging" : ""));
462 else if (fCaps & SUPVTCAPS_VT_X)
463 {
464 rc = SUPR3QueryVTxSupported();
465 if (RT_SUCCESS(rc))
466 LogRel(("HMR3Init: VT-x%s\n", fCaps & SUPVTCAPS_NESTED_PAGING ? " w/ nested paging" : ""));
467 else
468 {
469#ifdef RT_OS_LINUX
470 const char *pszMinReq = " Linux 2.6.13 or newer required!";
471#else
472 const char *pszMinReq = "";
473#endif
474 if (fHMForced)
475 return VMSetError(pVM, rc, RT_SRC_POS, "The host kernel does not support VT-x.%s\n", pszMinReq);
476
477 /* Fall back to raw-mode. */
478 LogRel(("HMR3Init: Falling back to raw-mode: The host kernel does not support VT-x.%s\n", pszMinReq));
479 pVM->fHMEnabled = false;
480 }
481 }
482 else
483 AssertLogRelMsgFailedReturn(("SUPR3QueryVTCaps didn't return either AMD-V or VT-x flag set (%#x)!\n", fCaps),
484 VERR_INTERNAL_ERROR_5);
485
486 /*
487 * Do we require a little bit or raw-mode for 64-bit guest execution?
488 */
489 pVM->fHMNeedRawModeCtx = HC_ARCH_BITS == 32
490 && pVM->fHMEnabled
491 && pVM->hm.s.fAllow64BitGuests;
492 }
493 else
494 {
495 const char *pszMsg;
496 switch (rc)
497 {
498 case VERR_UNSUPPORTED_CPU:
499 pszMsg = "Unknown CPU, VT-x or AMD-v features cannot be ascertained.";
500 break;
501
502 case VERR_VMX_NO_VMX:
503 pszMsg = "VT-x is not available.";
504 break;
505
506 case VERR_VMX_MSR_VMXON_DISABLED:
507 pszMsg = "VT-x is disabled in the BIOS.";
508 break;
509
510 case VERR_VMX_MSR_SMX_VMXON_DISABLED:
511 pszMsg = "VT-x is disabled in the BIOS for Safer-Mode/Trusted Extensions.";
512 break;
513
514 case VERR_VMX_MSR_LOCKING_FAILED:
515 pszMsg = "Failed to enable and lock VT-x features.";
516 break;
517
518 case VERR_SVM_NO_SVM:
519 pszMsg = "AMD-V is not available.";
520 break;
521
522 case VERR_SVM_DISABLED:
523 pszMsg = "AMD-V is disabled in the BIOS (or by the host OS).";
524 break;
525
526 default:
527 pszMsg = NULL;
528 break;
529 }
530 if (fHMForced && pszMsg)
531 return VM_SET_ERROR(pVM, rc, pszMsg);
532 if (!pszMsg)
533 return VMSetError(pVM, rc, RT_SRC_POS, "SUPR3QueryVTCaps failed with %Rrc", rc);
534
535 /* Fall back to raw-mode. */
536 LogRel(("HMR3Init: Falling back to raw-mode: %s\n", pszMsg));
537 pVM->fHMEnabled = false;
538 }
539 }
540
541 /* It's now OK to use the predicate function. */
542 pVM->fHMEnabledFixed = true;
543 return VINF_SUCCESS;
544}
545
546
547/**
548 * Initializes the per-VCPU HM.
549 *
550 * @returns VBox status code.
551 * @param pVM Pointer to the VM.
552 */
553static int hmR3InitCPU(PVM pVM)
554{
555 LogFlow(("HMR3InitCPU\n"));
556
557 if (!HMIsEnabled(pVM))
558 return VINF_SUCCESS;
559
560 for (VMCPUID i = 0; i < pVM->cCpus; i++)
561 {
562 PVMCPU pVCpu = &pVM->aCpus[i];
563 pVCpu->hm.s.fActive = false;
564 }
565
566#ifdef VBOX_WITH_STATISTICS
567 STAM_REG(pVM, &pVM->hm.s.StatTprPatchSuccess, STAMTYPE_COUNTER, "/HM/TPR/Patch/Success", STAMUNIT_OCCURENCES, "Number of times an instruction was successfully patched.");
568 STAM_REG(pVM, &pVM->hm.s.StatTprPatchFailure, STAMTYPE_COUNTER, "/HM/TPR/Patch/Failed", STAMUNIT_OCCURENCES, "Number of unsuccessful patch attempts.");
569 STAM_REG(pVM, &pVM->hm.s.StatTprReplaceSuccess, STAMTYPE_COUNTER, "/HM/TPR/Replace/Success",STAMUNIT_OCCURENCES, "Number of times an instruction was successfully patched.");
570 STAM_REG(pVM, &pVM->hm.s.StatTprReplaceFailure, STAMTYPE_COUNTER, "/HM/TPR/Replace/Failed", STAMUNIT_OCCURENCES, "Number of unsuccessful patch attempts.");
571#endif
572
573 /*
574 * Statistics.
575 */
576 for (VMCPUID i = 0; i < pVM->cCpus; i++)
577 {
578 PVMCPU pVCpu = &pVM->aCpus[i];
579 int rc;
580
581#ifdef VBOX_WITH_STATISTICS
582 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatPoke, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
583 "Profiling of RTMpPokeCpu",
584 "/PROF/CPU%d/HM/Poke", i);
585 AssertRC(rc);
586 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatSpinPoke, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
587 "Profiling of poke wait",
588 "/PROF/CPU%d/HM/PokeWait", i);
589 AssertRC(rc);
590 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatSpinPokeFailed, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
591 "Profiling of poke wait when RTMpPokeCpu fails",
592 "/PROF/CPU%d/HM/PokeWaitFailed", i);
593 AssertRC(rc);
594 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatEntry, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
595 "Profiling of VMXR0RunGuestCode entry",
596 "/PROF/CPU%d/HM/StatEntry", i);
597 AssertRC(rc);
598 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExit1, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
599 "Profiling of VMXR0RunGuestCode exit part 1",
600 "/PROF/CPU%d/HM/SwitchFromGC_1", i);
601 AssertRC(rc);
602 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExit2, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
603 "Profiling of VMXR0RunGuestCode exit part 2",
604 "/PROF/CPU%d/HM/SwitchFromGC_2", i);
605 AssertRC(rc);
606
607 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitIO, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
608 "I/O",
609 "/PROF/CPU%d/HM/SwitchFromGC_2/IO", i);
610 AssertRC(rc);
611 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitMovCRx, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
612 "MOV CRx",
613 "/PROF/CPU%d/HM/SwitchFromGC_2/MovCRx", i);
614 AssertRC(rc);
615 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitXcptNmi, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
616 "Exceptions, NMIs",
617 "/PROF/CPU%d/HM/SwitchFromGC_2/XcptNmi", i);
618 AssertRC(rc);
619
620 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatLoadGuestState, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
621 "Profiling of VMXR0LoadGuestState",
622 "/PROF/CPU%d/HM/StatLoadGuestState", i);
623 AssertRC(rc);
624 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatInGC, STAMTYPE_PROFILE, STAMVISIBILITY_USED, STAMUNIT_TICKS_PER_CALL,
625 "Profiling of VMLAUNCH/VMRESUME.",
626 "/PROF/CPU%d/HM/InGC", i);
627 AssertRC(rc);
628
629# if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
630 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatWorldSwitch3264, STAMTYPE_PROFILE, STAMVISIBILITY_USED,
631 STAMUNIT_TICKS_PER_CALL, "Profiling of the 32/64 switcher.",
632 "/PROF/CPU%d/HM/Switcher3264", i);
633 AssertRC(rc);
634# endif
635
636# ifdef HM_PROFILE_EXIT_DISPATCH
637 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitDispatch, STAMTYPE_PROFILE_ADV, STAMVISIBILITY_USED,
638 STAMUNIT_TICKS_PER_CALL, "Profiling the dispatching of exit handlers.",
639 "/PROF/CPU%d/HM/ExitDispatch", i);
640 AssertRC(rc);
641# endif
642
643#endif
644# define HM_REG_COUNTER(a, b, desc) \
645 rc = STAMR3RegisterF(pVM, a, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_OCCURENCES, desc, b, i); \
646 AssertRC(rc);
647
648#ifdef VBOX_WITH_STATISTICS
649 HM_REG_COUNTER(&pVCpu->hm.s.StatExitAll, "/HM/CPU%d/Exit/All", "Exits (total).");
650 HM_REG_COUNTER(&pVCpu->hm.s.StatExitShadowNM, "/HM/CPU%d/Exit/Trap/Shw/#NM", "Shadow #NM (device not available, no math co-processor) exception.");
651 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestNM, "/HM/CPU%d/Exit/Trap/Gst/#NM", "Guest #NM (device not available, no math co-processor) exception.");
652 HM_REG_COUNTER(&pVCpu->hm.s.StatExitShadowPF, "/HM/CPU%d/Exit/Trap/Shw/#PF", "Shadow #PF (page fault) exception.");
653 HM_REG_COUNTER(&pVCpu->hm.s.StatExitShadowPFEM, "/HM/CPU%d/Exit/Trap/Shw/#PF-EM", "#PF (page fault) exception going back to ring-3 for emulating the instruction.");
654 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestPF, "/HM/CPU%d/Exit/Trap/Gst/#PF", "Guest #PF (page fault) exception.");
655 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestUD, "/HM/CPU%d/Exit/Trap/Gst/#UD", "Guest #UD (undefined opcode) exception.");
656 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestSS, "/HM/CPU%d/Exit/Trap/Gst/#SS", "Guest #SS (stack-segment fault) exception.");
657 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestNP, "/HM/CPU%d/Exit/Trap/Gst/#NP", "Guest #NP (segment not present) exception.");
658 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestGP, "/HM/CPU%d/Exit/Trap/Gst/#GP", "Guest #GP (general protection) execption.");
659 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestMF, "/HM/CPU%d/Exit/Trap/Gst/#MF", "Guest #MF (x87 FPU error, math fault) exception.");
660 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestDE, "/HM/CPU%d/Exit/Trap/Gst/#DE", "Guest #DE (divide error) exception.");
661 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestDB, "/HM/CPU%d/Exit/Trap/Gst/#DB", "Guest #DB (debug) exception.");
662 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestBP, "/HM/CPU%d/Exit/Trap/Gst/#BP", "Guest #BP (breakpoint) exception.");
663 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestXF, "/HM/CPU%d/Exit/Trap/Gst/#XF", "Guest #XF (extended math fault, SIMD FPU) exception.");
664 HM_REG_COUNTER(&pVCpu->hm.s.StatExitGuestXcpUnk, "/HM/CPU%d/Exit/Trap/Gst/Other", "Other guest exceptions.");
665 HM_REG_COUNTER(&pVCpu->hm.s.StatExitInvlpg, "/HM/CPU%d/Exit/Instr/Invlpg", "Guest attempted to execute INVLPG.");
666 HM_REG_COUNTER(&pVCpu->hm.s.StatExitInvd, "/HM/CPU%d/Exit/Instr/Invd", "Guest attempted to execute INVD.");
667 HM_REG_COUNTER(&pVCpu->hm.s.StatExitWbinvd, "/HM/CPU%d/Exit/Instr/Wbinvd", "Guest attempted to execute WBINVD.");
668 HM_REG_COUNTER(&pVCpu->hm.s.StatExitPause, "/HM/CPU%d/Exit/Instr/Pause", "Guest attempted to execute PAUSE.");
669 HM_REG_COUNTER(&pVCpu->hm.s.StatExitCpuid, "/HM/CPU%d/Exit/Instr/Cpuid", "Guest attempted to execute CPUID.");
670 HM_REG_COUNTER(&pVCpu->hm.s.StatExitRdtsc, "/HM/CPU%d/Exit/Instr/Rdtsc", "Guest attempted to execute RDTSC.");
671 HM_REG_COUNTER(&pVCpu->hm.s.StatExitRdtscp, "/HM/CPU%d/Exit/Instr/Rdtscp", "Guest attempted to execute RDTSCP.");
672 HM_REG_COUNTER(&pVCpu->hm.s.StatExitRdpmc, "/HM/CPU%d/Exit/Instr/Rdpmc", "Guest attempted to execute RDPMC.");
673 HM_REG_COUNTER(&pVCpu->hm.s.StatExitRdrand, "/HM/CPU%d/Exit/Instr/Rdrand", "Guest attempted to execute RDRAND.");
674 HM_REG_COUNTER(&pVCpu->hm.s.StatExitRdmsr, "/HM/CPU%d/Exit/Instr/Rdmsr", "Guest attempted to execute RDMSR.");
675 HM_REG_COUNTER(&pVCpu->hm.s.StatExitWrmsr, "/HM/CPU%d/Exit/Instr/Wrmsr", "Guest attempted to execute WRMSR.");
676 HM_REG_COUNTER(&pVCpu->hm.s.StatExitMwait, "/HM/CPU%d/Exit/Instr/Mwait", "Guest attempted to execute MWAIT.");
677 HM_REG_COUNTER(&pVCpu->hm.s.StatExitMonitor, "/HM/CPU%d/Exit/Instr/Monitor", "Guest attempted to execute MONITOR.");
678 HM_REG_COUNTER(&pVCpu->hm.s.StatExitDRxWrite, "/HM/CPU%d/Exit/Instr/DR/Write", "Guest attempted to write a debug register.");
679 HM_REG_COUNTER(&pVCpu->hm.s.StatExitDRxRead, "/HM/CPU%d/Exit/Instr/DR/Read", "Guest attempted to read a debug register.");
680 HM_REG_COUNTER(&pVCpu->hm.s.StatExitClts, "/HM/CPU%d/Exit/Instr/CLTS", "Guest attempted to execute CLTS.");
681 HM_REG_COUNTER(&pVCpu->hm.s.StatExitLmsw, "/HM/CPU%d/Exit/Instr/LMSW", "Guest attempted to execute LMSW.");
682 HM_REG_COUNTER(&pVCpu->hm.s.StatExitCli, "/HM/CPU%d/Exit/Instr/Cli", "Guest attempted to execute CLI.");
683 HM_REG_COUNTER(&pVCpu->hm.s.StatExitSti, "/HM/CPU%d/Exit/Instr/Sti", "Guest attempted to execute STI.");
684 HM_REG_COUNTER(&pVCpu->hm.s.StatExitPushf, "/HM/CPU%d/Exit/Instr/Pushf", "Guest attempted to execute PUSHF.");
685 HM_REG_COUNTER(&pVCpu->hm.s.StatExitPopf, "/HM/CPU%d/Exit/Instr/Popf", "Guest attempted to execute POPF.");
686 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIret, "/HM/CPU%d/Exit/Instr/Iret", "Guest attempted to execute IRET.");
687 HM_REG_COUNTER(&pVCpu->hm.s.StatExitInt, "/HM/CPU%d/Exit/Instr/Int", "Guest attempted to execute INT.");
688 HM_REG_COUNTER(&pVCpu->hm.s.StatExitHlt, "/HM/CPU%d/Exit/Instr/Hlt", "Guest attempted to execute HLT.");
689 HM_REG_COUNTER(&pVCpu->hm.s.StatExitXdtrAccess, "/HM/CPU%d/Exit/Instr/XdtrAccess", "Guest attempted to access descriptor table register (GDTR, IDTR, LDTR).");
690 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIOWrite, "/HM/CPU%d/Exit/IO/Write", "I/O write.");
691 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIORead, "/HM/CPU%d/Exit/IO/Read", "I/O read.");
692 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIOStringWrite, "/HM/CPU%d/Exit/IO/WriteString", "String I/O write.");
693 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIOStringRead, "/HM/CPU%d/Exit/IO/ReadString", "String I/O read.");
694 HM_REG_COUNTER(&pVCpu->hm.s.StatExitIntWindow, "/HM/CPU%d/Exit/IntWindow", "Interrupt-window exit. Guest is ready to receive interrupts again.");
695 HM_REG_COUNTER(&pVCpu->hm.s.StatExitMaxResume, "/HM/CPU%d/Exit/MaxResume", "Maximum VMRESUME inner-loop counter reached.");
696 HM_REG_COUNTER(&pVCpu->hm.s.StatExitExtInt, "/HM/CPU%d/Exit/ExtInt", "Host interrupt received.");
697#endif
698 HM_REG_COUNTER(&pVCpu->hm.s.StatExitHostNmiInGC, "/HM/CPU%d/Exit/HostNmiInGC", "Host NMI received while in guest context.");
699#ifdef VBOX_WITH_STATISTICS
700 HM_REG_COUNTER(&pVCpu->hm.s.StatExitPreemptTimer, "/HM/CPU%d/Exit/PreemptTimer", "VMX-preemption timer expired.");
701 HM_REG_COUNTER(&pVCpu->hm.s.StatExitTprBelowThreshold, "/HM/CPU%d/Exit/TprBelowThreshold", "TPR lowered below threshold by the guest.");
702 HM_REG_COUNTER(&pVCpu->hm.s.StatExitTaskSwitch, "/HM/CPU%d/Exit/TaskSwitch", "Guest attempted a task switch.");
703 HM_REG_COUNTER(&pVCpu->hm.s.StatExitMtf, "/HM/CPU%d/Exit/MonitorTrapFlag", "Monitor Trap Flag.");
704 HM_REG_COUNTER(&pVCpu->hm.s.StatExitApicAccess, "/HM/CPU%d/Exit/ApicAccess", "APIC access. Guest attempted to access memory at a physical address on the APIC-access page.");
705
706 HM_REG_COUNTER(&pVCpu->hm.s.StatSwitchGuestIrq, "/HM/CPU%d/Switch/IrqPending", "PDMGetInterrupt() cleared behind our back!?!.");
707 HM_REG_COUNTER(&pVCpu->hm.s.StatPendingHostIrq, "/HM/CPU%d/Switch/PendingHostIrq", "Exit to ring-3 due to pending host interrupt before executing guest code.");
708 HM_REG_COUNTER(&pVCpu->hm.s.StatSwitchHmToR3FF, "/HM/CPU%d/Switch/HmToR3FF", "Exit to ring-3 due to pending timers, EMT rendezvous, critical section etc.");
709 HM_REG_COUNTER(&pVCpu->hm.s.StatSwitchExitToR3, "/HM/CPU%d/Switch/ExitToR3", "Exit to ring-3 (total).");
710 HM_REG_COUNTER(&pVCpu->hm.s.StatSwitchLongJmpToR3, "/HM/CPU%d/Switch/LongJmpToR3", "Longjump to ring-3.");
711
712 HM_REG_COUNTER(&pVCpu->hm.s.StatInjectInterrupt, "/HM/CPU%d/EventInject/Interrupt", "Injected an external interrupt into the guest.");
713 HM_REG_COUNTER(&pVCpu->hm.s.StatInjectXcpt, "/HM/CPU%d/EventInject/Trap", "Injected an exception into the guest.");
714 HM_REG_COUNTER(&pVCpu->hm.s.StatInjectPendingReflect, "/HM/CPU%d/EventInject/PendingReflect", "Reflecting an exception back to the guest.");
715
716 HM_REG_COUNTER(&pVCpu->hm.s.StatPreemptPreempting, "/HM/CPU%d/Preempt/Preempting", "EMT has been preempted while in HM context.");
717 HM_REG_COUNTER(&pVCpu->hm.s.StatPreemptSaveHostState, "/HM/CPU%d/Preempt/SaveHostState", "Preemption caused us to resave host state.");
718
719 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushPage, "/HM/CPU%d/Flush/Page", "Invalidating a guest page on all guest CPUs.");
720 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushPageManual, "/HM/CPU%d/Flush/Page/Virt", "Invalidating a guest page using guest-virtual address.");
721 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushPhysPageManual, "/HM/CPU%d/Flush/Page/Phys", "Invalidating a guest page using guest-physical address.");
722 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushTlb, "/HM/CPU%d/Flush/TLB", "Forcing a full guest-TLB flush (ring-0).");
723 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushTlbManual, "/HM/CPU%d/Flush/TLB/Manual", "Request a full guest-TLB flush.");
724 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushTlbWorldSwitch, "/HM/CPU%d/Flush/TLB/CpuSwitch", "Forcing a full guest-TLB flush due to host-CPU reschedule or ASID-limit hit by another guest-VCPU.");
725 HM_REG_COUNTER(&pVCpu->hm.s.StatNoFlushTlbWorldSwitch, "/HM/CPU%d/Flush/TLB/Skipped", "No TLB flushing required.");
726 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushEntire, "/HM/CPU%d/Flush/TLB/Entire", "Flush the entire TLB (host + guest).");
727 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushAsid, "/HM/CPU%d/Flush/TLB/ASID", "Flushed guest-TLB entries for the current VPID.");
728 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushNestedPaging, "/HM/CPU%d/Flush/TLB/NestedPaging", "Flushed guest-TLB entries for the current EPT.");
729 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushTlbInvlpgVirt, "/HM/CPU%d/Flush/TLB/InvlpgVirt", "Invalidated a guest-TLB entry for a guest-virtual address.");
730 HM_REG_COUNTER(&pVCpu->hm.s.StatFlushTlbInvlpgPhys, "/HM/CPU%d/Flush/TLB/InvlpgPhys", "Currently not possible, flushes entire guest-TLB.");
731 HM_REG_COUNTER(&pVCpu->hm.s.StatTlbShootdown, "/HM/CPU%d/Flush/Shootdown/Page", "Inter-VCPU request to flush queued guest page.");
732 HM_REG_COUNTER(&pVCpu->hm.s.StatTlbShootdownFlush, "/HM/CPU%d/Flush/Shootdown/TLB", "Inter-VCPU request to flush entire guest-TLB.");
733
734 HM_REG_COUNTER(&pVCpu->hm.s.StatTscOffset, "/HM/CPU%d/TSC/Offset", "TSC offsetting is in effect.");
735 HM_REG_COUNTER(&pVCpu->hm.s.StatTscIntercept, "/HM/CPU%d/TSC/Intercept", "Guest is in catchup mode, intercept TSC accesses.");
736 HM_REG_COUNTER(&pVCpu->hm.s.StatTscInterceptOverFlow, "/HM/CPU%d/TSC/InterceptOverflow", "TSC offset overflow, fallback to intercept TSC accesses.");
737
738 HM_REG_COUNTER(&pVCpu->hm.s.StatDRxArmed, "/HM/CPU%d/Debug/Armed", "Loaded guest-debug state while loading guest-state.");
739 HM_REG_COUNTER(&pVCpu->hm.s.StatDRxContextSwitch, "/HM/CPU%d/Debug/ContextSwitch", "Loaded guest-debug state on MOV DRx.");
740 HM_REG_COUNTER(&pVCpu->hm.s.StatDRxIoCheck, "/HM/CPU%d/Debug/IOCheck", "Checking for I/O breakpoint.");
741
742 HM_REG_COUNTER(&pVCpu->hm.s.StatLoadMinimal, "/HM/CPU%d/Load/Minimal", "VM-entry loading minimal guest-state.");
743 HM_REG_COUNTER(&pVCpu->hm.s.StatLoadFull, "/HM/CPU%d/Load/Full", "VM-entry loading the full guest-state.");
744
745 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadRmSelBase, "/HM/CPU%d/VMXCheck/RMSelBase", "Could not use VMX due to unsuitable real-mode selector base.");
746 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadRmSelLimit, "/HM/CPU%d/VMXCheck/RMSelLimit", "Could not use VMX due to unsuitable real-mode selector limit.");
747 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckRmOk, "/HM/CPU%d/VMXCheck/VMX_RM", "VMX execution in real (V86) mode OK.");
748 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadSel, "/HM/CPU%d/VMXCheck/Selector", "Could not use VMX due to unsuitable selector.");
749 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadRpl, "/HM/CPU%d/VMXCheck/RPL", "Could not use VMX due to unsuitable RPL.");
750 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadLdt, "/HM/CPU%d/VMXCheck/LDT", "Could not use VMX due to unsuitable LDT.");
751 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckBadTr, "/HM/CPU%d/VMXCheck/TR", "Could not use VMX due to unsuitable TR.");
752 HM_REG_COUNTER(&pVCpu->hm.s.StatVmxCheckPmOk, "/HM/CPU%d/VMXCheck/VMX_PM", "VMX execution in protected mode OK.");
753
754#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
755 HM_REG_COUNTER(&pVCpu->hm.s.StatFpu64SwitchBack, "/HM/CPU%d/Switch64/Fpu", "Saving guest FPU/XMM state.");
756 HM_REG_COUNTER(&pVCpu->hm.s.StatDebug64SwitchBack, "/HM/CPU%d/Switch64/Debug", "Saving guest debug state.");
757#endif
758
759 for (unsigned j = 0; j < RT_ELEMENTS(pVCpu->hm.s.StatExitCRxWrite); j++)
760 {
761 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitCRxWrite[j], STAMTYPE_COUNTER, STAMVISIBILITY_USED,
762 STAMUNIT_OCCURENCES, "Profiling of CRx writes",
763 "/HM/CPU%d/Exit/Instr/CR/Write/%x", i, j);
764 AssertRC(rc);
765 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitCRxRead[j], STAMTYPE_COUNTER, STAMVISIBILITY_USED,
766 STAMUNIT_OCCURENCES, "Profiling of CRx reads",
767 "/HM/CPU%d/Exit/Instr/CR/Read/%x", i, j);
768 AssertRC(rc);
769 }
770
771#undef HM_REG_COUNTER
772
773 pVCpu->hm.s.paStatExitReason = NULL;
774
775 rc = MMHyperAlloc(pVM, MAX_EXITREASON_STAT*sizeof(*pVCpu->hm.s.paStatExitReason), 0, MM_TAG_HM,
776 (void **)&pVCpu->hm.s.paStatExitReason);
777 AssertRC(rc);
778 if (RT_SUCCESS(rc))
779 {
780 const char * const *papszDesc = ASMIsIntelCpu() ? &g_apszVTxExitReasons[0] : &g_apszAmdVExitReasons[0];
781 for (int j = 0; j < MAX_EXITREASON_STAT; j++)
782 {
783 if (papszDesc[j])
784 {
785 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.paStatExitReason[j], STAMTYPE_COUNTER, STAMVISIBILITY_USED,
786 STAMUNIT_OCCURENCES, papszDesc[j], "/HM/CPU%d/Exit/Reason/%02x", i, j);
787 AssertRC(rc);
788 }
789 }
790 rc = STAMR3RegisterF(pVM, &pVCpu->hm.s.StatExitReasonNpf, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_OCCURENCES,
791 "Nested page fault", "/HM/CPU%d/Exit/Reason/#NPF", i);
792 AssertRC(rc);
793 }
794 pVCpu->hm.s.paStatExitReasonR0 = MMHyperR3ToR0(pVM, pVCpu->hm.s.paStatExitReason);
795# ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
796 Assert(pVCpu->hm.s.paStatExitReasonR0 != NIL_RTR0PTR || !HMIsEnabled(pVM));
797# else
798 Assert(pVCpu->hm.s.paStatExitReasonR0 != NIL_RTR0PTR);
799# endif
800
801 rc = MMHyperAlloc(pVM, sizeof(STAMCOUNTER) * 256, 8, MM_TAG_HM, (void **)&pVCpu->hm.s.paStatInjectedIrqs);
802 AssertRCReturn(rc, rc);
803 pVCpu->hm.s.paStatInjectedIrqsR0 = MMHyperR3ToR0(pVM, pVCpu->hm.s.paStatInjectedIrqs);
804# ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
805 Assert(pVCpu->hm.s.paStatInjectedIrqsR0 != NIL_RTR0PTR || !HMIsEnabled(pVM));
806# else
807 Assert(pVCpu->hm.s.paStatInjectedIrqsR0 != NIL_RTR0PTR);
808# endif
809 for (unsigned j = 0; j < 255; j++)
810 {
811 STAMR3RegisterF(pVM, &pVCpu->hm.s.paStatInjectedIrqs[j], STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_OCCURENCES,
812 "Injected event.",
813 (j < 0x20) ? "/HM/CPU%d/EventInject/Event/Trap/%02X" : "/HM/CPU%d/EventInject/Event/IRQ/%02X", i, j);
814 }
815
816#endif /* VBOX_WITH_STATISTICS */
817 }
818
819#ifdef VBOX_WITH_CRASHDUMP_MAGIC
820 /*
821 * Magic marker for searching in crash dumps.
822 */
823 for (VMCPUID i = 0; i < pVM->cCpus; i++)
824 {
825 PVMCPU pVCpu = &pVM->aCpus[i];
826
827 PVMCSCACHE pCache = &pVCpu->hm.s.vmx.VMCSCache;
828 strcpy((char *)pCache->aMagic, "VMCSCACHE Magic");
829 pCache->uMagic = UINT64_C(0xDEADBEEFDEADBEEF);
830 }
831#endif
832
833 return VINF_SUCCESS;
834}
835
836
837/**
838 * Called when a init phase has completed.
839 *
840 * @returns VBox status code.
841 * @param pVM The VM.
842 * @param enmWhat The phase that completed.
843 */
844VMMR3_INT_DECL(int) HMR3InitCompleted(PVM pVM, VMINITCOMPLETED enmWhat)
845{
846 switch (enmWhat)
847 {
848 case VMINITCOMPLETED_RING3:
849 return hmR3InitCPU(pVM);
850 case VMINITCOMPLETED_RING0:
851 return hmR3InitFinalizeR0(pVM);
852 default:
853 return VINF_SUCCESS;
854 }
855}
856
857
858/**
859 * Turns off normal raw mode features.
860 *
861 * @param pVM Pointer to the VM.
862 */
863static void hmR3DisableRawMode(PVM pVM)
864{
865 /* Reinit the paging mode to force the new shadow mode. */
866 for (VMCPUID i = 0; i < pVM->cCpus; i++)
867 {
868 PVMCPU pVCpu = &pVM->aCpus[i];
869
870 PGMR3ChangeMode(pVM, pVCpu, PGMMODE_REAL);
871 }
872}
873
874
875/**
876 * Initialize VT-x or AMD-V.
877 *
878 * @returns VBox status code.
879 * @param pVM Pointer to the VM.
880 */
881static int hmR3InitFinalizeR0(PVM pVM)
882{
883 int rc;
884
885 if (!HMIsEnabled(pVM))
886 return VINF_SUCCESS;
887
888 /*
889 * Hack to allow users to work around broken BIOSes that incorrectly set
890 * EFER.SVME, which makes us believe somebody else is already using AMD-V.
891 */
892 if ( !pVM->hm.s.vmx.fSupported
893 && !pVM->hm.s.svm.fSupported
894 && pVM->hm.s.lLastError == VERR_SVM_IN_USE /* implies functional AMD-V */
895 && RTEnvExist("VBOX_HWVIRTEX_IGNORE_SVM_IN_USE"))
896 {
897 LogRel(("HM: VBOX_HWVIRTEX_IGNORE_SVM_IN_USE active!\n"));
898 pVM->hm.s.svm.fSupported = true;
899 pVM->hm.s.svm.fIgnoreInUseError = true;
900 pVM->hm.s.lLastError = VINF_SUCCESS;
901 }
902
903 /*
904 * Report ring-0 init errors.
905 */
906 if ( !pVM->hm.s.vmx.fSupported
907 && !pVM->hm.s.svm.fSupported)
908 {
909 LogRel(("HM: Failed to initialize VT-x / AMD-V: %Rrc\n", pVM->hm.s.lLastError));
910 LogRel(("HM: VMX MSR_IA32_FEATURE_CONTROL=%RX64\n", pVM->hm.s.vmx.Msrs.u64FeatureCtrl));
911 switch (pVM->hm.s.lLastError)
912 {
913 case VERR_VMX_IN_VMX_ROOT_MODE:
914 return VM_SET_ERROR(pVM, VERR_VMX_IN_VMX_ROOT_MODE, "VT-x is being used by another hypervisor.");
915 case VERR_VMX_NO_VMX:
916 return VM_SET_ERROR(pVM, VERR_VMX_NO_VMX, "VT-x is not available.");
917 case VERR_VMX_MSR_VMXON_DISABLED:
918 return VM_SET_ERROR(pVM, VERR_VMX_NO_VMX, "VT-x is disabled in the BIOS.");
919 case VERR_VMX_MSR_SMX_VMXON_DISABLED:
920 return VM_SET_ERROR(pVM, VERR_VMX_NO_VMX, "VT-x is disabled in the BIOS for Safer-Mode/Trusted Extensions.");
921 case VERR_VMX_MSR_LOCKING_FAILED:
922 return VM_SET_ERROR(pVM, VERR_VMX_NO_VMX, "Failed to enable and lock VT-x features.");
923
924 case VERR_SVM_IN_USE:
925 return VM_SET_ERROR(pVM, VERR_SVM_IN_USE, "AMD-V is being used by another hypervisor.");
926 case VERR_SVM_NO_SVM:
927 return VM_SET_ERROR(pVM, VERR_SVM_NO_SVM, "AMD-V is not available.");
928 case VERR_SVM_DISABLED:
929 return VM_SET_ERROR(pVM, VERR_SVM_DISABLED, "AMD-V is disabled in the BIOS.");
930 }
931 return VMSetError(pVM, pVM->hm.s.lLastError, RT_SRC_POS, "HM ring-0 init failed: %Rrc", pVM->hm.s.lLastError);
932 }
933
934 /*
935 * Enable VT-x or AMD-V on all host CPUs.
936 */
937 rc = SUPR3CallVMMR0Ex(pVM->pVMR0, 0 /*idCpu*/, VMMR0_DO_HM_ENABLE, 0, NULL);
938 if (RT_FAILURE(rc))
939 {
940 LogRel(("HMR3InitFinalize: SUPR3CallVMMR0Ex VMMR0_DO_HM_ENABLE failed with %Rrc\n", rc));
941 return rc;
942 }
943
944 /*
945 * No TPR patching is required when the IO-APIC is not enabled for this VM.
946 * (Main should have taken care of this already)
947 */
948 pVM->hm.s.fHasIoApic = PDMHasIoApic(pVM);
949 if (!pVM->hm.s.fHasIoApic)
950 {
951 Assert(!pVM->hm.s.fTRPPatchingAllowed); /* paranoia */
952 pVM->hm.s.fTRPPatchingAllowed = false;
953 }
954
955 /*
956 * Do the vendor specific initalization .
957 * .
958 * Note! We disable release log buffering here since we're doing relatively .
959 * lot of logging and doesn't want to hit the disk with each LogRel .
960 * statement.
961 */
962 AssertLogRelReturn(!pVM->hm.s.fInitialized, VERR_HM_IPE_5);
963 bool fOldBuffered = RTLogRelSetBuffering(true /*fBuffered*/);
964 if (pVM->hm.s.vmx.fSupported)
965 rc = hmR3InitFinalizeR0Intel(pVM);
966 else
967 rc = hmR3InitFinalizeR0Amd(pVM);
968 LogRel(("HM: VT-x/AMD-V init method: %s\n", (pVM->hm.s.fGlobalInit) ? "GLOBAL" : "LOCAL"));
969 RTLogRelSetBuffering(fOldBuffered);
970 pVM->hm.s.fInitialized = true;
971
972 return rc;
973}
974
975
976/**
977 * Finish VT-x initialization (after ring-0 init).
978 *
979 * @returns VBox status code.
980 * @param pVM The cross context VM structure.
981 */
982static int hmR3InitFinalizeR0Intel(PVM pVM)
983{
984 int rc;
985
986 Log(("pVM->hm.s.vmx.fSupported = %d\n", pVM->hm.s.vmx.fSupported));
987 AssertLogRelReturn(pVM->hm.s.vmx.Msrs.u64FeatureCtrl != 0, VERR_HM_IPE_4);
988
989 uint64_t val;
990 uint64_t zap;
991 RTGCPHYS GCPhys = 0;
992
993 LogRel(("HM: Using VT-x implementation 2.0!\n"));
994 LogRel(("HM: Host CR4 = %#RX64\n", pVM->hm.s.vmx.u64HostCr4));
995 LogRel(("HM: MSR_IA32_FEATURE_CONTROL = %#RX64\n", pVM->hm.s.vmx.Msrs.u64FeatureCtrl));
996 LogRel(("HM: MSR_IA32_VMX_BASIC_INFO = %#RX64\n", pVM->hm.s.vmx.Msrs.u64BasicInfo));
997 LogRel(("HM: VMCS id = %#x\n", MSR_IA32_VMX_BASIC_INFO_VMCS_ID(pVM->hm.s.vmx.Msrs.u64BasicInfo)));
998 LogRel(("HM: VMCS size = %u\n", MSR_IA32_VMX_BASIC_INFO_VMCS_SIZE(pVM->hm.s.vmx.Msrs.u64BasicInfo)));
999 LogRel(("HM: VMCS physical address limit = %s\n", MSR_IA32_VMX_BASIC_INFO_VMCS_PHYS_WIDTH(pVM->hm.s.vmx.Msrs.u64BasicInfo) ? "< 4 GB" : "None"));
1000 LogRel(("HM: VMCS memory type = %#x\n", MSR_IA32_VMX_BASIC_INFO_VMCS_MEM_TYPE(pVM->hm.s.vmx.Msrs.u64BasicInfo)));
1001 LogRel(("HM: Dual-monitor treatment support = %RTbool\n", !!MSR_IA32_VMX_BASIC_INFO_VMCS_DUAL_MON(pVM->hm.s.vmx.Msrs.u64BasicInfo)));
1002 LogRel(("HM: OUTS & INS instruction-info = %RTbool\n", !!MSR_IA32_VMX_BASIC_INFO_VMCS_INS_OUTS(pVM->hm.s.vmx.Msrs.u64BasicInfo)));
1003 LogRel(("HM: Max resume loops = %u\n", pVM->hm.s.cMaxResumeLoops));
1004
1005 LogRel(("HM: MSR_IA32_VMX_PINBASED_CTLS = %#RX64\n", pVM->hm.s.vmx.Msrs.VmxPinCtls.u));
1006 val = pVM->hm.s.vmx.Msrs.VmxPinCtls.n.allowed1;
1007 zap = pVM->hm.s.vmx.Msrs.VmxPinCtls.n.disallowed0;
1008 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PIN_EXEC_EXT_INT_EXIT);
1009 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PIN_EXEC_NMI_EXIT);
1010 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PIN_EXEC_VIRTUAL_NMI);
1011 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PIN_EXEC_PREEMPT_TIMER);
1012
1013 LogRel(("HM: MSR_IA32_VMX_PROCBASED_CTLS = %#RX64\n", pVM->hm.s.vmx.Msrs.VmxProcCtls.u));
1014 val = pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1;
1015 zap = pVM->hm.s.vmx.Msrs.VmxProcCtls.n.disallowed0;
1016 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_INT_WINDOW_EXIT);
1017 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_USE_TSC_OFFSETTING);
1018 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_HLT_EXIT);
1019 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_INVLPG_EXIT);
1020 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_MWAIT_EXIT);
1021 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_RDPMC_EXIT);
1022 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_RDTSC_EXIT);
1023 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_CR3_LOAD_EXIT);
1024 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_CR3_STORE_EXIT);
1025 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_CR8_LOAD_EXIT);
1026 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_CR8_STORE_EXIT);
1027 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_USE_TPR_SHADOW);
1028 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_NMI_WINDOW_EXIT);
1029 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_MOV_DR_EXIT);
1030 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_UNCOND_IO_EXIT);
1031 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_USE_IO_BITMAPS);
1032 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_MONITOR_TRAP_FLAG);
1033 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_USE_MSR_BITMAPS);
1034 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_MONITOR_EXIT);
1035 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_PAUSE_EXIT);
1036 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC_USE_SECONDARY_EXEC_CTRL);
1037 if (pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_SECONDARY_EXEC_CTRL)
1038 {
1039 LogRel(("HM: MSR_IA32_VMX_PROCBASED_CTLS2 = %#RX64\n", pVM->hm.s.vmx.Msrs.VmxProcCtls2.u));
1040 val = pVM->hm.s.vmx.Msrs.VmxProcCtls2.n.allowed1;
1041 zap = pVM->hm.s.vmx.Msrs.VmxProcCtls2.n.disallowed0;
1042 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_VIRT_APIC);
1043 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_EPT);
1044 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_DESCRIPTOR_TABLE_EXIT);
1045 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_RDTSCP);
1046 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_VIRT_X2APIC);
1047 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_VPID);
1048 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_WBINVD_EXIT);
1049 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_UNRESTRICTED_GUEST);
1050 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_PAUSE_LOOP_EXIT);
1051 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_RDRAND_EXIT);
1052 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_INVPCID);
1053 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_PROC_EXEC2_VMFUNC);
1054 }
1055
1056 LogRel(("HM: MSR_IA32_VMX_ENTRY_CTLS = %#RX64\n", pVM->hm.s.vmx.Msrs.VmxEntry.u));
1057 val = pVM->hm.s.vmx.Msrs.VmxEntry.n.allowed1;
1058 zap = pVM->hm.s.vmx.Msrs.VmxEntry.n.disallowed0;
1059 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_LOAD_DEBUG);
1060 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_IA32E_MODE_GUEST);
1061 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_ENTRY_SMM);
1062 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_DEACTIVATE_DUALMON);
1063 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_LOAD_GUEST_PERF_MSR);
1064 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_LOAD_GUEST_PAT_MSR);
1065 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_ENTRY_LOAD_GUEST_EFER_MSR);
1066
1067 LogRel(("HM: MSR_IA32_VMX_EXIT_CTLS = %#RX64\n", pVM->hm.s.vmx.Msrs.VmxExit.u));
1068 val = pVM->hm.s.vmx.Msrs.VmxExit.n.allowed1;
1069 zap = pVM->hm.s.vmx.Msrs.VmxExit.n.disallowed0;
1070 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_SAVE_DEBUG);
1071 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_HOST_ADDR_SPACE_SIZE);
1072 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_LOAD_PERF_MSR);
1073 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_ACK_EXT_INT);
1074 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_SAVE_GUEST_PAT_MSR);
1075 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_LOAD_HOST_PAT_MSR);
1076 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_SAVE_GUEST_EFER_MSR);
1077 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_LOAD_HOST_EFER_MSR);
1078 HMVMX_REPORT_FEATURE(val, zap, VMX_VMCS_CTRL_EXIT_SAVE_VMX_PREEMPT_TIMER);
1079
1080 if (pVM->hm.s.vmx.Msrs.u64EptVpidCaps)
1081 {
1082 val = pVM->hm.s.vmx.Msrs.u64EptVpidCaps;
1083 LogRel(("HM: MSR_IA32_VMX_EPT_VPID_CAP = %#RX64\n", val));
1084 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_RWX_X_ONLY);
1085 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_RWX_W_ONLY);
1086 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_RWX_WX_ONLY);
1087 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_GAW_21_BITS);
1088 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_GAW_30_BITS);
1089 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_GAW_39_BITS);
1090 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_GAW_48_BITS);
1091 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_GAW_57_BITS);
1092 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_EMT_UC);
1093 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_EMT_WC);
1094 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_EMT_WT);
1095 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_EMT_WP);
1096 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_EMT_WB);
1097 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_SP_21_BITS);
1098 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_SP_30_BITS);
1099 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_SP_39_BITS);
1100 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_SP_48_BITS);
1101 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVEPT);
1102 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVEPT_SINGLE_CONTEXT);
1103 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVEPT_ALL_CONTEXTS);
1104 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVVPID);
1105 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_INDIV_ADDR);
1106 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_SINGLE_CONTEXT);
1107 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_ALL_CONTEXTS);
1108 HMVMX_REPORT_CAPABILITY(val, MSR_IA32_VMX_EPT_VPID_CAP_INVVPID_SINGLE_CONTEXT_RETAIN_GLOBALS);
1109 }
1110
1111 val = pVM->hm.s.vmx.Msrs.u64Misc;
1112 LogRel(("HM: MSR_IA32_VMX_MISC = %#RX64\n", val));
1113 if (MSR_IA32_VMX_MISC_PREEMPT_TSC_BIT(val) == pVM->hm.s.vmx.cPreemptTimerShift)
1114 LogRel(("HM: MSR_IA32_VMX_MISC_PREEMPT_TSC_BIT = %#x\n", MSR_IA32_VMX_MISC_PREEMPT_TSC_BIT(val)));
1115 else
1116 {
1117 LogRel(("HM: MSR_IA32_VMX_MISC_PREEMPT_TSC_BIT = %#x - erratum detected, using %#x instead\n",
1118 MSR_IA32_VMX_MISC_PREEMPT_TSC_BIT(val), pVM->hm.s.vmx.cPreemptTimerShift));
1119 }
1120
1121 LogRel(("HM: MSR_IA32_VMX_MISC_STORE_EFERLMA_VMEXIT = %RTbool\n", !!MSR_IA32_VMX_MISC_STORE_EFERLMA_VMEXIT(val)));
1122 LogRel(("HM: MSR_IA32_VMX_MISC_ACTIVITY_STATES = %#x\n", MSR_IA32_VMX_MISC_ACTIVITY_STATES(val)));
1123 LogRel(("HM: MSR_IA32_VMX_MISC_CR3_TARGET = %#x\n", MSR_IA32_VMX_MISC_CR3_TARGET(val)));
1124 LogRel(("HM: MSR_IA32_VMX_MISC_MAX_MSR = %u\n", MSR_IA32_VMX_MISC_MAX_MSR(val)));
1125 LogRel(("HM: MSR_IA32_VMX_MISC_RDMSR_SMBASE_MSR_SMM = %RTbool\n", !!MSR_IA32_VMX_MISC_RDMSR_SMBASE_MSR_SMM(val)));
1126 LogRel(("HM: MSR_IA32_VMX_MISC_SMM_MONITOR_CTL_B2 = %RTbool\n", !!MSR_IA32_VMX_MISC_SMM_MONITOR_CTL_B2(val)));
1127 LogRel(("HM: MSR_IA32_VMX_MISC_VMWRITE_VMEXIT_INFO = %RTbool\n", !!MSR_IA32_VMX_MISC_VMWRITE_VMEXIT_INFO(val)));
1128 LogRel(("HM: MSR_IA32_VMX_MISC_MSEG_ID = %#x\n", MSR_IA32_VMX_MISC_MSEG_ID(val)));
1129
1130 /* Paranoia */
1131 AssertRelease(MSR_IA32_VMX_MISC_MAX_MSR(pVM->hm.s.vmx.Msrs.u64Misc) >= 512);
1132
1133 LogRel(("HM: MSR_IA32_VMX_CR0_FIXED0 = %#RX64\n", pVM->hm.s.vmx.Msrs.u64Cr0Fixed0));
1134 LogRel(("HM: MSR_IA32_VMX_CR0_FIXED1 = %#RX64\n", pVM->hm.s.vmx.Msrs.u64Cr0Fixed1));
1135 LogRel(("HM: MSR_IA32_VMX_CR4_FIXED0 = %#RX64\n", pVM->hm.s.vmx.Msrs.u64Cr4Fixed0));
1136 LogRel(("HM: MSR_IA32_VMX_CR4_FIXED1 = %#RX64\n", pVM->hm.s.vmx.Msrs.u64Cr4Fixed1));
1137
1138 val = pVM->hm.s.vmx.Msrs.u64VmcsEnum;
1139 LogRel(("HM: MSR_IA32_VMX_VMCS_ENUM = %#RX64\n", val));
1140 LogRel(("HM: MSR_IA32_VMX_VMCS_ENUM_HIGHEST_INDEX = %#x\n", MSR_IA32_VMX_VMCS_ENUM_HIGHEST_INDEX(val)));
1141
1142 val = pVM->hm.s.vmx.Msrs.u64Vmfunc;
1143 if (val)
1144 {
1145 LogRel(("HM: MSR_A32_VMX_VMFUNC = %#RX64\n", val));
1146 HMVMX_REPORT_ALLOWED_FEATURE(val, VMX_VMCS_CTRL_VMFUNC_EPTP_SWITCHING);
1147 }
1148
1149 LogRel(("HM: APIC-access page physaddr = %#RHp\n", pVM->hm.s.vmx.HCPhysApicAccess));
1150
1151 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1152 {
1153 LogRel(("HM: VCPU%3d: MSR bitmap physaddr = %#RHp\n", i, pVM->aCpus[i].hm.s.vmx.HCPhysMsrBitmap));
1154 LogRel(("HM: VCPU%3d: VMCS physaddr = %#RHp\n", i, pVM->aCpus[i].hm.s.vmx.HCPhysVmcs));
1155 }
1156
1157 if (pVM->hm.s.vmx.Msrs.VmxProcCtls2.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC2_EPT)
1158 pVM->hm.s.fNestedPaging = pVM->hm.s.fAllowNestedPaging;
1159
1160 if (pVM->hm.s.vmx.Msrs.VmxProcCtls2.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC2_VPID)
1161 pVM->hm.s.vmx.fVpid = pVM->hm.s.vmx.fAllowVpid;
1162
1163 /*
1164 * Disallow RDTSCP in the guest if there is no secondary process-based VM execution controls as otherwise
1165 * RDTSCP would cause a #UD. There might be no CPUs out there where this happens, as RDTSCP was introduced
1166 * in Nehalems and secondary VM exec. controls should be supported in all of them, but nonetheless it's Intel...
1167 */
1168 if ( !(pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_SECONDARY_EXEC_CTRL)
1169 && CPUMGetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_RDTSCP))
1170 {
1171 CPUMClearGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_RDTSCP);
1172 LogRel(("HM: RDTSCP disabled.\n"));
1173 }
1174
1175 /* Unrestricted guest execution also requires EPT. */
1176 if ( pVM->hm.s.vmx.fAllowUnrestricted
1177 && pVM->hm.s.fNestedPaging
1178 && (pVM->hm.s.vmx.Msrs.VmxProcCtls2.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC2_UNRESTRICTED_GUEST))
1179 {
1180 pVM->hm.s.vmx.fUnrestrictedGuest = true;
1181 }
1182
1183 if (!pVM->hm.s.vmx.fUnrestrictedGuest)
1184 {
1185 /* Allocate three pages for the TSS we need for real mode emulation. (2 pages for the IO bitmap) */
1186 rc = PDMR3VmmDevHeapAlloc(pVM, HM_VTX_TOTAL_DEVHEAP_MEM, (RTR3PTR *)&pVM->hm.s.vmx.pRealModeTSS);
1187 if (RT_SUCCESS(rc))
1188 {
1189 /* The IO bitmap starts right after the virtual interrupt redirection bitmap.
1190 Refer Intel spec. 20.3.3 "Software Interrupt Handling in Virtual-8086 mode"
1191 esp. Figure 20-5.*/
1192 ASMMemZero32(pVM->hm.s.vmx.pRealModeTSS, sizeof(*pVM->hm.s.vmx.pRealModeTSS));
1193 pVM->hm.s.vmx.pRealModeTSS->offIoBitmap = sizeof(*pVM->hm.s.vmx.pRealModeTSS);
1194
1195 /* Bit set to 0 means software interrupts are redirected to the
1196 8086 program interrupt handler rather than switching to
1197 protected-mode handler. */
1198 memset(pVM->hm.s.vmx.pRealModeTSS->IntRedirBitmap, 0, sizeof(pVM->hm.s.vmx.pRealModeTSS->IntRedirBitmap));
1199
1200 /* Allow all port IO, so that port IO instructions do not cause
1201 exceptions and would instead cause a VM-exit (based on VT-x's
1202 IO bitmap which we currently configure to always cause an exit). */
1203 memset(pVM->hm.s.vmx.pRealModeTSS + 1, 0, PAGE_SIZE * 2);
1204 *((unsigned char *)pVM->hm.s.vmx.pRealModeTSS + HM_VTX_TSS_SIZE - 2) = 0xff;
1205
1206 /*
1207 * Construct a 1024 element page directory with 4 MB pages for
1208 * the identity mapped page table used in real and protected mode
1209 * without paging with EPT.
1210 */
1211 pVM->hm.s.vmx.pNonPagingModeEPTPageTable = (PX86PD)((char *)pVM->hm.s.vmx.pRealModeTSS + PAGE_SIZE * 3);
1212 for (uint32_t i = 0; i < X86_PG_ENTRIES; i++)
1213 {
1214 pVM->hm.s.vmx.pNonPagingModeEPTPageTable->a[i].u = _4M * i;
1215 pVM->hm.s.vmx.pNonPagingModeEPTPageTable->a[i].u |= X86_PDE4M_P | X86_PDE4M_RW | X86_PDE4M_US
1216 | X86_PDE4M_A | X86_PDE4M_D | X86_PDE4M_PS
1217 | X86_PDE4M_G;
1218 }
1219
1220 /* We convert it here every time as pci regions could be reconfigured. */
1221 rc = PDMVmmDevHeapR3ToGCPhys(pVM, pVM->hm.s.vmx.pRealModeTSS, &GCPhys);
1222 AssertRCReturn(rc, rc);
1223 LogRel(("HM: Real Mode TSS guest physaddr = %#RGp\n", GCPhys));
1224
1225 rc = PDMVmmDevHeapR3ToGCPhys(pVM, pVM->hm.s.vmx.pNonPagingModeEPTPageTable, &GCPhys);
1226 AssertRCReturn(rc, rc);
1227 LogRel(("HM: Non-Paging Mode EPT CR3 = %#RGp\n", GCPhys));
1228 }
1229 else
1230 {
1231 /** @todo This cannot possibly work, there are other places which assumes
1232 * this allocation cannot fail (see HMR3CanExecuteGuest()). Make this
1233 * a failure case. */
1234 LogRel(("HM: No real mode VT-x support (PDMR3VMMDevHeapAlloc returned %Rrc)\n", rc));
1235 pVM->hm.s.vmx.pRealModeTSS = NULL;
1236 pVM->hm.s.vmx.pNonPagingModeEPTPageTable = NULL;
1237 }
1238 }
1239
1240 /*
1241 * Call ring-0 to set up the VM.
1242 */
1243 rc = SUPR3CallVMMR0Ex(pVM->pVMR0, 0 /*idCpu*/, VMMR0_DO_HM_SETUP_VM, 0, NULL);
1244 if (rc != VINF_SUCCESS)
1245 {
1246 AssertMsgFailed(("%Rrc\n", rc));
1247 LogRel(("HM: VMX setup failed with rc=%Rrc!\n", rc));
1248 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1249 {
1250 PVMCPU pVCpu = &pVM->aCpus[i];
1251 LogRel(("HM: CPU[%u] Last instruction error %#x\n", i, pVCpu->hm.s.vmx.LastError.u32InstrError));
1252 LogRel(("HM: CPU[%u] HM error %#x (%u)\n", i, pVCpu->hm.s.u32HMError, pVCpu->hm.s.u32HMError));
1253 }
1254 return VMSetError(pVM, rc, RT_SRC_POS, "VT-x setup failed: %Rrc", rc);
1255 }
1256
1257 LogRel(("HM: VMX enabled!\n"));
1258 pVM->hm.s.vmx.fEnabled = true;
1259
1260 hmR3DisableRawMode(pVM); /** @todo make this go away! */
1261
1262 /*
1263 * Change the CPU features.
1264 */
1265 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_SEP);
1266 if (pVM->hm.s.fAllow64BitGuests)
1267 {
1268 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_PAE);
1269 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_LONG_MODE);
1270 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_SYSCALL); /* 64 bits only on Intel CPUs */
1271 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_LAHF);
1272 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_NX);
1273#if 0 /** @todo r=bird: This ain't making any sense whatsoever. */
1274#if RT_ARCH_X86
1275 if ( !CPUMGetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_PAE)
1276 || !(pVM->hm.s.vmx.u64HostEfer & MSR_K6_EFER_NXE))
1277 LogRel(("NX is only supported for 64-bit guests!\n"));
1278#endif
1279#endif
1280 }
1281 /* Turn on NXE if PAE has been enabled *and* the host has turned on NXE
1282 (we reuse the host EFER in the switcher). */
1283 /** @todo this needs to be fixed properly!! */
1284 else if ( CPUMGetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_PAE)
1285 && (pVM->hm.s.vmx.u64HostEfer & MSR_K6_EFER_NXE))
1286 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_NX);
1287 else
1288 LogRel(("HM: NX not supported by the host.\n"));
1289
1290 /*
1291 * Log configuration details.
1292 */
1293 LogRel((pVM->hm.s.fAllow64BitGuests
1294 ? "HM: Guest support: 32-bit and 64-bit.\n"
1295 : "HM: Guest support: 32-bit only.\n"));
1296 if (pVM->hm.s.fNestedPaging)
1297 {
1298 LogRel(("HM: Nested paging enabled!\n"));
1299 if (pVM->hm.s.vmx.enmFlushEpt == VMX_FLUSH_EPT_SINGLE_CONTEXT)
1300 LogRel(("HM: EPT flush type = VMX_FLUSH_EPT_SINGLE_CONTEXT\n"));
1301 else if (pVM->hm.s.vmx.enmFlushEpt == VMX_FLUSH_EPT_ALL_CONTEXTS)
1302 LogRel(("HM: EPT flush type = VMX_FLUSH_EPT_ALL_CONTEXTS\n"));
1303 else if (pVM->hm.s.vmx.enmFlushEpt == VMX_FLUSH_EPT_NOT_SUPPORTED)
1304 LogRel(("HM: EPT flush type = VMX_FLUSH_EPT_NOT_SUPPORTED\n"));
1305 else
1306 LogRel(("HM: EPT flush type = %d\n", pVM->hm.s.vmx.enmFlushEpt));
1307
1308 if (pVM->hm.s.vmx.fUnrestrictedGuest)
1309 LogRel(("HM: Unrestricted guest execution enabled!\n"));
1310
1311#if HC_ARCH_BITS == 64
1312 if (pVM->hm.s.fLargePages)
1313 {
1314 /* Use large (2 MB) pages for our EPT PDEs where possible. */
1315 PGMSetLargePageUsage(pVM, true);
1316 LogRel(("HM: Large page support enabled!\n"));
1317 }
1318#endif
1319 }
1320 else
1321 Assert(!pVM->hm.s.vmx.fUnrestrictedGuest);
1322
1323 if (pVM->hm.s.vmx.fVpid)
1324 {
1325 LogRel(("HM: VPID enabled!\n"));
1326 if (pVM->hm.s.vmx.enmFlushVpid == VMX_FLUSH_VPID_INDIV_ADDR)
1327 LogRel(("HM: VPID flush type = VMX_FLUSH_VPID_INDIV_ADDR\n"));
1328 else if (pVM->hm.s.vmx.enmFlushVpid == VMX_FLUSH_VPID_SINGLE_CONTEXT)
1329 LogRel(("HM: VPID flush type = VMX_FLUSH_VPID_SINGLE_CONTEXT\n"));
1330 else if (pVM->hm.s.vmx.enmFlushVpid == VMX_FLUSH_VPID_ALL_CONTEXTS)
1331 LogRel(("HM: VPID flush type = VMX_FLUSH_VPID_ALL_CONTEXTS\n"));
1332 else if (pVM->hm.s.vmx.enmFlushVpid == VMX_FLUSH_VPID_SINGLE_CONTEXT_RETAIN_GLOBALS)
1333 LogRel(("HM: VPID flush type = VMX_FLUSH_VPID_SINGLE_CONTEXT_RETAIN_GLOBALS\n"));
1334 else
1335 LogRel(("HM: VPID flush type = %d\n", pVM->hm.s.vmx.enmFlushVpid));
1336 }
1337 else if (pVM->hm.s.vmx.enmFlushVpid == VMX_FLUSH_VPID_NOT_SUPPORTED)
1338 LogRel(("HM: Ignoring VPID capabilities of CPU.\n"));
1339
1340 /*
1341 * Check for preemption timer config override and log the state of it.
1342 */
1343 if (pVM->hm.s.vmx.fUsePreemptTimer)
1344 {
1345 PCFGMNODE pCfgHm = CFGMR3GetChild(CFGMR3GetRoot(pVM), "HM");
1346 rc = CFGMR3QueryBoolDef(pCfgHm, "UsePreemptTimer", &pVM->hm.s.vmx.fUsePreemptTimer, true);
1347 AssertLogRelRCReturn(rc, rc);
1348 }
1349 if (pVM->hm.s.vmx.fUsePreemptTimer)
1350 LogRel(("HM: VMX-preemption timer enabled (cPreemptTimerShift=%u).\n", pVM->hm.s.vmx.cPreemptTimerShift));
1351 else
1352 LogRel(("HM: VMX-preemption timer disabled.\n"));
1353
1354 return VINF_SUCCESS;
1355}
1356
1357
1358/**
1359 * Finish AMD-V initialization (after ring-0 init).
1360 *
1361 * @returns VBox status code.
1362 * @param pVM The cross context VM structure.
1363 */
1364static int hmR3InitFinalizeR0Amd(PVM pVM)
1365{
1366 Log(("pVM->hm.s.svm.fSupported = %d\n", pVM->hm.s.svm.fSupported));
1367
1368 LogRel(("HM: Using AMD-V implementation 2.0!\n"));
1369
1370 uint32_t u32Family;
1371 uint32_t u32Model;
1372 uint32_t u32Stepping;
1373 if (HMAmdIsSubjectToErratum170(&u32Family, &u32Model, &u32Stepping))
1374 LogRel(("HM: AMD Cpu with erratum 170 family %#x model %#x stepping %#x\n", u32Family, u32Model, u32Stepping));
1375 LogRel(("HM: CPUID 0x80000001.u32AMDFeatureECX = %#RX32\n", pVM->hm.s.cpuid.u32AMDFeatureECX));
1376 LogRel(("HM: CPUID 0x80000001.u32AMDFeatureEDX = %#RX32\n", pVM->hm.s.cpuid.u32AMDFeatureEDX));
1377 LogRel(("HM: AMD HWCR MSR = %#RX64\n", pVM->hm.s.svm.u64MsrHwcr));
1378 LogRel(("HM: AMD-V revision = %#x\n", pVM->hm.s.svm.u32Rev));
1379 LogRel(("HM: AMD-V max ASID = %RU32\n", pVM->hm.s.uMaxAsid));
1380 LogRel(("HM: AMD-V features = %#x\n", pVM->hm.s.svm.u32Features));
1381
1382 /*
1383 * Enumerate AMD-V features.
1384 */
1385 static const struct { uint32_t fFlag; const char *pszName; } s_aSvmFeatures[] =
1386 {
1387#define HMSVM_REPORT_FEATURE(a_Define) { a_Define, #a_Define }
1388 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_NESTED_PAGING),
1389 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_LBR_VIRT),
1390 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_SVM_LOCK),
1391 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_NRIP_SAVE),
1392 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_TSC_RATE_MSR),
1393 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_VMCB_CLEAN),
1394 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_FLUSH_BY_ASID),
1395 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_DECODE_ASSIST),
1396 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_PAUSE_FILTER),
1397 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_PAUSE_FILTER_THRESHOLD),
1398 HMSVM_REPORT_FEATURE(AMD_CPUID_SVM_FEATURE_EDX_AVIC),
1399#undef HMSVM_REPORT_FEATURE
1400 };
1401
1402 uint32_t fSvmFeatures = pVM->hm.s.svm.u32Features;
1403 for (unsigned i = 0; i < RT_ELEMENTS(s_aSvmFeatures); i++)
1404 if (fSvmFeatures & s_aSvmFeatures[i].fFlag)
1405 {
1406 LogRel(("HM: %s\n", s_aSvmFeatures[i].pszName));
1407 fSvmFeatures &= ~s_aSvmFeatures[i].fFlag;
1408 }
1409 if (fSvmFeatures)
1410 for (unsigned iBit = 0; iBit < 32; iBit++)
1411 if (RT_BIT_32(iBit) & fSvmFeatures)
1412 LogRel(("HM: Reserved bit %u\n", iBit));
1413
1414 /*
1415 * Adjust feature(s).
1416 */
1417 if (pVM->hm.s.svm.u32Features & AMD_CPUID_SVM_FEATURE_EDX_NESTED_PAGING)
1418 pVM->hm.s.fNestedPaging = pVM->hm.s.fAllowNestedPaging;
1419
1420 /*
1421 * Call ring-0 to set up the VM.
1422 */
1423 int rc = SUPR3CallVMMR0Ex(pVM->pVMR0, 0 /*idCpu*/, VMMR0_DO_HM_SETUP_VM, 0, NULL);
1424 if (rc != VINF_SUCCESS)
1425 {
1426 AssertMsgFailed(("%Rrc\n", rc));
1427 LogRel(("HM: AMD-V setup failed with rc=%Rrc!\n", rc));
1428 return VMSetError(pVM, rc, RT_SRC_POS, "AMD-V setup failed: %Rrc", rc);
1429 }
1430
1431 LogRel(("HM: AMD-V enabled!\n"));
1432 pVM->hm.s.svm.fEnabled = true;
1433
1434 if (pVM->hm.s.fNestedPaging)
1435 {
1436 LogRel(("HM: Nested paging enabled!\n"));
1437
1438 /*
1439 * Enable large pages (2 MB) if applicable.
1440 */
1441#if HC_ARCH_BITS == 64
1442 if (pVM->hm.s.fLargePages)
1443 {
1444 PGMSetLargePageUsage(pVM, true);
1445 LogRel(("HM: Large page support enabled!\n"));
1446 }
1447#endif
1448 }
1449
1450 hmR3DisableRawMode(pVM);
1451
1452 /*
1453 * Change the CPU features.
1454 */
1455 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_SEP);
1456 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_SYSCALL);
1457 if (pVM->hm.s.fAllow64BitGuests)
1458 {
1459 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_PAE);
1460 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_LONG_MODE);
1461 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_NX);
1462 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_LAHF);
1463 }
1464 /* Turn on NXE if PAE has been enabled. */
1465 else if (CPUMGetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_PAE))
1466 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_NX);
1467
1468 LogRel(("HM: TPR Patching %s.\n", (pVM->hm.s.fTRPPatchingAllowed) ? "enabled" : "disabled"));
1469
1470 LogRel((pVM->hm.s.fAllow64BitGuests
1471 ? "HM: Guest support: 32-bit and 64-bit.\n"
1472 : "HM: Guest support: 32-bit only.\n"));
1473
1474 return VINF_SUCCESS;
1475}
1476
1477
1478/**
1479 * Applies relocations to data and code managed by this
1480 * component. This function will be called at init and
1481 * whenever the VMM need to relocate it self inside the GC.
1482 *
1483 * @param pVM The VM.
1484 */
1485VMMR3_INT_DECL(void) HMR3Relocate(PVM pVM)
1486{
1487 Log(("HMR3Relocate to %RGv\n", MMHyperGetArea(pVM, 0)));
1488
1489 /* Fetch the current paging mode during the relocate callback during state loading. */
1490 if (VMR3GetState(pVM) == VMSTATE_LOADING)
1491 {
1492 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1493 {
1494 PVMCPU pVCpu = &pVM->aCpus[i];
1495 pVCpu->hm.s.enmShadowMode = PGMGetShadowMode(pVCpu);
1496 }
1497 }
1498#if HC_ARCH_BITS == 32 && defined(VBOX_ENABLE_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
1499 if (HMIsEnabled(pVM))
1500 {
1501 switch (PGMGetHostMode(pVM))
1502 {
1503 case PGMMODE_32_BIT:
1504 pVM->hm.s.pfnHost32ToGuest64R0 = VMMR3GetHostToGuestSwitcher(pVM, VMMSWITCHER_32_TO_AMD64);
1505 break;
1506
1507 case PGMMODE_PAE:
1508 case PGMMODE_PAE_NX:
1509 pVM->hm.s.pfnHost32ToGuest64R0 = VMMR3GetHostToGuestSwitcher(pVM, VMMSWITCHER_PAE_TO_AMD64);
1510 break;
1511
1512 default:
1513 AssertFailed();
1514 break;
1515 }
1516 }
1517#endif
1518 return;
1519}
1520
1521
1522/**
1523 * Notification callback which is called whenever there is a chance that a CR3
1524 * value might have changed.
1525 *
1526 * This is called by PGM.
1527 *
1528 * @param pVM Pointer to the VM.
1529 * @param pVCpu Pointer to the VMCPU.
1530 * @param enmShadowMode New shadow paging mode.
1531 * @param enmGuestMode New guest paging mode.
1532 */
1533VMMR3_INT_DECL(void) HMR3PagingModeChanged(PVM pVM, PVMCPU pVCpu, PGMMODE enmShadowMode, PGMMODE enmGuestMode)
1534{
1535 /* Ignore page mode changes during state loading. */
1536 if (VMR3GetState(pVCpu->pVMR3) == VMSTATE_LOADING)
1537 return;
1538
1539 pVCpu->hm.s.enmShadowMode = enmShadowMode;
1540
1541 /*
1542 * If the guest left protected mode VMX execution, we'll have to be
1543 * extra careful if/when the guest switches back to protected mode.
1544 */
1545 if (enmGuestMode == PGMMODE_REAL)
1546 {
1547 Log(("HMR3PagingModeChanged indicates real mode execution\n"));
1548 pVCpu->hm.s.vmx.fWasInRealMode = true;
1549 }
1550
1551 /** @todo r=ramshankar: Disabling for now. If nothing breaks remove it
1552 * eventually. (Test platforms that use the cache ofc). */
1553#if 0
1554#ifdef VMX_USE_CACHED_VMCS_ACCESSES
1555 /* Reset the contents of the read cache. */
1556 PVMCSCACHE pCache = &pVCpu->hm.s.vmx.VMCSCache;
1557 for (unsigned j = 0; j < pCache->Read.cValidEntries; j++)
1558 pCache->Read.aFieldVal[j] = 0;
1559#endif
1560#endif
1561}
1562
1563
1564/**
1565 * Terminates the HM.
1566 *
1567 * Termination means cleaning up and freeing all resources,
1568 * the VM itself is, at this point, powered off or suspended.
1569 *
1570 * @returns VBox status code.
1571 * @param pVM Pointer to the VM.
1572 */
1573VMMR3_INT_DECL(int) HMR3Term(PVM pVM)
1574{
1575 if (pVM->hm.s.vmx.pRealModeTSS)
1576 {
1577 PDMR3VmmDevHeapFree(pVM, pVM->hm.s.vmx.pRealModeTSS);
1578 pVM->hm.s.vmx.pRealModeTSS = 0;
1579 }
1580 hmR3TermCPU(pVM);
1581 return 0;
1582}
1583
1584
1585/**
1586 * Terminates the per-VCPU HM.
1587 *
1588 * @returns VBox status code.
1589 * @param pVM Pointer to the VM.
1590 */
1591static int hmR3TermCPU(PVM pVM)
1592{
1593 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1594 {
1595 PVMCPU pVCpu = &pVM->aCpus[i]; NOREF(pVCpu);
1596
1597#ifdef VBOX_WITH_STATISTICS
1598 if (pVCpu->hm.s.paStatExitReason)
1599 {
1600 MMHyperFree(pVM, pVCpu->hm.s.paStatExitReason);
1601 pVCpu->hm.s.paStatExitReason = NULL;
1602 pVCpu->hm.s.paStatExitReasonR0 = NIL_RTR0PTR;
1603 }
1604 if (pVCpu->hm.s.paStatInjectedIrqs)
1605 {
1606 MMHyperFree(pVM, pVCpu->hm.s.paStatInjectedIrqs);
1607 pVCpu->hm.s.paStatInjectedIrqs = NULL;
1608 pVCpu->hm.s.paStatInjectedIrqsR0 = NIL_RTR0PTR;
1609 }
1610#endif
1611
1612#ifdef VBOX_WITH_CRASHDUMP_MAGIC
1613 memset(pVCpu->hm.s.vmx.VMCSCache.aMagic, 0, sizeof(pVCpu->hm.s.vmx.VMCSCache.aMagic));
1614 pVCpu->hm.s.vmx.VMCSCache.uMagic = 0;
1615 pVCpu->hm.s.vmx.VMCSCache.uPos = 0xffffffff;
1616#endif
1617 }
1618 return 0;
1619}
1620
1621
1622/**
1623 * Resets a virtual CPU.
1624 *
1625 * Used by HMR3Reset and CPU hot plugging.
1626 *
1627 * @param pVCpu The CPU to reset.
1628 */
1629VMMR3_INT_DECL(void) HMR3ResetCpu(PVMCPU pVCpu)
1630{
1631 /* Sync. entire state on VM reset R0-reentry. It's safe to reset
1632 the HM flags here, all other EMTs are in ring-3. See VMR3Reset(). */
1633 VMCPU_HMCF_RESET_TO(pVCpu, HM_CHANGED_HOST_CONTEXT | HM_CHANGED_ALL_GUEST);
1634
1635 pVCpu->hm.s.vmx.u32CR0Mask = 0;
1636 pVCpu->hm.s.vmx.u32CR4Mask = 0;
1637 pVCpu->hm.s.fActive = false;
1638 pVCpu->hm.s.Event.fPending = false;
1639 pVCpu->hm.s.vmx.fWasInRealMode = true;
1640
1641 /* Reset the contents of the read cache. */
1642 PVMCSCACHE pCache = &pVCpu->hm.s.vmx.VMCSCache;
1643 for (unsigned j = 0; j < pCache->Read.cValidEntries; j++)
1644 pCache->Read.aFieldVal[j] = 0;
1645
1646#ifdef VBOX_WITH_CRASHDUMP_MAGIC
1647 /* Magic marker for searching in crash dumps. */
1648 strcpy((char *)pCache->aMagic, "VMCSCACHE Magic");
1649 pCache->uMagic = UINT64_C(0xDEADBEEFDEADBEEF);
1650#endif
1651}
1652
1653
1654/**
1655 * The VM is being reset.
1656 *
1657 * For the HM component this means that any GDT/LDT/TSS monitors
1658 * needs to be removed.
1659 *
1660 * @param pVM Pointer to the VM.
1661 */
1662VMMR3_INT_DECL(void) HMR3Reset(PVM pVM)
1663{
1664 LogFlow(("HMR3Reset:\n"));
1665
1666 if (HMIsEnabled(pVM))
1667 hmR3DisableRawMode(pVM);
1668
1669 for (VMCPUID i = 0; i < pVM->cCpus; i++)
1670 {
1671 PVMCPU pVCpu = &pVM->aCpus[i];
1672
1673 HMR3ResetCpu(pVCpu);
1674 }
1675
1676 /* Clear all patch information. */
1677 pVM->hm.s.pGuestPatchMem = 0;
1678 pVM->hm.s.pFreeGuestPatchMem = 0;
1679 pVM->hm.s.cbGuestPatchMem = 0;
1680 pVM->hm.s.cPatches = 0;
1681 pVM->hm.s.PatchTree = 0;
1682 pVM->hm.s.fTPRPatchingActive = false;
1683 ASMMemZero32(pVM->hm.s.aPatches, sizeof(pVM->hm.s.aPatches));
1684}
1685
1686
1687/**
1688 * Callback to patch a TPR instruction (vmmcall or mov cr8).
1689 *
1690 * @returns VBox strict status code.
1691 * @param pVM Pointer to the VM.
1692 * @param pVCpu The VMCPU for the EMT we're being called on.
1693 * @param pvUser Unused.
1694 */
1695DECLCALLBACK(VBOXSTRICTRC) hmR3RemovePatches(PVM pVM, PVMCPU pVCpu, void *pvUser)
1696{
1697 VMCPUID idCpu = (VMCPUID)(uintptr_t)pvUser;
1698
1699 /* Only execute the handler on the VCPU the original patch request was issued. */
1700 if (pVCpu->idCpu != idCpu)
1701 return VINF_SUCCESS;
1702
1703 Log(("hmR3RemovePatches\n"));
1704 for (unsigned i = 0; i < pVM->hm.s.cPatches; i++)
1705 {
1706 uint8_t abInstr[15];
1707 PHMTPRPATCH pPatch = &pVM->hm.s.aPatches[i];
1708 RTGCPTR pInstrGC = (RTGCPTR)pPatch->Core.Key;
1709 int rc;
1710
1711#ifdef LOG_ENABLED
1712 char szOutput[256];
1713
1714 rc = DBGFR3DisasInstrEx(pVM->pUVM, pVCpu->idCpu, CPUMGetGuestCS(pVCpu), pInstrGC, DBGF_DISAS_FLAGS_DEFAULT_MODE,
1715 szOutput, sizeof(szOutput), NULL);
1716 if (RT_SUCCESS(rc))
1717 Log(("Patched instr: %s\n", szOutput));
1718#endif
1719
1720 /* Check if the instruction is still the same. */
1721 rc = PGMPhysSimpleReadGCPtr(pVCpu, abInstr, pInstrGC, pPatch->cbNewOp);
1722 if (rc != VINF_SUCCESS)
1723 {
1724 Log(("Patched code removed? (rc=%Rrc0\n", rc));
1725 continue; /* swapped out or otherwise removed; skip it. */
1726 }
1727
1728 if (memcmp(abInstr, pPatch->aNewOpcode, pPatch->cbNewOp))
1729 {
1730 Log(("Patched instruction was changed! (rc=%Rrc0\n", rc));
1731 continue; /* skip it. */
1732 }
1733
1734 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pInstrGC, pPatch->aOpcode, pPatch->cbOp);
1735 AssertRC(rc);
1736
1737#ifdef LOG_ENABLED
1738 rc = DBGFR3DisasInstrEx(pVM->pUVM, pVCpu->idCpu, CPUMGetGuestCS(pVCpu), pInstrGC, DBGF_DISAS_FLAGS_DEFAULT_MODE,
1739 szOutput, sizeof(szOutput), NULL);
1740 if (RT_SUCCESS(rc))
1741 Log(("Original instr: %s\n", szOutput));
1742#endif
1743 }
1744 pVM->hm.s.cPatches = 0;
1745 pVM->hm.s.PatchTree = 0;
1746 pVM->hm.s.pFreeGuestPatchMem = pVM->hm.s.pGuestPatchMem;
1747 pVM->hm.s.fTPRPatchingActive = false;
1748 return VINF_SUCCESS;
1749}
1750
1751
1752/**
1753 * Worker for enabling patching in a VT-x/AMD-V guest.
1754 *
1755 * @returns VBox status code.
1756 * @param pVM Pointer to the VM.
1757 * @param idCpu VCPU to execute hmR3RemovePatches on.
1758 * @param pPatchMem Patch memory range.
1759 * @param cbPatchMem Size of the memory range.
1760 */
1761static int hmR3EnablePatching(PVM pVM, VMCPUID idCpu, RTRCPTR pPatchMem, unsigned cbPatchMem)
1762{
1763 int rc = VMMR3EmtRendezvous(pVM, VMMEMTRENDEZVOUS_FLAGS_TYPE_ONE_BY_ONE, hmR3RemovePatches, (void *)(uintptr_t)idCpu);
1764 AssertRC(rc);
1765
1766 pVM->hm.s.pGuestPatchMem = pPatchMem;
1767 pVM->hm.s.pFreeGuestPatchMem = pPatchMem;
1768 pVM->hm.s.cbGuestPatchMem = cbPatchMem;
1769 return VINF_SUCCESS;
1770}
1771
1772
1773/**
1774 * Enable patching in a VT-x/AMD-V guest
1775 *
1776 * @returns VBox status code.
1777 * @param pVM Pointer to the VM.
1778 * @param pPatchMem Patch memory range.
1779 * @param cbPatchMem Size of the memory range.
1780 */
1781VMMR3_INT_DECL(int) HMR3EnablePatching(PVM pVM, RTGCPTR pPatchMem, unsigned cbPatchMem)
1782{
1783 VM_ASSERT_EMT(pVM);
1784 Log(("HMR3EnablePatching %RGv size %x\n", pPatchMem, cbPatchMem));
1785 if (pVM->cCpus > 1)
1786 {
1787 /* We own the IOM lock here and could cause a deadlock by waiting for a VCPU that is blocking on the IOM lock. */
1788 int rc = VMR3ReqCallNoWait(pVM, VMCPUID_ANY_QUEUE,
1789 (PFNRT)hmR3EnablePatching, 4, pVM, VMMGetCpuId(pVM), (RTRCPTR)pPatchMem, cbPatchMem);
1790 AssertRC(rc);
1791 return rc;
1792 }
1793 return hmR3EnablePatching(pVM, VMMGetCpuId(pVM), (RTRCPTR)pPatchMem, cbPatchMem);
1794}
1795
1796
1797/**
1798 * Disable patching in a VT-x/AMD-V guest.
1799 *
1800 * @returns VBox status code.
1801 * @param pVM Pointer to the VM.
1802 * @param pPatchMem Patch memory range.
1803 * @param cbPatchMem Size of the memory range.
1804 */
1805VMMR3_INT_DECL(int) HMR3DisablePatching(PVM pVM, RTGCPTR pPatchMem, unsigned cbPatchMem)
1806{
1807 Log(("HMR3DisablePatching %RGv size %x\n", pPatchMem, cbPatchMem));
1808
1809 Assert(pVM->hm.s.pGuestPatchMem == pPatchMem);
1810 Assert(pVM->hm.s.cbGuestPatchMem == cbPatchMem);
1811
1812 /* @todo Potential deadlock when other VCPUs are waiting on the IOM lock (we own it)!! */
1813 int rc = VMMR3EmtRendezvous(pVM, VMMEMTRENDEZVOUS_FLAGS_TYPE_ONE_BY_ONE, hmR3RemovePatches,
1814 (void *)(uintptr_t)VMMGetCpuId(pVM));
1815 AssertRC(rc);
1816
1817 pVM->hm.s.pGuestPatchMem = 0;
1818 pVM->hm.s.pFreeGuestPatchMem = 0;
1819 pVM->hm.s.cbGuestPatchMem = 0;
1820 pVM->hm.s.fTPRPatchingActive = false;
1821 return VINF_SUCCESS;
1822}
1823
1824
1825/**
1826 * Callback to patch a TPR instruction (vmmcall or mov cr8).
1827 *
1828 * @returns VBox strict status code.
1829 * @param pVM Pointer to the VM.
1830 * @param pVCpu The VMCPU for the EMT we're being called on.
1831 * @param pvUser User specified CPU context.
1832 *
1833 */
1834DECLCALLBACK(VBOXSTRICTRC) hmR3ReplaceTprInstr(PVM pVM, PVMCPU pVCpu, void *pvUser)
1835{
1836 /*
1837 * Only execute the handler on the VCPU the original patch request was
1838 * issued. (The other CPU(s) might not yet have switched to protected
1839 * mode, nor have the correct memory context.)
1840 */
1841 VMCPUID idCpu = (VMCPUID)(uintptr_t)pvUser;
1842 if (pVCpu->idCpu != idCpu)
1843 return VINF_SUCCESS;
1844
1845 /*
1846 * We're racing other VCPUs here, so don't try patch the instruction twice
1847 * and make sure there is still room for our patch record.
1848 */
1849 PCPUMCTX pCtx = CPUMQueryGuestCtxPtr(pVCpu);
1850 PHMTPRPATCH pPatch = (PHMTPRPATCH)RTAvloU32Get(&pVM->hm.s.PatchTree, (AVLOU32KEY)pCtx->eip);
1851 if (pPatch)
1852 {
1853 Log(("hmR3ReplaceTprInstr: already patched %RGv\n", pCtx->rip));
1854 return VINF_SUCCESS;
1855 }
1856 uint32_t const idx = pVM->hm.s.cPatches;
1857 if (idx >= RT_ELEMENTS(pVM->hm.s.aPatches))
1858 {
1859 Log(("hmR3ReplaceTprInstr: no available patch slots (%RGv)\n", pCtx->rip));
1860 return VINF_SUCCESS;
1861 }
1862 pPatch = &pVM->hm.s.aPatches[idx];
1863
1864 Log(("hmR3ReplaceTprInstr: rip=%RGv idxPatch=%u\n", pCtx->rip, idx));
1865
1866 /*
1867 * Disassembler the instruction and get cracking.
1868 */
1869 DBGFR3_DISAS_INSTR_CUR_LOG(pVCpu, "hmR3ReplaceTprInstr");
1870 PDISCPUSTATE pDis = &pVCpu->hm.s.DisState;
1871 uint32_t cbOp;
1872 int rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, &cbOp);
1873 AssertRC(rc);
1874 if ( rc == VINF_SUCCESS
1875 && pDis->pCurInstr->uOpcode == OP_MOV
1876 && cbOp >= 3)
1877 {
1878 static uint8_t const s_abVMMCall[3] = { 0x0f, 0x01, 0xd9 };
1879
1880 rc = PGMPhysSimpleReadGCPtr(pVCpu, pPatch->aOpcode, pCtx->rip, cbOp);
1881 AssertRC(rc);
1882
1883 pPatch->cbOp = cbOp;
1884
1885 if (pDis->Param1.fUse == DISUSE_DISPLACEMENT32)
1886 {
1887 /* write. */
1888 if (pDis->Param2.fUse == DISUSE_REG_GEN32)
1889 {
1890 pPatch->enmType = HMTPRINSTR_WRITE_REG;
1891 pPatch->uSrcOperand = pDis->Param2.Base.idxGenReg;
1892 Log(("hmR3ReplaceTprInstr: HMTPRINSTR_WRITE_REG %u\n", pDis->Param2.Base.idxGenReg));
1893 }
1894 else
1895 {
1896 Assert(pDis->Param2.fUse == DISUSE_IMMEDIATE32);
1897 pPatch->enmType = HMTPRINSTR_WRITE_IMM;
1898 pPatch->uSrcOperand = pDis->Param2.uValue;
1899 Log(("hmR3ReplaceTprInstr: HMTPRINSTR_WRITE_IMM %#llx\n", pDis->Param2.uValue));
1900 }
1901 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pCtx->rip, s_abVMMCall, sizeof(s_abVMMCall));
1902 AssertRC(rc);
1903
1904 memcpy(pPatch->aNewOpcode, s_abVMMCall, sizeof(s_abVMMCall));
1905 pPatch->cbNewOp = sizeof(s_abVMMCall);
1906 }
1907 else
1908 {
1909 /*
1910 * TPR Read.
1911 *
1912 * Found:
1913 * mov eax, dword [fffe0080] (5 bytes)
1914 * Check if next instruction is:
1915 * shr eax, 4
1916 */
1917 Assert(pDis->Param1.fUse == DISUSE_REG_GEN32);
1918
1919 uint8_t const idxMmioReg = pDis->Param1.Base.idxGenReg;
1920 uint8_t const cbOpMmio = cbOp;
1921 uint64_t const uSavedRip = pCtx->rip;
1922
1923 pCtx->rip += cbOp;
1924 rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, &cbOp);
1925 DBGFR3_DISAS_INSTR_CUR_LOG(pVCpu, "Following read");
1926 pCtx->rip = uSavedRip;
1927
1928 if ( rc == VINF_SUCCESS
1929 && pDis->pCurInstr->uOpcode == OP_SHR
1930 && pDis->Param1.fUse == DISUSE_REG_GEN32
1931 && pDis->Param1.Base.idxGenReg == idxMmioReg
1932 && pDis->Param2.fUse == DISUSE_IMMEDIATE8
1933 && pDis->Param2.uValue == 4
1934 && cbOpMmio + cbOp < sizeof(pVM->hm.s.aPatches[idx].aOpcode))
1935 {
1936 uint8_t abInstr[15];
1937
1938 /* Replacing the two instructions above with an AMD-V specific lock-prefixed 32-bit MOV CR8 instruction so as to
1939 access CR8 in 32-bit mode and not cause a #VMEXIT. */
1940 rc = PGMPhysSimpleReadGCPtr(pVCpu, &pPatch->aOpcode, pCtx->rip, cbOpMmio + cbOp);
1941 AssertRC(rc);
1942
1943 pPatch->cbOp = cbOpMmio + cbOp;
1944
1945 /* 0xF0, 0x0F, 0x20, 0xC0 = mov eax, cr8 */
1946 abInstr[0] = 0xF0;
1947 abInstr[1] = 0x0F;
1948 abInstr[2] = 0x20;
1949 abInstr[3] = 0xC0 | pDis->Param1.Base.idxGenReg;
1950 for (unsigned i = 4; i < pPatch->cbOp; i++)
1951 abInstr[i] = 0x90; /* nop */
1952
1953 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pCtx->rip, abInstr, pPatch->cbOp);
1954 AssertRC(rc);
1955
1956 memcpy(pPatch->aNewOpcode, abInstr, pPatch->cbOp);
1957 pPatch->cbNewOp = pPatch->cbOp;
1958
1959 Log(("Acceptable read/shr candidate!\n"));
1960 pPatch->enmType = HMTPRINSTR_READ_SHR4;
1961 }
1962 else
1963 {
1964 pPatch->enmType = HMTPRINSTR_READ;
1965 pPatch->uDstOperand = idxMmioReg;
1966
1967 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pCtx->rip, s_abVMMCall, sizeof(s_abVMMCall));
1968 AssertRC(rc);
1969
1970 memcpy(pPatch->aNewOpcode, s_abVMMCall, sizeof(s_abVMMCall));
1971 pPatch->cbNewOp = sizeof(s_abVMMCall);
1972 Log(("hmR3ReplaceTprInstr: HMTPRINSTR_READ %u\n", pPatch->uDstOperand));
1973 }
1974 }
1975
1976 pPatch->Core.Key = pCtx->eip;
1977 rc = RTAvloU32Insert(&pVM->hm.s.PatchTree, &pPatch->Core);
1978 AssertRC(rc);
1979
1980 pVM->hm.s.cPatches++;
1981 STAM_COUNTER_INC(&pVM->hm.s.StatTprReplaceSuccess);
1982 return VINF_SUCCESS;
1983 }
1984
1985 /*
1986 * Save invalid patch, so we will not try again.
1987 */
1988 Log(("hmR3ReplaceTprInstr: Failed to patch instr!\n"));
1989 pPatch->Core.Key = pCtx->eip;
1990 pPatch->enmType = HMTPRINSTR_INVALID;
1991 rc = RTAvloU32Insert(&pVM->hm.s.PatchTree, &pPatch->Core);
1992 AssertRC(rc);
1993 pVM->hm.s.cPatches++;
1994 STAM_COUNTER_INC(&pVM->hm.s.StatTprReplaceFailure);
1995 return VINF_SUCCESS;
1996}
1997
1998
1999/**
2000 * Callback to patch a TPR instruction (jump to generated code).
2001 *
2002 * @returns VBox strict status code.
2003 * @param pVM Pointer to the VM.
2004 * @param pVCpu The VMCPU for the EMT we're being called on.
2005 * @param pvUser User specified CPU context.
2006 *
2007 */
2008DECLCALLBACK(VBOXSTRICTRC) hmR3PatchTprInstr(PVM pVM, PVMCPU pVCpu, void *pvUser)
2009{
2010 /*
2011 * Only execute the handler on the VCPU the original patch request was
2012 * issued. (The other CPU(s) might not yet have switched to protected
2013 * mode, nor have the correct memory context.)
2014 */
2015 VMCPUID idCpu = (VMCPUID)(uintptr_t)pvUser;
2016 if (pVCpu->idCpu != idCpu)
2017 return VINF_SUCCESS;
2018
2019 /*
2020 * We're racing other VCPUs here, so don't try patch the instruction twice
2021 * and make sure there is still room for our patch record.
2022 */
2023 PCPUMCTX pCtx = CPUMQueryGuestCtxPtr(pVCpu);
2024 PHMTPRPATCH pPatch = (PHMTPRPATCH)RTAvloU32Get(&pVM->hm.s.PatchTree, (AVLOU32KEY)pCtx->eip);
2025 if (pPatch)
2026 {
2027 Log(("hmR3PatchTprInstr: already patched %RGv\n", pCtx->rip));
2028 return VINF_SUCCESS;
2029 }
2030 uint32_t const idx = pVM->hm.s.cPatches;
2031 if (idx >= RT_ELEMENTS(pVM->hm.s.aPatches))
2032 {
2033 Log(("hmR3PatchTprInstr: no available patch slots (%RGv)\n", pCtx->rip));
2034 return VINF_SUCCESS;
2035 }
2036 pPatch = &pVM->hm.s.aPatches[idx];
2037
2038 Log(("hmR3PatchTprInstr: rip=%RGv idxPatch=%u\n", pCtx->rip, idx));
2039 DBGFR3_DISAS_INSTR_CUR_LOG(pVCpu, "hmR3PatchTprInstr");
2040
2041 /*
2042 * Disassemble the instruction and get cracking.
2043 */
2044 PDISCPUSTATE pDis = &pVCpu->hm.s.DisState;
2045 uint32_t cbOp;
2046 int rc = EMInterpretDisasCurrent(pVM, pVCpu, pDis, &cbOp);
2047 AssertRC(rc);
2048 if ( rc == VINF_SUCCESS
2049 && pDis->pCurInstr->uOpcode == OP_MOV
2050 && cbOp >= 5)
2051 {
2052 uint8_t aPatch[64];
2053 uint32_t off = 0;
2054
2055 rc = PGMPhysSimpleReadGCPtr(pVCpu, pPatch->aOpcode, pCtx->rip, cbOp);
2056 AssertRC(rc);
2057
2058 pPatch->cbOp = cbOp;
2059 pPatch->enmType = HMTPRINSTR_JUMP_REPLACEMENT;
2060
2061 if (pDis->Param1.fUse == DISUSE_DISPLACEMENT32)
2062 {
2063 /*
2064 * TPR write:
2065 *
2066 * push ECX [51]
2067 * push EDX [52]
2068 * push EAX [50]
2069 * xor EDX,EDX [31 D2]
2070 * mov EAX,EAX [89 C0]
2071 * or
2072 * mov EAX,0000000CCh [B8 CC 00 00 00]
2073 * mov ECX,0C0000082h [B9 82 00 00 C0]
2074 * wrmsr [0F 30]
2075 * pop EAX [58]
2076 * pop EDX [5A]
2077 * pop ECX [59]
2078 * jmp return_address [E9 return_address]
2079 *
2080 */
2081 bool fUsesEax = (pDis->Param2.fUse == DISUSE_REG_GEN32 && pDis->Param2.Base.idxGenReg == DISGREG_EAX);
2082
2083 aPatch[off++] = 0x51; /* push ecx */
2084 aPatch[off++] = 0x52; /* push edx */
2085 if (!fUsesEax)
2086 aPatch[off++] = 0x50; /* push eax */
2087 aPatch[off++] = 0x31; /* xor edx, edx */
2088 aPatch[off++] = 0xD2;
2089 if (pDis->Param2.fUse == DISUSE_REG_GEN32)
2090 {
2091 if (!fUsesEax)
2092 {
2093 aPatch[off++] = 0x89; /* mov eax, src_reg */
2094 aPatch[off++] = MAKE_MODRM(3, pDis->Param2.Base.idxGenReg, DISGREG_EAX);
2095 }
2096 }
2097 else
2098 {
2099 Assert(pDis->Param2.fUse == DISUSE_IMMEDIATE32);
2100 aPatch[off++] = 0xB8; /* mov eax, immediate */
2101 *(uint32_t *)&aPatch[off] = pDis->Param2.uValue;
2102 off += sizeof(uint32_t);
2103 }
2104 aPatch[off++] = 0xB9; /* mov ecx, 0xc0000082 */
2105 *(uint32_t *)&aPatch[off] = MSR_K8_LSTAR;
2106 off += sizeof(uint32_t);
2107
2108 aPatch[off++] = 0x0F; /* wrmsr */
2109 aPatch[off++] = 0x30;
2110 if (!fUsesEax)
2111 aPatch[off++] = 0x58; /* pop eax */
2112 aPatch[off++] = 0x5A; /* pop edx */
2113 aPatch[off++] = 0x59; /* pop ecx */
2114 }
2115 else
2116 {
2117 /*
2118 * TPR read:
2119 *
2120 * push ECX [51]
2121 * push EDX [52]
2122 * push EAX [50]
2123 * mov ECX,0C0000082h [B9 82 00 00 C0]
2124 * rdmsr [0F 32]
2125 * mov EAX,EAX [89 C0]
2126 * pop EAX [58]
2127 * pop EDX [5A]
2128 * pop ECX [59]
2129 * jmp return_address [E9 return_address]
2130 *
2131 */
2132 Assert(pDis->Param1.fUse == DISUSE_REG_GEN32);
2133
2134 if (pDis->Param1.Base.idxGenReg != DISGREG_ECX)
2135 aPatch[off++] = 0x51; /* push ecx */
2136 if (pDis->Param1.Base.idxGenReg != DISGREG_EDX )
2137 aPatch[off++] = 0x52; /* push edx */
2138 if (pDis->Param1.Base.idxGenReg != DISGREG_EAX)
2139 aPatch[off++] = 0x50; /* push eax */
2140
2141 aPatch[off++] = 0x31; /* xor edx, edx */
2142 aPatch[off++] = 0xD2;
2143
2144 aPatch[off++] = 0xB9; /* mov ecx, 0xc0000082 */
2145 *(uint32_t *)&aPatch[off] = MSR_K8_LSTAR;
2146 off += sizeof(uint32_t);
2147
2148 aPatch[off++] = 0x0F; /* rdmsr */
2149 aPatch[off++] = 0x32;
2150
2151 if (pDis->Param1.Base.idxGenReg != DISGREG_EAX)
2152 {
2153 aPatch[off++] = 0x89; /* mov dst_reg, eax */
2154 aPatch[off++] = MAKE_MODRM(3, DISGREG_EAX, pDis->Param1.Base.idxGenReg);
2155 }
2156
2157 if (pDis->Param1.Base.idxGenReg != DISGREG_EAX)
2158 aPatch[off++] = 0x58; /* pop eax */
2159 if (pDis->Param1.Base.idxGenReg != DISGREG_EDX )
2160 aPatch[off++] = 0x5A; /* pop edx */
2161 if (pDis->Param1.Base.idxGenReg != DISGREG_ECX)
2162 aPatch[off++] = 0x59; /* pop ecx */
2163 }
2164 aPatch[off++] = 0xE9; /* jmp return_address */
2165 *(RTRCUINTPTR *)&aPatch[off] = ((RTRCUINTPTR)pCtx->eip + cbOp) - ((RTRCUINTPTR)pVM->hm.s.pFreeGuestPatchMem + off + 4);
2166 off += sizeof(RTRCUINTPTR);
2167
2168 if (pVM->hm.s.pFreeGuestPatchMem + off <= pVM->hm.s.pGuestPatchMem + pVM->hm.s.cbGuestPatchMem)
2169 {
2170 /* Write new code to the patch buffer. */
2171 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pVM->hm.s.pFreeGuestPatchMem, aPatch, off);
2172 AssertRC(rc);
2173
2174#ifdef LOG_ENABLED
2175 uint32_t cbCurInstr;
2176 for (RTGCPTR GCPtrInstr = pVM->hm.s.pFreeGuestPatchMem;
2177 GCPtrInstr < pVM->hm.s.pFreeGuestPatchMem + off;
2178 GCPtrInstr += RT_MAX(cbCurInstr, 1))
2179 {
2180 char szOutput[256];
2181 rc = DBGFR3DisasInstrEx(pVM->pUVM, pVCpu->idCpu, pCtx->cs.Sel, GCPtrInstr, DBGF_DISAS_FLAGS_DEFAULT_MODE,
2182 szOutput, sizeof(szOutput), &cbCurInstr);
2183 if (RT_SUCCESS(rc))
2184 Log(("Patch instr %s\n", szOutput));
2185 else
2186 Log(("%RGv: rc=%Rrc\n", GCPtrInstr, rc));
2187 }
2188#endif
2189
2190 pPatch->aNewOpcode[0] = 0xE9;
2191 *(RTRCUINTPTR *)&pPatch->aNewOpcode[1] = ((RTRCUINTPTR)pVM->hm.s.pFreeGuestPatchMem) - ((RTRCUINTPTR)pCtx->eip + 5);
2192
2193 /* Overwrite the TPR instruction with a jump. */
2194 rc = PGMPhysSimpleWriteGCPtr(pVCpu, pCtx->eip, pPatch->aNewOpcode, 5);
2195 AssertRC(rc);
2196
2197 DBGFR3_DISAS_INSTR_CUR_LOG(pVCpu, "Jump");
2198
2199 pVM->hm.s.pFreeGuestPatchMem += off;
2200 pPatch->cbNewOp = 5;
2201
2202 pPatch->Core.Key = pCtx->eip;
2203 rc = RTAvloU32Insert(&pVM->hm.s.PatchTree, &pPatch->Core);
2204 AssertRC(rc);
2205
2206 pVM->hm.s.cPatches++;
2207 pVM->hm.s.fTPRPatchingActive = true;
2208 STAM_COUNTER_INC(&pVM->hm.s.StatTprPatchSuccess);
2209 return VINF_SUCCESS;
2210 }
2211
2212 Log(("Ran out of space in our patch buffer!\n"));
2213 }
2214 else
2215 Log(("hmR3PatchTprInstr: Failed to patch instr!\n"));
2216
2217
2218 /*
2219 * Save invalid patch, so we will not try again.
2220 */
2221 pPatch = &pVM->hm.s.aPatches[idx];
2222 pPatch->Core.Key = pCtx->eip;
2223 pPatch->enmType = HMTPRINSTR_INVALID;
2224 rc = RTAvloU32Insert(&pVM->hm.s.PatchTree, &pPatch->Core);
2225 AssertRC(rc);
2226 pVM->hm.s.cPatches++;
2227 STAM_COUNTER_INC(&pVM->hm.s.StatTprPatchFailure);
2228 return VINF_SUCCESS;
2229}
2230
2231
2232/**
2233 * Attempt to patch TPR mmio instructions.
2234 *
2235 * @returns VBox status code.
2236 * @param pVM Pointer to the VM.
2237 * @param pVCpu Pointer to the VMCPU.
2238 * @param pCtx Pointer to the guest CPU context.
2239 */
2240VMMR3_INT_DECL(int) HMR3PatchTprInstr(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
2241{
2242 NOREF(pCtx);
2243 int rc = VMMR3EmtRendezvous(pVM, VMMEMTRENDEZVOUS_FLAGS_TYPE_ONE_BY_ONE,
2244 pVM->hm.s.pGuestPatchMem ? hmR3PatchTprInstr : hmR3ReplaceTprInstr,
2245 (void *)(uintptr_t)pVCpu->idCpu);
2246 AssertRC(rc);
2247 return rc;
2248}
2249
2250
2251/**
2252 * Checks if a code selector (CS) is suitable for execution
2253 * within VMX when unrestricted execution isn't available.
2254 *
2255 * @returns true if selector is suitable for VMX, otherwise
2256 * false.
2257 * @param pSel Pointer to the selector to check (CS).
2258 * uStackDpl The CPL, aka the DPL of the stack segment.
2259 */
2260static bool hmR3IsCodeSelectorOkForVmx(PCPUMSELREG pSel, unsigned uStackDpl)
2261{
2262 /*
2263 * Segment must be an accessed code segment, it must be present and it must
2264 * be usable.
2265 * Note! These are all standard requirements and if CS holds anything else
2266 * we've got buggy code somewhere!
2267 */
2268 AssertCompile(X86DESCATTR_TYPE == 0xf);
2269 AssertMsgReturn( (pSel->Attr.u & (X86_SEL_TYPE_ACCESSED | X86_SEL_TYPE_CODE | X86DESCATTR_DT | X86DESCATTR_P | X86DESCATTR_UNUSABLE))
2270 == (X86_SEL_TYPE_ACCESSED | X86_SEL_TYPE_CODE | X86DESCATTR_DT | X86DESCATTR_P),
2271 ("%#x\n", pSel->Attr.u),
2272 false);
2273
2274 /* For conforming segments, CS.DPL must be <= SS.DPL, while CS.DPL
2275 must equal SS.DPL for non-confroming segments.
2276 Note! This is also a hard requirement like above. */
2277 AssertMsgReturn( pSel->Attr.n.u4Type & X86_SEL_TYPE_CONF
2278 ? pSel->Attr.n.u2Dpl <= uStackDpl
2279 : pSel->Attr.n.u2Dpl == uStackDpl,
2280 ("u4Type=%#x u2Dpl=%u uStackDpl=%u\n", pSel->Attr.n.u4Type, pSel->Attr.n.u2Dpl, uStackDpl),
2281 false);
2282
2283 /*
2284 * The following two requirements are VT-x specific:
2285 * - G bit must be set if any high limit bits are set.
2286 * - G bit must be clear if any low limit bits are clear.
2287 */
2288 if ( ((pSel->u32Limit & 0xfff00000) == 0x00000000 || pSel->Attr.n.u1Granularity)
2289 && ((pSel->u32Limit & 0x00000fff) == 0x00000fff || !pSel->Attr.n.u1Granularity) )
2290 return true;
2291 return false;
2292}
2293
2294
2295/**
2296 * Checks if a data selector (DS/ES/FS/GS) is suitable for
2297 * execution within VMX when unrestricted execution isn't
2298 * available.
2299 *
2300 * @returns true if selector is suitable for VMX, otherwise
2301 * false.
2302 * @param pSel Pointer to the selector to check
2303 * (DS/ES/FS/GS).
2304 */
2305static bool hmR3IsDataSelectorOkForVmx(PCPUMSELREG pSel)
2306{
2307 /*
2308 * Unusable segments are OK. These days they should be marked as such, as
2309 * but as an alternative we for old saved states and AMD<->VT-x migration
2310 * we also treat segments with all the attributes cleared as unusable.
2311 */
2312 if (pSel->Attr.n.u1Unusable || !pSel->Attr.u)
2313 return true;
2314
2315 /** @todo tighten these checks. Will require CPUM load adjusting. */
2316
2317 /* Segment must be accessed. */
2318 if (pSel->Attr.u & X86_SEL_TYPE_ACCESSED)
2319 {
2320 /* Code segments must also be readable. */
2321 if ( !(pSel->Attr.u & X86_SEL_TYPE_CODE)
2322 || (pSel->Attr.u & X86_SEL_TYPE_READ))
2323 {
2324 /* The S bit must be set. */
2325 if (pSel->Attr.n.u1DescType)
2326 {
2327 /* Except for conforming segments, DPL >= RPL. */
2328 if ( pSel->Attr.n.u2Dpl >= (pSel->Sel & X86_SEL_RPL)
2329 || pSel->Attr.n.u4Type >= X86_SEL_TYPE_ER_ACC)
2330 {
2331 /* Segment must be present. */
2332 if (pSel->Attr.n.u1Present)
2333 {
2334 /*
2335 * The following two requirements are VT-x specific:
2336 * - G bit must be set if any high limit bits are set.
2337 * - G bit must be clear if any low limit bits are clear.
2338 */
2339 if ( ((pSel->u32Limit & 0xfff00000) == 0x00000000 || pSel->Attr.n.u1Granularity)
2340 && ((pSel->u32Limit & 0x00000fff) == 0x00000fff || !pSel->Attr.n.u1Granularity) )
2341 return true;
2342 }
2343 }
2344 }
2345 }
2346 }
2347
2348 return false;
2349}
2350
2351
2352/**
2353 * Checks if the stack selector (SS) is suitable for execution
2354 * within VMX when unrestricted execution isn't available.
2355 *
2356 * @returns true if selector is suitable for VMX, otherwise
2357 * false.
2358 * @param pSel Pointer to the selector to check (SS).
2359 */
2360static bool hmR3IsStackSelectorOkForVmx(PCPUMSELREG pSel)
2361{
2362 /*
2363 * Unusable segments are OK. These days they should be marked as such, as
2364 * but as an alternative we for old saved states and AMD<->VT-x migration
2365 * we also treat segments with all the attributes cleared as unusable.
2366 */
2367 /** @todo r=bird: actually all zeros isn't gonna cut it... SS.DPL == CPL. */
2368 if (pSel->Attr.n.u1Unusable || !pSel->Attr.u)
2369 return true;
2370
2371 /*
2372 * Segment must be an accessed writable segment, it must be present.
2373 * Note! These are all standard requirements and if SS holds anything else
2374 * we've got buggy code somewhere!
2375 */
2376 AssertCompile(X86DESCATTR_TYPE == 0xf);
2377 AssertMsgReturn( (pSel->Attr.u & (X86_SEL_TYPE_ACCESSED | X86_SEL_TYPE_WRITE | X86DESCATTR_DT | X86DESCATTR_P | X86_SEL_TYPE_CODE))
2378 == (X86_SEL_TYPE_ACCESSED | X86_SEL_TYPE_WRITE | X86DESCATTR_DT | X86DESCATTR_P),
2379 ("%#x\n", pSel->Attr.u),
2380 false);
2381
2382 /* DPL must equal RPL.
2383 Note! This is also a hard requirement like above. */
2384 AssertMsgReturn(pSel->Attr.n.u2Dpl == (pSel->Sel & X86_SEL_RPL),
2385 ("u2Dpl=%u Sel=%#x\n", pSel->Attr.n.u2Dpl, pSel->Sel),
2386 false);
2387
2388 /*
2389 * The following two requirements are VT-x specific:
2390 * - G bit must be set if any high limit bits are set.
2391 * - G bit must be clear if any low limit bits are clear.
2392 */
2393 if ( ((pSel->u32Limit & 0xfff00000) == 0x00000000 || pSel->Attr.n.u1Granularity)
2394 && ((pSel->u32Limit & 0x00000fff) == 0x00000fff || !pSel->Attr.n.u1Granularity) )
2395 return true;
2396 return false;
2397}
2398
2399
2400/**
2401 * Force execution of the current IO code in the recompiler.
2402 *
2403 * @returns VBox status code.
2404 * @param pVM Pointer to the VM.
2405 * @param pCtx Partial VM execution context.
2406 */
2407VMMR3_INT_DECL(int) HMR3EmulateIoBlock(PVM pVM, PCPUMCTX pCtx)
2408{
2409 PVMCPU pVCpu = VMMGetCpu(pVM);
2410
2411 Assert(HMIsEnabled(pVM));
2412 Log(("HMR3EmulateIoBlock\n"));
2413
2414 /* This is primarily intended to speed up Grub, so we don't care about paged protected mode. */
2415 if (HMCanEmulateIoBlockEx(pCtx))
2416 {
2417 Log(("HMR3EmulateIoBlock -> enabled\n"));
2418 pVCpu->hm.s.EmulateIoBlock.fEnabled = true;
2419 pVCpu->hm.s.EmulateIoBlock.GCPtrFunctionEip = pCtx->rip;
2420 pVCpu->hm.s.EmulateIoBlock.cr0 = pCtx->cr0;
2421 return VINF_EM_RESCHEDULE_REM;
2422 }
2423 return VINF_SUCCESS;
2424}
2425
2426
2427/**
2428 * Checks if we can currently use hardware accelerated raw mode.
2429 *
2430 * @returns true if we can currently use hardware acceleration, otherwise false.
2431 * @param pVM Pointer to the VM.
2432 * @param pCtx Partial VM execution context.
2433 */
2434VMMR3DECL(bool) HMR3CanExecuteGuest(PVM pVM, PCPUMCTX pCtx)
2435{
2436 PVMCPU pVCpu = VMMGetCpu(pVM);
2437
2438 Assert(HMIsEnabled(pVM));
2439
2440 /* If we're still executing the IO code, then return false. */
2441 if ( RT_UNLIKELY(pVCpu->hm.s.EmulateIoBlock.fEnabled)
2442 && pCtx->rip < pVCpu->hm.s.EmulateIoBlock.GCPtrFunctionEip + 0x200
2443 && pCtx->rip > pVCpu->hm.s.EmulateIoBlock.GCPtrFunctionEip - 0x200
2444 && pCtx->cr0 == pVCpu->hm.s.EmulateIoBlock.cr0)
2445 return false;
2446
2447 pVCpu->hm.s.EmulateIoBlock.fEnabled = false;
2448
2449 /* AMD-V supports real & protected mode with or without paging. */
2450 if (pVM->hm.s.svm.fEnabled)
2451 {
2452 pVCpu->hm.s.fActive = true;
2453 return true;
2454 }
2455
2456 pVCpu->hm.s.fActive = false;
2457
2458 /* Note! The context supplied by REM is partial. If we add more checks here, be sure to verify that REM provides this info! */
2459 Assert( (pVM->hm.s.vmx.fUnrestrictedGuest && !pVM->hm.s.vmx.pRealModeTSS)
2460 || (!pVM->hm.s.vmx.fUnrestrictedGuest && pVM->hm.s.vmx.pRealModeTSS));
2461
2462 bool fSupportsRealMode = pVM->hm.s.vmx.fUnrestrictedGuest || PDMVmmDevHeapIsEnabled(pVM);
2463 if (!pVM->hm.s.vmx.fUnrestrictedGuest)
2464 {
2465 /*
2466 * The VMM device heap is a requirement for emulating real mode or protected mode without paging with the unrestricted
2467 * guest execution feature i missing (VT-x only).
2468 */
2469 if (fSupportsRealMode)
2470 {
2471 if (CPUMIsGuestInRealModeEx(pCtx))
2472 {
2473 /* In V86 mode (VT-x or not), the CPU enforces real-mode compatible selector
2474 * bases and limits, i.e. limit must be 64K and base must be selector * 16.
2475 * If this is not true, we cannot execute real mode as V86 and have to fall
2476 * back to emulation.
2477 */
2478 if ( pCtx->cs.Sel != (pCtx->cs.u64Base >> 4)
2479 || pCtx->ds.Sel != (pCtx->ds.u64Base >> 4)
2480 || pCtx->es.Sel != (pCtx->es.u64Base >> 4)
2481 || pCtx->ss.Sel != (pCtx->ss.u64Base >> 4)
2482 || pCtx->fs.Sel != (pCtx->fs.u64Base >> 4)
2483 || pCtx->gs.Sel != (pCtx->gs.u64Base >> 4))
2484 {
2485 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadRmSelBase);
2486 return false;
2487 }
2488 if ( (pCtx->cs.u32Limit != 0xffff)
2489 || (pCtx->ds.u32Limit != 0xffff)
2490 || (pCtx->es.u32Limit != 0xffff)
2491 || (pCtx->ss.u32Limit != 0xffff)
2492 || (pCtx->fs.u32Limit != 0xffff)
2493 || (pCtx->gs.u32Limit != 0xffff))
2494 {
2495 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadRmSelLimit);
2496 return false;
2497 }
2498 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckRmOk);
2499 }
2500 else
2501 {
2502 /* Verify the requirements for executing code in protected
2503 mode. VT-x can't handle the CPU state right after a switch
2504 from real to protected mode. (all sorts of RPL & DPL assumptions). */
2505 if (pVCpu->hm.s.vmx.fWasInRealMode)
2506 {
2507 /** @todo If guest is in V86 mode, these checks should be different! */
2508 if ((pCtx->cs.Sel & X86_SEL_RPL) != (pCtx->ss.Sel & X86_SEL_RPL))
2509 {
2510 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadRpl);
2511 return false;
2512 }
2513 if ( !hmR3IsCodeSelectorOkForVmx(&pCtx->cs, pCtx->ss.Attr.n.u2Dpl)
2514 || !hmR3IsDataSelectorOkForVmx(&pCtx->ds)
2515 || !hmR3IsDataSelectorOkForVmx(&pCtx->es)
2516 || !hmR3IsDataSelectorOkForVmx(&pCtx->fs)
2517 || !hmR3IsDataSelectorOkForVmx(&pCtx->gs)
2518 || !hmR3IsStackSelectorOkForVmx(&pCtx->ss))
2519 {
2520 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadSel);
2521 return false;
2522 }
2523 }
2524 /* VT-x also chokes on invalid TR or LDTR selectors (minix). */
2525 if (pCtx->gdtr.cbGdt)
2526 {
2527 if (pCtx->tr.Sel > pCtx->gdtr.cbGdt)
2528 {
2529 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadTr);
2530 return false;
2531 }
2532 else if (pCtx->ldtr.Sel > pCtx->gdtr.cbGdt)
2533 {
2534 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckBadLdt);
2535 return false;
2536 }
2537 }
2538 STAM_COUNTER_INC(&pVCpu->hm.s.StatVmxCheckPmOk);
2539 }
2540 }
2541 else
2542 {
2543 if ( !CPUMIsGuestInLongModeEx(pCtx)
2544 && !pVM->hm.s.vmx.fUnrestrictedGuest)
2545 {
2546 if ( !pVM->hm.s.fNestedPaging /* Requires a fake PD for real *and* protected mode without paging - stored in the VMM device heap */
2547 || CPUMIsGuestInRealModeEx(pCtx)) /* Requires a fake TSS for real mode - stored in the VMM device heap */
2548 return false;
2549
2550 /* Too early for VT-x; Solaris guests will fail with a guru meditation otherwise; same for XP. */
2551 if (pCtx->idtr.pIdt == 0 || pCtx->idtr.cbIdt == 0 || pCtx->tr.Sel == 0)
2552 return false;
2553
2554 /* The guest is about to complete the switch to protected mode. Wait a bit longer. */
2555 /* Windows XP; switch to protected mode; all selectors are marked not present in the
2556 * hidden registers (possible recompiler bug; see load_seg_vm) */
2557 if (pCtx->cs.Attr.n.u1Present == 0)
2558 return false;
2559 if (pCtx->ss.Attr.n.u1Present == 0)
2560 return false;
2561
2562 /* Windows XP: possible same as above, but new recompiler requires new heuristics?
2563 VT-x doesn't seem to like something about the guest state and this stuff avoids it. */
2564 /** @todo This check is actually wrong, it doesn't take the direction of the
2565 * stack segment into account. But, it does the job for now. */
2566 if (pCtx->rsp >= pCtx->ss.u32Limit)
2567 return false;
2568 }
2569 }
2570 }
2571
2572 if (pVM->hm.s.vmx.fEnabled)
2573 {
2574 uint32_t mask;
2575
2576 /* if bit N is set in cr0_fixed0, then it must be set in the guest's cr0. */
2577 mask = (uint32_t)pVM->hm.s.vmx.Msrs.u64Cr0Fixed0;
2578 /* Note: We ignore the NE bit here on purpose; see vmmr0\hmr0.cpp for details. */
2579 mask &= ~X86_CR0_NE;
2580
2581 if (fSupportsRealMode)
2582 {
2583 /* Note: We ignore the PE & PG bits here on purpose; we emulate real and protected mode without paging. */
2584 mask &= ~(X86_CR0_PG|X86_CR0_PE);
2585 }
2586 else
2587 {
2588 /* We support protected mode without paging using identity mapping. */
2589 mask &= ~X86_CR0_PG;
2590 }
2591 if ((pCtx->cr0 & mask) != mask)
2592 return false;
2593
2594 /* if bit N is cleared in cr0_fixed1, then it must be zero in the guest's cr0. */
2595 mask = (uint32_t)~pVM->hm.s.vmx.Msrs.u64Cr0Fixed1;
2596 if ((pCtx->cr0 & mask) != 0)
2597 return false;
2598
2599 /* if bit N is set in cr4_fixed0, then it must be set in the guest's cr4. */
2600 mask = (uint32_t)pVM->hm.s.vmx.Msrs.u64Cr4Fixed0;
2601 mask &= ~X86_CR4_VMXE;
2602 if ((pCtx->cr4 & mask) != mask)
2603 return false;
2604
2605 /* if bit N is cleared in cr4_fixed1, then it must be zero in the guest's cr4. */
2606 mask = (uint32_t)~pVM->hm.s.vmx.Msrs.u64Cr4Fixed1;
2607 if ((pCtx->cr4 & mask) != 0)
2608 return false;
2609
2610 pVCpu->hm.s.fActive = true;
2611 return true;
2612 }
2613
2614 return false;
2615}
2616
2617
2618/**
2619 * Checks if we need to reschedule due to VMM device heap changes.
2620 *
2621 * @returns true if a reschedule is required, otherwise false.
2622 * @param pVM Pointer to the VM.
2623 * @param pCtx VM execution context.
2624 */
2625VMMR3_INT_DECL(bool) HMR3IsRescheduleRequired(PVM pVM, PCPUMCTX pCtx)
2626{
2627 /*
2628 * The VMM device heap is a requirement for emulating real-mode or protected-mode without paging
2629 * when the unrestricted guest execution feature is missing (VT-x only).
2630 */
2631 if ( pVM->hm.s.vmx.fEnabled
2632 && !pVM->hm.s.vmx.fUnrestrictedGuest
2633 && CPUMIsGuestInRealModeEx(pCtx)
2634 && !PDMVmmDevHeapIsEnabled(pVM))
2635 {
2636 return true;
2637 }
2638
2639 return false;
2640}
2641
2642
2643/**
2644 * Notification from EM about a rescheduling into hardware assisted execution
2645 * mode.
2646 *
2647 * @param pVCpu Pointer to the current VMCPU.
2648 */
2649VMMR3_INT_DECL(void) HMR3NotifyScheduled(PVMCPU pVCpu)
2650{
2651 VMCPU_HMCF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
2652}
2653
2654
2655/**
2656 * Notification from EM about returning from instruction emulation (REM / EM).
2657 *
2658 * @param pVCpu Pointer to the VMCPU.
2659 */
2660VMMR3_INT_DECL(void) HMR3NotifyEmulated(PVMCPU pVCpu)
2661{
2662 VMCPU_HMCF_SET(pVCpu, HM_CHANGED_ALL_GUEST);
2663}
2664
2665
2666/**
2667 * Checks if we are currently using hardware accelerated raw mode.
2668 *
2669 * @returns true if hardware acceleration is being used, otherwise false.
2670 * @param pVCpu Pointer to the VMCPU.
2671 */
2672VMMR3_INT_DECL(bool) HMR3IsActive(PVMCPU pVCpu)
2673{
2674 return pVCpu->hm.s.fActive;
2675}
2676
2677
2678/**
2679 * External interface for querying whether hardware accelerated raw mode is
2680 * enabled.
2681 *
2682 * @returns true if VT-x or AMD-V is being used, otherwise false.
2683 * @param pUVM The user mode VM handle.
2684 * @sa HMIsEnabled, HMIsEnabledNotMacro.
2685 */
2686VMMR3DECL(bool) HMR3IsEnabled(PUVM pUVM)
2687{
2688 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2689 PVM pVM = pUVM->pVM;
2690 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2691 return pVM->fHMEnabled; /* Don't use the macro as the GUI may query us very very early. */
2692}
2693
2694
2695/**
2696 * External interface for querying whether VT-x is being used.
2697 *
2698 * @returns true if VT-x is being used, otherwise false.
2699 * @param pUVM The user mode VM handle.
2700 * @sa HMR3IsSvmEnabled, HMIsEnabled
2701 */
2702VMMR3DECL(bool) HMR3IsVmxEnabled(PUVM pUVM)
2703{
2704 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2705 PVM pVM = pUVM->pVM;
2706 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2707 return pVM->hm.s.vmx.fEnabled
2708 && pVM->hm.s.vmx.fSupported
2709 && pVM->fHMEnabled;
2710}
2711
2712
2713/**
2714 * External interface for querying whether AMD-V is being used.
2715 *
2716 * @returns true if VT-x is being used, otherwise false.
2717 * @param pUVM The user mode VM handle.
2718 * @sa HMR3IsVmxEnabled, HMIsEnabled
2719 */
2720VMMR3DECL(bool) HMR3IsSvmEnabled(PUVM pUVM)
2721{
2722 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2723 PVM pVM = pUVM->pVM;
2724 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2725 return pVM->hm.s.svm.fEnabled
2726 && pVM->hm.s.svm.fSupported
2727 && pVM->fHMEnabled;
2728}
2729
2730
2731/**
2732 * Checks if we are currently using nested paging.
2733 *
2734 * @returns true if nested paging is being used, otherwise false.
2735 * @param pUVM The user mode VM handle.
2736 */
2737VMMR3DECL(bool) HMR3IsNestedPagingActive(PUVM pUVM)
2738{
2739 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2740 PVM pVM = pUVM->pVM;
2741 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2742 return pVM->hm.s.fNestedPaging;
2743}
2744
2745
2746/**
2747 * Checks if we are currently using VPID in VT-x mode.
2748 *
2749 * @returns true if VPID is being used, otherwise false.
2750 * @param pUVM The user mode VM handle.
2751 */
2752VMMR3DECL(bool) HMR3IsVpidActive(PUVM pUVM)
2753{
2754 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2755 PVM pVM = pUVM->pVM;
2756 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2757 return pVM->hm.s.vmx.fVpid;
2758}
2759
2760
2761/**
2762 * Checks if we are currently using VT-x unrestricted execution,
2763 * aka UX.
2764 *
2765 * @returns true if UX is being used, otherwise false.
2766 * @param pUVM The user mode VM handle.
2767 */
2768VMMR3DECL(bool) HMR3IsUXActive(PUVM pUVM)
2769{
2770 UVM_ASSERT_VALID_EXT_RETURN(pUVM, false);
2771 PVM pVM = pUVM->pVM;
2772 VM_ASSERT_VALID_EXT_RETURN(pVM, false);
2773 return pVM->hm.s.vmx.fUnrestrictedGuest;
2774}
2775
2776
2777/**
2778 * Checks if internal events are pending. In that case we are not allowed to dispatch interrupts.
2779 *
2780 * @returns true if an internal event is pending, otherwise false.
2781 * @param pVM Pointer to the VM.
2782 */
2783VMMR3_INT_DECL(bool) HMR3IsEventPending(PVMCPU pVCpu)
2784{
2785 return HMIsEnabled(pVCpu->pVMR3) && pVCpu->hm.s.Event.fPending;
2786}
2787
2788
2789/**
2790 * Checks if the VMX-preemption timer is being used.
2791 *
2792 * @returns true if the VMX-preemption timer is being used, otherwise false.
2793 * @param pVM Pointer to the VM.
2794 */
2795VMMR3_INT_DECL(bool) HMR3IsVmxPreemptionTimerUsed(PVM pVM)
2796{
2797 return HMIsEnabled(pVM)
2798 && pVM->hm.s.vmx.fEnabled
2799 && pVM->hm.s.vmx.fUsePreemptTimer;
2800}
2801
2802
2803/**
2804 * Restart an I/O instruction that was refused in ring-0
2805 *
2806 * @returns Strict VBox status code. Informational status codes other than the one documented
2807 * here are to be treated as internal failure. Use IOM_SUCCESS() to check for success.
2808 * @retval VINF_SUCCESS Success.
2809 * @retval VINF_EM_FIRST-VINF_EM_LAST Success with some exceptions (see IOM_SUCCESS()), the
2810 * status code must be passed on to EM.
2811 * @retval VERR_NOT_FOUND if no pending I/O instruction.
2812 *
2813 * @param pVM Pointer to the VM.
2814 * @param pVCpu Pointer to the VMCPU.
2815 * @param pCtx Pointer to the guest CPU context.
2816 */
2817VMMR3_INT_DECL(VBOXSTRICTRC) HMR3RestartPendingIOInstr(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
2818{
2819 HMPENDINGIO enmType = pVCpu->hm.s.PendingIO.enmType;
2820
2821 pVCpu->hm.s.PendingIO.enmType = HMPENDINGIO_INVALID;
2822
2823 if ( pVCpu->hm.s.PendingIO.GCPtrRip != pCtx->rip
2824 || enmType == HMPENDINGIO_INVALID)
2825 return VERR_NOT_FOUND;
2826
2827 VBOXSTRICTRC rcStrict;
2828 switch (enmType)
2829 {
2830 case HMPENDINGIO_PORT_READ:
2831 {
2832 uint32_t uAndVal = pVCpu->hm.s.PendingIO.s.Port.uAndVal;
2833 uint32_t u32Val = 0;
2834
2835 rcStrict = IOMIOPortRead(pVM, pVCpu, pVCpu->hm.s.PendingIO.s.Port.uPort,
2836 &u32Val,
2837 pVCpu->hm.s.PendingIO.s.Port.cbSize);
2838 if (IOM_SUCCESS(rcStrict))
2839 {
2840 /* Write back to the EAX register. */
2841 pCtx->eax = (pCtx->eax & ~uAndVal) | (u32Val & uAndVal);
2842 pCtx->rip = pVCpu->hm.s.PendingIO.GCPtrRipNext;
2843 }
2844 break;
2845 }
2846
2847 case HMPENDINGIO_PORT_WRITE:
2848 rcStrict = IOMIOPortWrite(pVM, pVCpu, pVCpu->hm.s.PendingIO.s.Port.uPort,
2849 pCtx->eax & pVCpu->hm.s.PendingIO.s.Port.uAndVal,
2850 pVCpu->hm.s.PendingIO.s.Port.cbSize);
2851 if (IOM_SUCCESS(rcStrict))
2852 pCtx->rip = pVCpu->hm.s.PendingIO.GCPtrRipNext;
2853 break;
2854
2855 default:
2856 AssertLogRelFailedReturn(VERR_HM_UNKNOWN_IO_INSTRUCTION);
2857 }
2858
2859 if (IOM_SUCCESS(rcStrict))
2860 {
2861 /*
2862 * Check for I/O breakpoints.
2863 */
2864 uint32_t const uDr7 = pCtx->dr[7];
2865 if ( ( (uDr7 & X86_DR7_ENABLED_MASK)
2866 && X86_DR7_ANY_RW_IO(uDr7)
2867 && (pCtx->cr4 & X86_CR4_DE))
2868 || DBGFBpIsHwIoArmed(pVM))
2869 {
2870 VBOXSTRICTRC rcStrict2 = DBGFBpCheckIo(pVM, pVCpu, pCtx, pVCpu->hm.s.PendingIO.s.Port.uPort,
2871 pVCpu->hm.s.PendingIO.s.Port.cbSize);
2872 if (rcStrict2 == VINF_EM_RAW_GUEST_TRAP)
2873 rcStrict2 = TRPMAssertTrap(pVCpu, X86_XCPT_DB, TRPM_TRAP);
2874 /* rcStrict is VINF_SUCCESS or in [VINF_EM_FIRST..VINF_EM_LAST]. */
2875 else if (rcStrict2 != VINF_SUCCESS && (rcStrict == VINF_SUCCESS || rcStrict2 < rcStrict))
2876 rcStrict = rcStrict2;
2877 }
2878 }
2879 return rcStrict;
2880}
2881
2882
2883/**
2884 * Check fatal VT-x/AMD-V error and produce some meaningful
2885 * log release message.
2886 *
2887 * @param pVM Pointer to the VM.
2888 * @param iStatusCode VBox status code.
2889 */
2890VMMR3_INT_DECL(void) HMR3CheckError(PVM pVM, int iStatusCode)
2891{
2892 for (VMCPUID i = 0; i < pVM->cCpus; i++)
2893 {
2894 PVMCPU pVCpu = &pVM->aCpus[i];
2895 switch (iStatusCode)
2896 {
2897 case VERR_VMX_INVALID_VMCS_FIELD:
2898 break;
2899
2900 case VERR_VMX_INVALID_VMCS_PTR:
2901 LogRel(("HM: VERR_VMX_INVALID_VMCS_PTR:\n"));
2902 LogRel(("HM: CPU[%u] Current pointer %#RGp vs %#RGp\n", i, pVCpu->hm.s.vmx.LastError.u64VMCSPhys,
2903 pVCpu->hm.s.vmx.HCPhysVmcs));
2904 LogRel(("HM: CPU[%u] Current VMCS version %#x\n", i, pVCpu->hm.s.vmx.LastError.u32VMCSRevision));
2905 LogRel(("HM: CPU[%u] Entered Host Cpu %u\n", i, pVCpu->hm.s.vmx.LastError.idEnteredCpu));
2906 LogRel(("HM: CPU[%u] Current Host Cpu %u\n", i, pVCpu->hm.s.vmx.LastError.idCurrentCpu));
2907 break;
2908
2909 case VERR_VMX_UNABLE_TO_START_VM:
2910 LogRel(("HM: VERR_VMX_UNABLE_TO_START_VM:\n"));
2911 LogRel(("HM: CPU[%u] Instruction error %#x\n", i, pVCpu->hm.s.vmx.LastError.u32InstrError));
2912 LogRel(("HM: CPU[%u] Exit reason %#x\n", i, pVCpu->hm.s.vmx.LastError.u32ExitReason));
2913
2914 if ( pVM->aCpus[i].hm.s.vmx.LastError.u32InstrError == VMX_ERROR_VMLAUCH_NON_CLEAR_VMCS
2915 || pVM->aCpus[i].hm.s.vmx.LastError.u32InstrError == VMX_ERROR_VMRESUME_NON_LAUNCHED_VMCS)
2916 {
2917 LogRel(("HM: CPU[%u] Entered Host Cpu %u\n", i, pVCpu->hm.s.vmx.LastError.idEnteredCpu));
2918 LogRel(("HM: CPU[%u] Current Host Cpu %u\n", i, pVCpu->hm.s.vmx.LastError.idCurrentCpu));
2919 }
2920 else if (pVM->aCpus[i].hm.s.vmx.LastError.u32InstrError == VMX_ERROR_VMENTRY_INVALID_CONTROL_FIELDS)
2921 {
2922 LogRel(("HM: CPU[%u] PinCtls %#RX32\n", i, pVCpu->hm.s.vmx.u32PinCtls));
2923 LogRel(("HM: CPU[%u] ProcCtls %#RX32\n", i, pVCpu->hm.s.vmx.u32ProcCtls));
2924 LogRel(("HM: CPU[%u] ProcCtls2 %#RX32\n", i, pVCpu->hm.s.vmx.u32ProcCtls2));
2925 LogRel(("HM: CPU[%u] EntryCtls %#RX32\n", i, pVCpu->hm.s.vmx.u32EntryCtls));
2926 LogRel(("HM: CPU[%u] ExitCtls %#RX32\n", i, pVCpu->hm.s.vmx.u32ExitCtls));
2927 LogRel(("HM: CPU[%u] MSRBitmapPhys %#RHp\n", i, pVCpu->hm.s.vmx.HCPhysMsrBitmap));
2928#ifdef VBOX_WITH_AUTO_MSR_LOAD_RESTORE
2929 LogRel(("HM: CPU[%u] GuestMSRPhys %#RHp\n", i, pVCpu->hm.s.vmx.HCPhysGuestMsr));
2930 LogRel(("HM: CPU[%u] HostMsrPhys %#RHp\n", i, pVCpu->hm.s.vmx.HCPhysHostMsr));
2931 LogRel(("HM: CPU[%u] cGuestMSRs %u\n", i, pVCpu->hm.s.vmx.cGuestMsrs));
2932#endif
2933 }
2934 /** @todo Log VM-entry event injection control fields
2935 * VMX_VMCS_CTRL_ENTRY_IRQ_INFO, VMX_VMCS_CTRL_ENTRY_EXCEPTION_ERRCODE
2936 * and VMX_VMCS_CTRL_ENTRY_INSTR_LENGTH from the VMCS. */
2937 break;
2938
2939 case VERR_VMX_INVALID_VMXON_PTR:
2940 break;
2941
2942 case VERR_HM_UNSUPPORTED_CPU_FEATURE_COMBO:
2943 case VERR_VMX_INVALID_GUEST_STATE:
2944 case VERR_VMX_UNEXPECTED_EXIT_CODE:
2945 case VERR_SVM_UNKNOWN_EXIT:
2946 case VERR_SVM_UNEXPECTED_EXIT:
2947 case VERR_SVM_UNEXPECTED_PATCH_TYPE:
2948 case VERR_SVM_UNEXPECTED_XCPT_EXIT:
2949 {
2950 LogRel(("HM: CPU[%u] HM error %#x (%u)\n", i, pVCpu->hm.s.u32HMError, pVCpu->hm.s.u32HMError));
2951 break;
2952 }
2953 }
2954 }
2955
2956 if (iStatusCode == VERR_VMX_UNABLE_TO_START_VM)
2957 {
2958 LogRel(("VERR_VMX_UNABLE_TO_START_VM: VM-entry allowed %#RX32\n", pVM->hm.s.vmx.Msrs.VmxEntry.n.allowed1));
2959 LogRel(("VERR_VMX_UNABLE_TO_START_VM: VM-entry disallowed %#RX32\n", pVM->hm.s.vmx.Msrs.VmxEntry.n.disallowed0));
2960 }
2961}
2962
2963
2964/**
2965 * Execute state save operation.
2966 *
2967 * @returns VBox status code.
2968 * @param pVM Pointer to the VM.
2969 * @param pSSM SSM operation handle.
2970 */
2971static DECLCALLBACK(int) hmR3Save(PVM pVM, PSSMHANDLE pSSM)
2972{
2973 int rc;
2974
2975 Log(("hmR3Save:\n"));
2976
2977 for (VMCPUID i = 0; i < pVM->cCpus; i++)
2978 {
2979 /*
2980 * Save the basic bits - fortunately all the other things can be resynced on load.
2981 */
2982 rc = SSMR3PutU32(pSSM, pVM->aCpus[i].hm.s.Event.fPending);
2983 AssertRCReturn(rc, rc);
2984 rc = SSMR3PutU32(pSSM, pVM->aCpus[i].hm.s.Event.u32ErrCode);
2985 AssertRCReturn(rc, rc);
2986 rc = SSMR3PutU64(pSSM, pVM->aCpus[i].hm.s.Event.u64IntrInfo);
2987 AssertRCReturn(rc, rc);
2988
2989 /** @todo We only need to save pVM->aCpus[i].hm.s.vmx.fWasInRealMode and
2990 * perhaps not even that (the initial value of @c true is safe. */
2991 uint32_t u32Dummy = PGMMODE_REAL;
2992 rc = SSMR3PutU32(pSSM, u32Dummy);
2993 AssertRCReturn(rc, rc);
2994 rc = SSMR3PutU32(pSSM, u32Dummy);
2995 AssertRCReturn(rc, rc);
2996 rc = SSMR3PutU32(pSSM, u32Dummy);
2997 AssertRCReturn(rc, rc);
2998 }
2999
3000#ifdef VBOX_HM_WITH_GUEST_PATCHING
3001 rc = SSMR3PutGCPtr(pSSM, pVM->hm.s.pGuestPatchMem);
3002 AssertRCReturn(rc, rc);
3003 rc = SSMR3PutGCPtr(pSSM, pVM->hm.s.pFreeGuestPatchMem);
3004 AssertRCReturn(rc, rc);
3005 rc = SSMR3PutU32(pSSM, pVM->hm.s.cbGuestPatchMem);
3006 AssertRCReturn(rc, rc);
3007
3008 /* Store all the guest patch records too. */
3009 rc = SSMR3PutU32(pSSM, pVM->hm.s.cPatches);
3010 AssertRCReturn(rc, rc);
3011
3012 for (unsigned i = 0; i < pVM->hm.s.cPatches; i++)
3013 {
3014 PHMTPRPATCH pPatch = &pVM->hm.s.aPatches[i];
3015
3016 rc = SSMR3PutU32(pSSM, pPatch->Core.Key);
3017 AssertRCReturn(rc, rc);
3018
3019 rc = SSMR3PutMem(pSSM, pPatch->aOpcode, sizeof(pPatch->aOpcode));
3020 AssertRCReturn(rc, rc);
3021
3022 rc = SSMR3PutU32(pSSM, pPatch->cbOp);
3023 AssertRCReturn(rc, rc);
3024
3025 rc = SSMR3PutMem(pSSM, pPatch->aNewOpcode, sizeof(pPatch->aNewOpcode));
3026 AssertRCReturn(rc, rc);
3027
3028 rc = SSMR3PutU32(pSSM, pPatch->cbNewOp);
3029 AssertRCReturn(rc, rc);
3030
3031 AssertCompileSize(HMTPRINSTR, 4);
3032 rc = SSMR3PutU32(pSSM, (uint32_t)pPatch->enmType);
3033 AssertRCReturn(rc, rc);
3034
3035 rc = SSMR3PutU32(pSSM, pPatch->uSrcOperand);
3036 AssertRCReturn(rc, rc);
3037
3038 rc = SSMR3PutU32(pSSM, pPatch->uDstOperand);
3039 AssertRCReturn(rc, rc);
3040
3041 rc = SSMR3PutU32(pSSM, pPatch->pJumpTarget);
3042 AssertRCReturn(rc, rc);
3043
3044 rc = SSMR3PutU32(pSSM, pPatch->cFaults);
3045 AssertRCReturn(rc, rc);
3046 }
3047#endif
3048 return VINF_SUCCESS;
3049}
3050
3051
3052/**
3053 * Execute state load operation.
3054 *
3055 * @returns VBox status code.
3056 * @param pVM Pointer to the VM.
3057 * @param pSSM SSM operation handle.
3058 * @param uVersion Data layout version.
3059 * @param uPass The data pass.
3060 */
3061static DECLCALLBACK(int) hmR3Load(PVM pVM, PSSMHANDLE pSSM, uint32_t uVersion, uint32_t uPass)
3062{
3063 int rc;
3064
3065 Log(("hmR3Load:\n"));
3066 Assert(uPass == SSM_PASS_FINAL); NOREF(uPass);
3067
3068 /*
3069 * Validate version.
3070 */
3071 if ( uVersion != HM_SSM_VERSION
3072 && uVersion != HM_SSM_VERSION_NO_PATCHING
3073 && uVersion != HM_SSM_VERSION_2_0_X)
3074 {
3075 AssertMsgFailed(("hmR3Load: Invalid version uVersion=%d!\n", uVersion));
3076 return VERR_SSM_UNSUPPORTED_DATA_UNIT_VERSION;
3077 }
3078 for (VMCPUID i = 0; i < pVM->cCpus; i++)
3079 {
3080 rc = SSMR3GetU32(pSSM, &pVM->aCpus[i].hm.s.Event.fPending);
3081 AssertRCReturn(rc, rc);
3082 rc = SSMR3GetU32(pSSM, &pVM->aCpus[i].hm.s.Event.u32ErrCode);
3083 AssertRCReturn(rc, rc);
3084 rc = SSMR3GetU64(pSSM, &pVM->aCpus[i].hm.s.Event.u64IntrInfo);
3085 AssertRCReturn(rc, rc);
3086
3087 if (uVersion >= HM_SSM_VERSION_NO_PATCHING)
3088 {
3089 uint32_t val;
3090 /** @todo See note in hmR3Save(). */
3091 rc = SSMR3GetU32(pSSM, &val);
3092 AssertRCReturn(rc, rc);
3093 rc = SSMR3GetU32(pSSM, &val);
3094 AssertRCReturn(rc, rc);
3095 rc = SSMR3GetU32(pSSM, &val);
3096 AssertRCReturn(rc, rc);
3097 }
3098 }
3099#ifdef VBOX_HM_WITH_GUEST_PATCHING
3100 if (uVersion > HM_SSM_VERSION_NO_PATCHING)
3101 {
3102 rc = SSMR3GetGCPtr(pSSM, &pVM->hm.s.pGuestPatchMem);
3103 AssertRCReturn(rc, rc);
3104 rc = SSMR3GetGCPtr(pSSM, &pVM->hm.s.pFreeGuestPatchMem);
3105 AssertRCReturn(rc, rc);
3106 rc = SSMR3GetU32(pSSM, &pVM->hm.s.cbGuestPatchMem);
3107 AssertRCReturn(rc, rc);
3108
3109 /* Fetch all TPR patch records. */
3110 rc = SSMR3GetU32(pSSM, &pVM->hm.s.cPatches);
3111 AssertRCReturn(rc, rc);
3112
3113 for (unsigned i = 0; i < pVM->hm.s.cPatches; i++)
3114 {
3115 PHMTPRPATCH pPatch = &pVM->hm.s.aPatches[i];
3116
3117 rc = SSMR3GetU32(pSSM, &pPatch->Core.Key);
3118 AssertRCReturn(rc, rc);
3119
3120 rc = SSMR3GetMem(pSSM, pPatch->aOpcode, sizeof(pPatch->aOpcode));
3121 AssertRCReturn(rc, rc);
3122
3123 rc = SSMR3GetU32(pSSM, &pPatch->cbOp);
3124 AssertRCReturn(rc, rc);
3125
3126 rc = SSMR3GetMem(pSSM, pPatch->aNewOpcode, sizeof(pPatch->aNewOpcode));
3127 AssertRCReturn(rc, rc);
3128
3129 rc = SSMR3GetU32(pSSM, &pPatch->cbNewOp);
3130 AssertRCReturn(rc, rc);
3131
3132 rc = SSMR3GetU32(pSSM, (uint32_t *)&pPatch->enmType);
3133 AssertRCReturn(rc, rc);
3134
3135 if (pPatch->enmType == HMTPRINSTR_JUMP_REPLACEMENT)
3136 pVM->hm.s.fTPRPatchingActive = true;
3137
3138 Assert(pPatch->enmType == HMTPRINSTR_JUMP_REPLACEMENT || pVM->hm.s.fTPRPatchingActive == false);
3139
3140 rc = SSMR3GetU32(pSSM, &pPatch->uSrcOperand);
3141 AssertRCReturn(rc, rc);
3142
3143 rc = SSMR3GetU32(pSSM, &pPatch->uDstOperand);
3144 AssertRCReturn(rc, rc);
3145
3146 rc = SSMR3GetU32(pSSM, &pPatch->cFaults);
3147 AssertRCReturn(rc, rc);
3148
3149 rc = SSMR3GetU32(pSSM, &pPatch->pJumpTarget);
3150 AssertRCReturn(rc, rc);
3151
3152 Log(("hmR3Load: patch %d\n", i));
3153 Log(("Key = %x\n", pPatch->Core.Key));
3154 Log(("cbOp = %d\n", pPatch->cbOp));
3155 Log(("cbNewOp = %d\n", pPatch->cbNewOp));
3156 Log(("type = %d\n", pPatch->enmType));
3157 Log(("srcop = %d\n", pPatch->uSrcOperand));
3158 Log(("dstop = %d\n", pPatch->uDstOperand));
3159 Log(("cFaults = %d\n", pPatch->cFaults));
3160 Log(("target = %x\n", pPatch->pJumpTarget));
3161 rc = RTAvloU32Insert(&pVM->hm.s.PatchTree, &pPatch->Core);
3162 AssertRC(rc);
3163 }
3164 }
3165#endif
3166
3167 return VINF_SUCCESS;
3168}
3169
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette