VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR0/VMMR0.cpp@ 75323

Last change on this file since 75323 was 74785, checked in by vboxsync, 6 years ago

vm.h,VMM: Use VMCPU_FF_IS_SET instead of VMCPU_FF_IS_PENDING when checking a single flag. Added compile time assertion on single flag. bugref:9180

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 90.6 KB
Line 
1/* $Id: VMMR0.cpp 74785 2018-10-12 10:14:19Z vboxsync $ */
2/** @file
3 * VMM - Host Context Ring 0.
4 */
5
6/*
7 * Copyright (C) 2006-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_VMM
23#include <VBox/vmm/vmm.h>
24#include <VBox/sup.h>
25#include <VBox/vmm/trpm.h>
26#include <VBox/vmm/cpum.h>
27#include <VBox/vmm/pdmapi.h>
28#include <VBox/vmm/pgm.h>
29#ifdef VBOX_WITH_NEM_R0
30# include <VBox/vmm/nem.h>
31#endif
32#include <VBox/vmm/em.h>
33#include <VBox/vmm/stam.h>
34#include <VBox/vmm/tm.h>
35#include "VMMInternal.h"
36#include <VBox/vmm/vm.h>
37#include <VBox/vmm/gvm.h>
38#ifdef VBOX_WITH_PCI_PASSTHROUGH
39# include <VBox/vmm/pdmpci.h>
40#endif
41#include <VBox/vmm/apic.h>
42
43#include <VBox/vmm/gvmm.h>
44#include <VBox/vmm/gmm.h>
45#include <VBox/vmm/gim.h>
46#include <VBox/intnet.h>
47#include <VBox/vmm/hm.h>
48#include <VBox/param.h>
49#include <VBox/err.h>
50#include <VBox/version.h>
51#include <VBox/log.h>
52
53#include <iprt/asm-amd64-x86.h>
54#include <iprt/assert.h>
55#include <iprt/crc.h>
56#include <iprt/mp.h>
57#include <iprt/once.h>
58#include <iprt/stdarg.h>
59#include <iprt/string.h>
60#include <iprt/thread.h>
61#include <iprt/timer.h>
62
63#include "dtrace/VBoxVMM.h"
64
65
66#if defined(_MSC_VER) && defined(RT_ARCH_AMD64) /** @todo check this with with VC7! */
67# pragma intrinsic(_AddressOfReturnAddress)
68#endif
69
70#if defined(RT_OS_DARWIN) && ARCH_BITS == 32
71# error "32-bit darwin is no longer supported. Go back to 4.3 or earlier!"
72#endif
73
74
75
76/*********************************************************************************************************************************
77* Defined Constants And Macros *
78*********************************************************************************************************************************/
79/** @def VMM_CHECK_SMAP_SETUP
80 * SMAP check setup. */
81/** @def VMM_CHECK_SMAP_CHECK
82 * Checks that the AC flag is set if SMAP is enabled. If AC is not set,
83 * it will be logged and @a a_BadExpr is executed. */
84/** @def VMM_CHECK_SMAP_CHECK2
85 * Checks that the AC flag is set if SMAP is enabled. If AC is not set, it will
86 * be logged, written to the VMs assertion text buffer, and @a a_BadExpr is
87 * executed. */
88#if defined(VBOX_STRICT) || 1
89# define VMM_CHECK_SMAP_SETUP() uint32_t const fKernelFeatures = SUPR0GetKernelFeatures()
90# define VMM_CHECK_SMAP_CHECK(a_BadExpr) \
91 do { \
92 if (fKernelFeatures & SUPKERNELFEATURES_SMAP) \
93 { \
94 RTCCUINTREG fEflCheck = ASMGetFlags(); \
95 if (RT_LIKELY(fEflCheck & X86_EFL_AC)) \
96 { /* likely */ } \
97 else \
98 { \
99 SUPR0Printf("%s, line %d: EFLAGS.AC is clear! (%#x)\n", __FUNCTION__, __LINE__, (uint32_t)fEflCheck); \
100 a_BadExpr; \
101 } \
102 } \
103 } while (0)
104# define VMM_CHECK_SMAP_CHECK2(a_pVM, a_BadExpr) \
105 do { \
106 if (fKernelFeatures & SUPKERNELFEATURES_SMAP) \
107 { \
108 RTCCUINTREG fEflCheck = ASMGetFlags(); \
109 if (RT_LIKELY(fEflCheck & X86_EFL_AC)) \
110 { /* likely */ } \
111 else \
112 { \
113 SUPR0BadContext((a_pVM) ? (a_pVM)->pSession : NULL, __FILE__, __LINE__, "EFLAGS.AC is zero!"); \
114 RTStrPrintf(pVM->vmm.s.szRing0AssertMsg1, sizeof(pVM->vmm.s.szRing0AssertMsg1), \
115 "%s, line %d: EFLAGS.AC is clear! (%#x)\n", __FUNCTION__, __LINE__, (uint32_t)fEflCheck); \
116 a_BadExpr; \
117 } \
118 } \
119 } while (0)
120#else
121# define VMM_CHECK_SMAP_SETUP() uint32_t const fKernelFeatures = 0
122# define VMM_CHECK_SMAP_CHECK(a_BadExpr) NOREF(fKernelFeatures)
123# define VMM_CHECK_SMAP_CHECK2(a_pVM, a_BadExpr) NOREF(fKernelFeatures)
124#endif
125
126
127/*********************************************************************************************************************************
128* Internal Functions *
129*********************************************************************************************************************************/
130RT_C_DECLS_BEGIN
131#if defined(RT_ARCH_X86) && (defined(RT_OS_SOLARIS) || defined(RT_OS_FREEBSD))
132extern uint64_t __udivdi3(uint64_t, uint64_t);
133extern uint64_t __umoddi3(uint64_t, uint64_t);
134#endif
135RT_C_DECLS_END
136
137
138/*********************************************************************************************************************************
139* Global Variables *
140*********************************************************************************************************************************/
141/** Drag in necessary library bits.
142 * The runtime lives here (in VMMR0.r0) and VBoxDD*R0.r0 links against us. */
143PFNRT g_VMMR0Deps[] =
144{
145 (PFNRT)RTCrc32,
146 (PFNRT)RTOnce,
147#if defined(RT_ARCH_X86) && (defined(RT_OS_SOLARIS) || defined(RT_OS_FREEBSD))
148 (PFNRT)__udivdi3,
149 (PFNRT)__umoddi3,
150#endif
151 NULL
152};
153
154#ifdef RT_OS_SOLARIS
155/* Dependency information for the native solaris loader. */
156extern "C" { char _depends_on[] = "vboxdrv"; }
157#endif
158
159/** The result of SUPR0GetRawModeUsability(), set by ModuleInit(). */
160int g_rcRawModeUsability = VINF_SUCCESS;
161
162
163/**
164 * Initialize the module.
165 * This is called when we're first loaded.
166 *
167 * @returns 0 on success.
168 * @returns VBox status on failure.
169 * @param hMod Image handle for use in APIs.
170 */
171DECLEXPORT(int) ModuleInit(void *hMod)
172{
173 VMM_CHECK_SMAP_SETUP();
174 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
175
176#ifdef VBOX_WITH_DTRACE_R0
177 /*
178 * The first thing to do is register the static tracepoints.
179 * (Deregistration is automatic.)
180 */
181 int rc2 = SUPR0TracerRegisterModule(hMod, &g_VTGObjHeader);
182 if (RT_FAILURE(rc2))
183 return rc2;
184#endif
185 LogFlow(("ModuleInit:\n"));
186
187#ifdef VBOX_WITH_64ON32_CMOS_DEBUG
188 /*
189 * Display the CMOS debug code.
190 */
191 ASMOutU8(0x72, 0x03);
192 uint8_t bDebugCode = ASMInU8(0x73);
193 LogRel(("CMOS Debug Code: %#x (%d)\n", bDebugCode, bDebugCode));
194 RTLogComPrintf("CMOS Debug Code: %#x (%d)\n", bDebugCode, bDebugCode);
195#endif
196
197 /*
198 * Initialize the VMM, GVMM, GMM, HM, PGM (Darwin) and INTNET.
199 */
200 int rc = vmmInitFormatTypes();
201 if (RT_SUCCESS(rc))
202 {
203 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
204 rc = GVMMR0Init();
205 if (RT_SUCCESS(rc))
206 {
207 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
208 rc = GMMR0Init();
209 if (RT_SUCCESS(rc))
210 {
211 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
212 rc = HMR0Init();
213 if (RT_SUCCESS(rc))
214 {
215 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
216 rc = PGMRegisterStringFormatTypes();
217 if (RT_SUCCESS(rc))
218 {
219 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
220#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
221 rc = PGMR0DynMapInit();
222#endif
223 if (RT_SUCCESS(rc))
224 {
225 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
226 rc = IntNetR0Init();
227 if (RT_SUCCESS(rc))
228 {
229#ifdef VBOX_WITH_PCI_PASSTHROUGH
230 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
231 rc = PciRawR0Init();
232#endif
233 if (RT_SUCCESS(rc))
234 {
235 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
236 rc = CPUMR0ModuleInit();
237 if (RT_SUCCESS(rc))
238 {
239#ifdef VBOX_WITH_TRIPLE_FAULT_HACK
240 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
241 rc = vmmR0TripleFaultHackInit();
242 if (RT_SUCCESS(rc))
243#endif
244 {
245 VMM_CHECK_SMAP_CHECK(rc = VERR_VMM_SMAP_BUT_AC_CLEAR);
246 if (RT_SUCCESS(rc))
247 {
248 g_rcRawModeUsability = SUPR0GetRawModeUsability();
249 if (g_rcRawModeUsability != VINF_SUCCESS)
250 SUPR0Printf("VMMR0!ModuleInit: SUPR0GetRawModeUsability -> %Rrc\n",
251 g_rcRawModeUsability);
252 LogFlow(("ModuleInit: returns success\n"));
253 return VINF_SUCCESS;
254 }
255 }
256
257 /*
258 * Bail out.
259 */
260#ifdef VBOX_WITH_TRIPLE_FAULT_HACK
261 vmmR0TripleFaultHackTerm();
262#endif
263 }
264 else
265 LogRel(("ModuleInit: CPUMR0ModuleInit -> %Rrc\n", rc));
266#ifdef VBOX_WITH_PCI_PASSTHROUGH
267 PciRawR0Term();
268#endif
269 }
270 else
271 LogRel(("ModuleInit: PciRawR0Init -> %Rrc\n", rc));
272 IntNetR0Term();
273 }
274 else
275 LogRel(("ModuleInit: IntNetR0Init -> %Rrc\n", rc));
276#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
277 PGMR0DynMapTerm();
278#endif
279 }
280 else
281 LogRel(("ModuleInit: PGMR0DynMapInit -> %Rrc\n", rc));
282 PGMDeregisterStringFormatTypes();
283 }
284 else
285 LogRel(("ModuleInit: PGMRegisterStringFormatTypes -> %Rrc\n", rc));
286 HMR0Term();
287 }
288 else
289 LogRel(("ModuleInit: HMR0Init -> %Rrc\n", rc));
290 GMMR0Term();
291 }
292 else
293 LogRel(("ModuleInit: GMMR0Init -> %Rrc\n", rc));
294 GVMMR0Term();
295 }
296 else
297 LogRel(("ModuleInit: GVMMR0Init -> %Rrc\n", rc));
298 vmmTermFormatTypes();
299 }
300 else
301 LogRel(("ModuleInit: vmmInitFormatTypes -> %Rrc\n", rc));
302
303 LogFlow(("ModuleInit: failed %Rrc\n", rc));
304 return rc;
305}
306
307
308/**
309 * Terminate the module.
310 * This is called when we're finally unloaded.
311 *
312 * @param hMod Image handle for use in APIs.
313 */
314DECLEXPORT(void) ModuleTerm(void *hMod)
315{
316 NOREF(hMod);
317 LogFlow(("ModuleTerm:\n"));
318
319 /*
320 * Terminate the CPUM module (Local APIC cleanup).
321 */
322 CPUMR0ModuleTerm();
323
324 /*
325 * Terminate the internal network service.
326 */
327 IntNetR0Term();
328
329 /*
330 * PGM (Darwin), HM and PciRaw global cleanup.
331 */
332#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
333 PGMR0DynMapTerm();
334#endif
335#ifdef VBOX_WITH_PCI_PASSTHROUGH
336 PciRawR0Term();
337#endif
338 PGMDeregisterStringFormatTypes();
339 HMR0Term();
340#ifdef VBOX_WITH_TRIPLE_FAULT_HACK
341 vmmR0TripleFaultHackTerm();
342#endif
343
344 /*
345 * Destroy the GMM and GVMM instances.
346 */
347 GMMR0Term();
348 GVMMR0Term();
349
350 vmmTermFormatTypes();
351
352 LogFlow(("ModuleTerm: returns\n"));
353}
354
355
356/**
357 * Initiates the R0 driver for a particular VM instance.
358 *
359 * @returns VBox status code.
360 *
361 * @param pGVM The global (ring-0) VM structure.
362 * @param pVM The cross context VM structure.
363 * @param uSvnRev The SVN revision of the ring-3 part.
364 * @param uBuildType Build type indicator.
365 * @thread EMT(0)
366 */
367static int vmmR0InitVM(PGVM pGVM, PVM pVM, uint32_t uSvnRev, uint32_t uBuildType)
368{
369 VMM_CHECK_SMAP_SETUP();
370 VMM_CHECK_SMAP_CHECK(return VERR_VMM_SMAP_BUT_AC_CLEAR);
371
372 /*
373 * Match the SVN revisions and build type.
374 */
375 if (uSvnRev != VMMGetSvnRev())
376 {
377 LogRel(("VMMR0InitVM: Revision mismatch, r3=%d r0=%d\n", uSvnRev, VMMGetSvnRev()));
378 SUPR0Printf("VMMR0InitVM: Revision mismatch, r3=%d r0=%d\n", uSvnRev, VMMGetSvnRev());
379 return VERR_VMM_R0_VERSION_MISMATCH;
380 }
381 if (uBuildType != vmmGetBuildType())
382 {
383 LogRel(("VMMR0InitVM: Build type mismatch, r3=%#x r0=%#x\n", uBuildType, vmmGetBuildType()));
384 SUPR0Printf("VMMR0InitVM: Build type mismatch, r3=%#x r0=%#x\n", uBuildType, vmmGetBuildType());
385 return VERR_VMM_R0_VERSION_MISMATCH;
386 }
387
388 int rc = GVMMR0ValidateGVMandVMandEMT(pGVM, pVM, 0 /*idCpu*/);
389 if (RT_FAILURE(rc))
390 return rc;
391
392#ifdef LOG_ENABLED
393 /*
394 * Register the EMT R0 logger instance for VCPU 0.
395 */
396 PVMCPU pVCpu = &pVM->aCpus[0];
397
398 PVMMR0LOGGER pR0Logger = pVCpu->vmm.s.pR0LoggerR0;
399 if (pR0Logger)
400 {
401# if 0 /* testing of the logger. */
402 LogCom(("vmmR0InitVM: before %p\n", RTLogDefaultInstance()));
403 LogCom(("vmmR0InitVM: pfnFlush=%p actual=%p\n", pR0Logger->Logger.pfnFlush, vmmR0LoggerFlush));
404 LogCom(("vmmR0InitVM: pfnLogger=%p actual=%p\n", pR0Logger->Logger.pfnLogger, vmmR0LoggerWrapper));
405 LogCom(("vmmR0InitVM: offScratch=%d fFlags=%#x fDestFlags=%#x\n", pR0Logger->Logger.offScratch, pR0Logger->Logger.fFlags, pR0Logger->Logger.fDestFlags));
406
407 RTLogSetDefaultInstanceThread(&pR0Logger->Logger, (uintptr_t)pVM->pSession);
408 LogCom(("vmmR0InitVM: after %p reg\n", RTLogDefaultInstance()));
409 RTLogSetDefaultInstanceThread(NULL, pVM->pSession);
410 LogCom(("vmmR0InitVM: after %p dereg\n", RTLogDefaultInstance()));
411
412 pR0Logger->Logger.pfnLogger("hello ring-0 logger\n");
413 LogCom(("vmmR0InitVM: returned successfully from direct logger call.\n"));
414 pR0Logger->Logger.pfnFlush(&pR0Logger->Logger);
415 LogCom(("vmmR0InitVM: returned successfully from direct flush call.\n"));
416
417 RTLogSetDefaultInstanceThread(&pR0Logger->Logger, (uintptr_t)pVM->pSession);
418 LogCom(("vmmR0InitVM: after %p reg2\n", RTLogDefaultInstance()));
419 pR0Logger->Logger.pfnLogger("hello ring-0 logger\n");
420 LogCom(("vmmR0InitVM: returned successfully from direct logger call (2). offScratch=%d\n", pR0Logger->Logger.offScratch));
421 RTLogSetDefaultInstanceThread(NULL, pVM->pSession);
422 LogCom(("vmmR0InitVM: after %p dereg2\n", RTLogDefaultInstance()));
423
424 RTLogLoggerEx(&pR0Logger->Logger, 0, ~0U, "hello ring-0 logger (RTLogLoggerEx)\n");
425 LogCom(("vmmR0InitVM: RTLogLoggerEx returned fine offScratch=%d\n", pR0Logger->Logger.offScratch));
426
427 RTLogSetDefaultInstanceThread(&pR0Logger->Logger, (uintptr_t)pVM->pSession);
428 RTLogPrintf("hello ring-0 logger (RTLogPrintf)\n");
429 LogCom(("vmmR0InitVM: RTLogPrintf returned fine offScratch=%d\n", pR0Logger->Logger.offScratch));
430# endif
431 Log(("Switching to per-thread logging instance %p (key=%p)\n", &pR0Logger->Logger, pVM->pSession));
432 RTLogSetDefaultInstanceThread(&pR0Logger->Logger, (uintptr_t)pVM->pSession);
433 pR0Logger->fRegistered = true;
434 }
435#endif /* LOG_ENABLED */
436
437 /*
438 * Check if the host supports high resolution timers or not.
439 */
440 if ( pVM->vmm.s.fUsePeriodicPreemptionTimers
441 && !RTTimerCanDoHighResolution())
442 pVM->vmm.s.fUsePeriodicPreemptionTimers = false;
443
444 /*
445 * Initialize the per VM data for GVMM and GMM.
446 */
447 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
448 rc = GVMMR0InitVM(pGVM);
449// if (RT_SUCCESS(rc))
450// rc = GMMR0InitPerVMData(pVM);
451 if (RT_SUCCESS(rc))
452 {
453 /*
454 * Init HM, CPUM and PGM (Darwin only).
455 */
456 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
457 rc = HMR0InitVM(pVM);
458 if (RT_SUCCESS(rc))
459 VMM_CHECK_SMAP_CHECK2(pVM, rc = VERR_VMM_RING0_ASSERTION); /* CPUR0InitVM will otherwise panic the host */
460 if (RT_SUCCESS(rc))
461 {
462 rc = CPUMR0InitVM(pVM);
463 if (RT_SUCCESS(rc))
464 {
465 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
466#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
467 rc = PGMR0DynMapInitVM(pVM);
468#endif
469 if (RT_SUCCESS(rc))
470 {
471 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
472 rc = EMR0InitVM(pGVM, pVM);
473 if (RT_SUCCESS(rc))
474 {
475 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
476#ifdef VBOX_WITH_PCI_PASSTHROUGH
477 rc = PciRawR0InitVM(pGVM, pVM);
478#endif
479 if (RT_SUCCESS(rc))
480 {
481 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
482 rc = GIMR0InitVM(pVM);
483 if (RT_SUCCESS(rc))
484 {
485 VMM_CHECK_SMAP_CHECK2(pVM, rc = VERR_VMM_RING0_ASSERTION);
486 if (RT_SUCCESS(rc))
487 {
488 GVMMR0DoneInitVM(pGVM);
489
490 /*
491 * Collect a bit of info for the VM release log.
492 */
493 pVM->vmm.s.fIsPreemptPendingApiTrusty = RTThreadPreemptIsPendingTrusty();
494 pVM->vmm.s.fIsPreemptPossible = RTThreadPreemptIsPossible();;
495
496 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
497 return rc;
498 }
499
500 /* bail out*/
501 GIMR0TermVM(pVM);
502 }
503#ifdef VBOX_WITH_PCI_PASSTHROUGH
504 PciRawR0TermVM(pGVM, pVM);
505#endif
506 }
507 }
508 }
509 }
510 HMR0TermVM(pVM);
511 }
512 }
513
514 RTLogSetDefaultInstanceThread(NULL, (uintptr_t)pVM->pSession);
515 return rc;
516}
517
518
519/**
520 * Does EMT specific VM initialization.
521 *
522 * @returns VBox status code.
523 * @param pGVM The ring-0 VM structure.
524 * @param pVM The cross context VM structure.
525 * @param idCpu The EMT that's calling.
526 */
527static int vmmR0InitVMEmt(PGVM pGVM, PVM pVM, VMCPUID idCpu)
528{
529 /* Paranoia (caller checked these already). */
530 AssertReturn(idCpu < pGVM->cCpus, VERR_INVALID_CPU_ID);
531 AssertReturn(pGVM->aCpus[idCpu].hEMT == RTThreadNativeSelf(), VERR_INVALID_CPU_ID);
532
533#ifdef LOG_ENABLED
534 /*
535 * Registration of ring 0 loggers.
536 */
537 PVMCPU pVCpu = &pVM->aCpus[idCpu];
538 PVMMR0LOGGER pR0Logger = pVCpu->vmm.s.pR0LoggerR0;
539 if ( pR0Logger
540 && !pR0Logger->fRegistered)
541 {
542 RTLogSetDefaultInstanceThread(&pR0Logger->Logger, (uintptr_t)pVM->pSession);
543 pR0Logger->fRegistered = true;
544 }
545#endif
546 RT_NOREF(pVM);
547
548 return VINF_SUCCESS;
549}
550
551
552
553/**
554 * Terminates the R0 bits for a particular VM instance.
555 *
556 * This is normally called by ring-3 as part of the VM termination process, but
557 * may alternatively be called during the support driver session cleanup when
558 * the VM object is destroyed (see GVMM).
559 *
560 * @returns VBox status code.
561 *
562 * @param pGVM The global (ring-0) VM structure.
563 * @param pVM The cross context VM structure.
564 * @param idCpu Set to 0 if EMT(0) or NIL_VMCPUID if session cleanup
565 * thread.
566 * @thread EMT(0) or session clean up thread.
567 */
568VMMR0_INT_DECL(int) VMMR0TermVM(PGVM pGVM, PVM pVM, VMCPUID idCpu)
569{
570 /*
571 * Check EMT(0) claim if we're called from userland.
572 */
573 if (idCpu != NIL_VMCPUID)
574 {
575 AssertReturn(idCpu == 0, VERR_INVALID_CPU_ID);
576 int rc = GVMMR0ValidateGVMandVMandEMT(pGVM, pVM, idCpu);
577 if (RT_FAILURE(rc))
578 return rc;
579 }
580
581#ifdef VBOX_WITH_PCI_PASSTHROUGH
582 PciRawR0TermVM(pGVM, pVM);
583#endif
584
585 /*
586 * Tell GVMM what we're up to and check that we only do this once.
587 */
588 if (GVMMR0DoingTermVM(pGVM))
589 {
590 GIMR0TermVM(pVM);
591
592 /** @todo I wish to call PGMR0PhysFlushHandyPages(pVM, &pVM->aCpus[idCpu])
593 * here to make sure we don't leak any shared pages if we crash... */
594#ifdef VBOX_WITH_2X_4GB_ADDR_SPACE
595 PGMR0DynMapTermVM(pVM);
596#endif
597 HMR0TermVM(pVM);
598 }
599
600 /*
601 * Deregister the logger.
602 */
603 RTLogSetDefaultInstanceThread(NULL, (uintptr_t)pVM->pSession);
604 return VINF_SUCCESS;
605}
606
607
608/**
609 * VMM ring-0 thread-context callback.
610 *
611 * This does common HM state updating and calls the HM-specific thread-context
612 * callback.
613 *
614 * @param enmEvent The thread-context event.
615 * @param pvUser Opaque pointer to the VMCPU.
616 *
617 * @thread EMT(pvUser)
618 */
619static DECLCALLBACK(void) vmmR0ThreadCtxCallback(RTTHREADCTXEVENT enmEvent, void *pvUser)
620{
621 PVMCPU pVCpu = (PVMCPU)pvUser;
622
623 switch (enmEvent)
624 {
625 case RTTHREADCTXEVENT_IN:
626 {
627 /*
628 * Linux may call us with preemption enabled (really!) but technically we
629 * cannot get preempted here, otherwise we end up in an infinite recursion
630 * scenario (i.e. preempted in resume hook -> preempt hook -> resume hook...
631 * ad infinitum). Let's just disable preemption for now...
632 */
633 /** @todo r=bird: I don't believe the above. The linux code is clearly enabling
634 * preemption after doing the callout (one or two functions up the
635 * call chain). */
636 /** @todo r=ramshankar: See @bugref{5313#c30}. */
637 RTTHREADPREEMPTSTATE ParanoidPreemptState = RTTHREADPREEMPTSTATE_INITIALIZER;
638 RTThreadPreemptDisable(&ParanoidPreemptState);
639
640 /* We need to update the VCPU <-> host CPU mapping. */
641 RTCPUID idHostCpu;
642 uint32_t iHostCpuSet = RTMpCurSetIndexAndId(&idHostCpu);
643 pVCpu->iHostCpuSet = iHostCpuSet;
644 ASMAtomicWriteU32(&pVCpu->idHostCpu, idHostCpu);
645
646 /* In the very unlikely event that the GIP delta for the CPU we're
647 rescheduled needs calculating, try force a return to ring-3.
648 We unfortunately cannot do the measurements right here. */
649 if (RT_UNLIKELY(SUPIsTscDeltaAvailableForCpuSetIndex(iHostCpuSet)))
650 VMCPU_FF_SET(pVCpu, VMCPU_FF_TO_R3);
651
652 /* Invoke the HM-specific thread-context callback. */
653 HMR0ThreadCtxCallback(enmEvent, pvUser);
654
655 /* Restore preemption. */
656 RTThreadPreemptRestore(&ParanoidPreemptState);
657 break;
658 }
659
660 case RTTHREADCTXEVENT_OUT:
661 {
662 /* Invoke the HM-specific thread-context callback. */
663 HMR0ThreadCtxCallback(enmEvent, pvUser);
664
665 /*
666 * Sigh. See VMMGetCpu() used by VMCPU_ASSERT_EMT(). We cannot let several VCPUs
667 * have the same host CPU associated with it.
668 */
669 pVCpu->iHostCpuSet = UINT32_MAX;
670 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
671 break;
672 }
673
674 default:
675 /* Invoke the HM-specific thread-context callback. */
676 HMR0ThreadCtxCallback(enmEvent, pvUser);
677 break;
678 }
679}
680
681
682/**
683 * Creates thread switching hook for the current EMT thread.
684 *
685 * This is called by GVMMR0CreateVM and GVMMR0RegisterVCpu. If the host
686 * platform does not implement switcher hooks, no hooks will be create and the
687 * member set to NIL_RTTHREADCTXHOOK.
688 *
689 * @returns VBox status code.
690 * @param pVCpu The cross context virtual CPU structure.
691 * @thread EMT(pVCpu)
692 */
693VMMR0_INT_DECL(int) VMMR0ThreadCtxHookCreateForEmt(PVMCPU pVCpu)
694{
695 VMCPU_ASSERT_EMT(pVCpu);
696 Assert(pVCpu->vmm.s.hCtxHook == NIL_RTTHREADCTXHOOK);
697
698#if 1 /* To disable this stuff change to zero. */
699 int rc = RTThreadCtxHookCreate(&pVCpu->vmm.s.hCtxHook, 0, vmmR0ThreadCtxCallback, pVCpu);
700 if (RT_SUCCESS(rc))
701 return rc;
702#else
703 RT_NOREF(vmmR0ThreadCtxCallback);
704 int rc = VERR_NOT_SUPPORTED;
705#endif
706
707 pVCpu->vmm.s.hCtxHook = NIL_RTTHREADCTXHOOK;
708 if (rc == VERR_NOT_SUPPORTED)
709 return VINF_SUCCESS;
710
711 LogRelMax(32, ("RTThreadCtxHookCreate failed! rc=%Rrc pVCpu=%p idCpu=%RU32\n", rc, pVCpu, pVCpu->idCpu));
712 return VINF_SUCCESS; /* Just ignore it, we can live without context hooks. */
713}
714
715
716/**
717 * Destroys the thread switching hook for the specified VCPU.
718 *
719 * @param pVCpu The cross context virtual CPU structure.
720 * @remarks Can be called from any thread.
721 */
722VMMR0_INT_DECL(void) VMMR0ThreadCtxHookDestroyForEmt(PVMCPU pVCpu)
723{
724 int rc = RTThreadCtxHookDestroy(pVCpu->vmm.s.hCtxHook);
725 AssertRC(rc);
726 pVCpu->vmm.s.hCtxHook = NIL_RTTHREADCTXHOOK;
727}
728
729
730/**
731 * Disables the thread switching hook for this VCPU (if we got one).
732 *
733 * @param pVCpu The cross context virtual CPU structure.
734 * @thread EMT(pVCpu)
735 *
736 * @remarks This also clears VMCPU::idHostCpu, so the mapping is invalid after
737 * this call. This means you have to be careful with what you do!
738 */
739VMMR0_INT_DECL(void) VMMR0ThreadCtxHookDisable(PVMCPU pVCpu)
740{
741 /*
742 * Clear the VCPU <-> host CPU mapping as we've left HM context.
743 * @bugref{7726#c19} explains the need for this trick:
744 *
745 * hmR0VmxCallRing3Callback/hmR0SvmCallRing3Callback &
746 * hmR0VmxLeaveSession/hmR0SvmLeaveSession disables context hooks during
747 * longjmp & normal return to ring-3, which opens a window where we may be
748 * rescheduled without changing VMCPUID::idHostCpu and cause confusion if
749 * the CPU starts executing a different EMT. Both functions first disables
750 * preemption and then calls HMR0LeaveCpu which invalids idHostCpu, leaving
751 * an opening for getting preempted.
752 */
753 /** @todo Make HM not need this API! Then we could leave the hooks enabled
754 * all the time. */
755 /** @todo move this into the context hook disabling if(). */
756 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
757
758 /*
759 * Disable the context hook, if we got one.
760 */
761 if (pVCpu->vmm.s.hCtxHook != NIL_RTTHREADCTXHOOK)
762 {
763 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
764 int rc = RTThreadCtxHookDisable(pVCpu->vmm.s.hCtxHook);
765 AssertRC(rc);
766 }
767}
768
769
770/**
771 * Internal version of VMMR0ThreadCtxHooksAreRegistered.
772 *
773 * @returns true if registered, false otherwise.
774 * @param pVCpu The cross context virtual CPU structure.
775 */
776DECLINLINE(bool) vmmR0ThreadCtxHookIsEnabled(PVMCPU pVCpu)
777{
778 return RTThreadCtxHookIsEnabled(pVCpu->vmm.s.hCtxHook);
779}
780
781
782/**
783 * Whether thread-context hooks are registered for this VCPU.
784 *
785 * @returns true if registered, false otherwise.
786 * @param pVCpu The cross context virtual CPU structure.
787 */
788VMMR0_INT_DECL(bool) VMMR0ThreadCtxHookIsEnabled(PVMCPU pVCpu)
789{
790 return vmmR0ThreadCtxHookIsEnabled(pVCpu);
791}
792
793
794#ifdef VBOX_WITH_STATISTICS
795/**
796 * Record return code statistics
797 * @param pVM The cross context VM structure.
798 * @param pVCpu The cross context virtual CPU structure.
799 * @param rc The status code.
800 */
801static void vmmR0RecordRC(PVM pVM, PVMCPU pVCpu, int rc)
802{
803 /*
804 * Collect statistics.
805 */
806 switch (rc)
807 {
808 case VINF_SUCCESS:
809 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetNormal);
810 break;
811 case VINF_EM_RAW_INTERRUPT:
812 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetInterrupt);
813 break;
814 case VINF_EM_RAW_INTERRUPT_HYPER:
815 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetInterruptHyper);
816 break;
817 case VINF_EM_RAW_GUEST_TRAP:
818 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetGuestTrap);
819 break;
820 case VINF_EM_RAW_RING_SWITCH:
821 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetRingSwitch);
822 break;
823 case VINF_EM_RAW_RING_SWITCH_INT:
824 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetRingSwitchInt);
825 break;
826 case VINF_EM_RAW_STALE_SELECTOR:
827 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetStaleSelector);
828 break;
829 case VINF_EM_RAW_IRET_TRAP:
830 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetIRETTrap);
831 break;
832 case VINF_IOM_R3_IOPORT_READ:
833 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetIORead);
834 break;
835 case VINF_IOM_R3_IOPORT_WRITE:
836 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetIOWrite);
837 break;
838 case VINF_IOM_R3_IOPORT_COMMIT_WRITE:
839 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetIOCommitWrite);
840 break;
841 case VINF_IOM_R3_MMIO_READ:
842 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIORead);
843 break;
844 case VINF_IOM_R3_MMIO_WRITE:
845 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIOWrite);
846 break;
847 case VINF_IOM_R3_MMIO_COMMIT_WRITE:
848 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIOCommitWrite);
849 break;
850 case VINF_IOM_R3_MMIO_READ_WRITE:
851 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIOReadWrite);
852 break;
853 case VINF_PATM_HC_MMIO_PATCH_READ:
854 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIOPatchRead);
855 break;
856 case VINF_PATM_HC_MMIO_PATCH_WRITE:
857 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMMIOPatchWrite);
858 break;
859 case VINF_CPUM_R3_MSR_READ:
860 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMSRRead);
861 break;
862 case VINF_CPUM_R3_MSR_WRITE:
863 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMSRWrite);
864 break;
865 case VINF_EM_RAW_EMULATE_INSTR:
866 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetEmulate);
867 break;
868 case VINF_PATCH_EMULATE_INSTR:
869 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchEmulate);
870 break;
871 case VINF_EM_RAW_EMULATE_INSTR_LDT_FAULT:
872 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetLDTFault);
873 break;
874 case VINF_EM_RAW_EMULATE_INSTR_GDT_FAULT:
875 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetGDTFault);
876 break;
877 case VINF_EM_RAW_EMULATE_INSTR_IDT_FAULT:
878 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetIDTFault);
879 break;
880 case VINF_EM_RAW_EMULATE_INSTR_TSS_FAULT:
881 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetTSSFault);
882 break;
883 case VINF_CSAM_PENDING_ACTION:
884 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetCSAMTask);
885 break;
886 case VINF_PGM_SYNC_CR3:
887 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetSyncCR3);
888 break;
889 case VINF_PATM_PATCH_INT3:
890 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchInt3);
891 break;
892 case VINF_PATM_PATCH_TRAP_PF:
893 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchPF);
894 break;
895 case VINF_PATM_PATCH_TRAP_GP:
896 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchGP);
897 break;
898 case VINF_PATM_PENDING_IRQ_AFTER_IRET:
899 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchIretIRQ);
900 break;
901 case VINF_EM_RESCHEDULE_REM:
902 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetRescheduleREM);
903 break;
904 case VINF_EM_RAW_TO_R3:
905 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Total);
906 if (VM_FF_IS_SET(pVM, VM_FF_TM_VIRTUAL_SYNC))
907 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3TMVirt);
908 else if (VM_FF_IS_SET(pVM, VM_FF_PGM_NEED_HANDY_PAGES))
909 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3HandyPages);
910 else if (VM_FF_IS_SET(pVM, VM_FF_PDM_QUEUES))
911 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3PDMQueues);
912 else if (VM_FF_IS_SET(pVM, VM_FF_EMT_RENDEZVOUS))
913 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Rendezvous);
914 else if (VM_FF_IS_SET(pVM, VM_FF_PDM_DMA))
915 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3DMA);
916 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TIMER))
917 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Timer);
918 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_PDM_CRITSECT))
919 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3CritSect);
920 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TO_R3))
921 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3FF);
922 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_IEM))
923 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Iem);
924 else if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_IOM))
925 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Iom);
926 else
927 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetToR3Unknown);
928 break;
929
930 case VINF_EM_RAW_TIMER_PENDING:
931 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetTimerPending);
932 break;
933 case VINF_EM_RAW_INTERRUPT_PENDING:
934 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetInterruptPending);
935 break;
936 case VINF_VMM_CALL_HOST:
937 switch (pVCpu->vmm.s.enmCallRing3Operation)
938 {
939 case VMMCALLRING3_PDM_CRIT_SECT_ENTER:
940 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPDMCritSectEnter);
941 break;
942 case VMMCALLRING3_PDM_LOCK:
943 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPDMLock);
944 break;
945 case VMMCALLRING3_PGM_POOL_GROW:
946 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPGMPoolGrow);
947 break;
948 case VMMCALLRING3_PGM_LOCK:
949 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPGMLock);
950 break;
951 case VMMCALLRING3_PGM_MAP_CHUNK:
952 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPGMMapChunk);
953 break;
954 case VMMCALLRING3_PGM_ALLOCATE_HANDY_PAGES:
955 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallPGMAllocHandy);
956 break;
957 case VMMCALLRING3_REM_REPLAY_HANDLER_NOTIFICATIONS:
958 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallRemReplay);
959 break;
960 case VMMCALLRING3_VMM_LOGGER_FLUSH:
961 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallLogFlush);
962 break;
963 case VMMCALLRING3_VM_SET_ERROR:
964 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallVMSetError);
965 break;
966 case VMMCALLRING3_VM_SET_RUNTIME_ERROR:
967 STAM_COUNTER_INC(&pVM->vmm.s.StatRZCallVMSetRuntimeError);
968 break;
969 case VMMCALLRING3_VM_R0_ASSERTION:
970 default:
971 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetCallRing3);
972 break;
973 }
974 break;
975 case VINF_PATM_DUPLICATE_FUNCTION:
976 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPATMDuplicateFn);
977 break;
978 case VINF_PGM_CHANGE_MODE:
979 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPGMChangeMode);
980 break;
981 case VINF_PGM_POOL_FLUSH_PENDING:
982 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPGMFlushPending);
983 break;
984 case VINF_EM_PENDING_REQUEST:
985 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPendingRequest);
986 break;
987 case VINF_EM_HM_PATCH_TPR_INSTR:
988 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetPatchTPR);
989 break;
990 default:
991 STAM_COUNTER_INC(&pVM->vmm.s.StatRZRetMisc);
992 break;
993 }
994}
995#endif /* VBOX_WITH_STATISTICS */
996
997
998/**
999 * The Ring 0 entry point, called by the fast-ioctl path.
1000 *
1001 * @param pGVM The global (ring-0) VM structure.
1002 * @param pVM The cross context VM structure.
1003 * The return code is stored in pVM->vmm.s.iLastGZRc.
1004 * @param idCpu The Virtual CPU ID of the calling EMT.
1005 * @param enmOperation Which operation to execute.
1006 * @remarks Assume called with interrupts _enabled_.
1007 */
1008VMMR0DECL(void) VMMR0EntryFast(PGVM pGVM, PVM pVM, VMCPUID idCpu, VMMR0OPERATION enmOperation)
1009{
1010 /*
1011 * Validation.
1012 */
1013 if ( idCpu < pGVM->cCpus
1014 && pGVM->cCpus == pVM->cCpus)
1015 { /*likely*/ }
1016 else
1017 {
1018 SUPR0Printf("VMMR0EntryFast: Bad idCpu=%#x cCpus=%#x/%#x\n", idCpu, pGVM->cCpus, pVM->cCpus);
1019 return;
1020 }
1021
1022 PGVMCPU pGVCpu = &pGVM->aCpus[idCpu];
1023 PVMCPU pVCpu = &pVM->aCpus[idCpu];
1024 RTNATIVETHREAD const hNativeThread = RTThreadNativeSelf();
1025 if (RT_LIKELY( pGVCpu->hEMT == hNativeThread
1026 && pVCpu->hNativeThreadR0 == hNativeThread))
1027 { /* likely */ }
1028 else
1029 {
1030 SUPR0Printf("VMMR0EntryFast: Bad thread idCpu=%#x hNativeSelf=%p pGVCpu->hEmt=%p pVCpu->hNativeThreadR0=%p\n",
1031 idCpu, hNativeThread, pGVCpu->hEMT, pVCpu->hNativeThreadR0);
1032 return;
1033 }
1034
1035 /*
1036 * SMAP fun.
1037 */
1038 VMM_CHECK_SMAP_SETUP();
1039 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1040
1041 /*
1042 * Perform requested operation.
1043 */
1044 switch (enmOperation)
1045 {
1046 /*
1047 * Switch to GC and run guest raw mode code.
1048 * Disable interrupts before doing the world switch.
1049 */
1050 case VMMR0_DO_RAW_RUN:
1051 {
1052#ifdef VBOX_WITH_RAW_MODE
1053# ifndef VBOX_WITH_2X_4GB_ADDR_SPACE_IN_R0
1054 /* Some safety precautions first. */
1055 if (RT_UNLIKELY(!PGMGetHyperCR3(pVCpu)))
1056 {
1057 pVCpu->vmm.s.iLastGZRc = VERR_PGM_NO_CR3_SHADOW_ROOT;
1058 break;
1059 }
1060# endif
1061 if (RT_SUCCESS(g_rcRawModeUsability))
1062 { /* likely */ }
1063 else
1064 {
1065 pVCpu->vmm.s.iLastGZRc = g_rcRawModeUsability;
1066 break;
1067 }
1068
1069 /*
1070 * Disable preemption.
1071 */
1072 RTTHREADPREEMPTSTATE PreemptState = RTTHREADPREEMPTSTATE_INITIALIZER;
1073 RTThreadPreemptDisable(&PreemptState);
1074
1075 /*
1076 * Get the host CPU identifiers, make sure they are valid and that
1077 * we've got a TSC delta for the CPU.
1078 */
1079 RTCPUID idHostCpu;
1080 uint32_t iHostCpuSet = RTMpCurSetIndexAndId(&idHostCpu);
1081 if (RT_LIKELY( iHostCpuSet < RTCPUSET_MAX_CPUS
1082 && SUPIsTscDeltaAvailableForCpuSetIndex(iHostCpuSet)))
1083 {
1084 /*
1085 * Commit the CPU identifiers and update the periodict preemption timer if it's active.
1086 */
1087# ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
1088 CPUMR0SetLApic(pVCpu, iHostCpuSet);
1089# endif
1090 pVCpu->iHostCpuSet = iHostCpuSet;
1091 ASMAtomicWriteU32(&pVCpu->idHostCpu, idHostCpu);
1092
1093 if (pVM->vmm.s.fUsePeriodicPreemptionTimers)
1094 GVMMR0SchedUpdatePeriodicPreemptionTimer(pVM, pVCpu->idHostCpu, TMCalcHostTimerFrequency(pVM, pVCpu));
1095
1096 /*
1097 * We might need to disable VT-x if the active switcher turns off paging.
1098 */
1099 bool fVTxDisabled;
1100 int rc = HMR0EnterSwitcher(pVM, pVM->vmm.s.enmSwitcher, &fVTxDisabled);
1101 if (RT_SUCCESS(rc))
1102 {
1103 /*
1104 * Disable interrupts and run raw-mode code. The loop is for efficiently
1105 * dispatching tracepoints that fired in raw-mode context.
1106 */
1107 RTCCUINTREG uFlags = ASMIntDisableFlags();
1108
1109 for (;;)
1110 {
1111 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_EXEC);
1112 TMNotifyStartOfExecution(pVCpu);
1113
1114 rc = pVM->vmm.s.pfnR0ToRawMode(pVM);
1115 pVCpu->vmm.s.iLastGZRc = rc;
1116
1117 TMNotifyEndOfExecution(pVCpu);
1118 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED);
1119
1120 if (rc != VINF_VMM_CALL_TRACER)
1121 break;
1122 SUPR0TracerUmodProbeFire(pVM->pSession, &pVCpu->vmm.s.TracerCtx);
1123 }
1124
1125 /*
1126 * Re-enable VT-x before we dispatch any pending host interrupts and
1127 * re-enables interrupts.
1128 */
1129 HMR0LeaveSwitcher(pVM, fVTxDisabled);
1130
1131 if ( rc == VINF_EM_RAW_INTERRUPT
1132 || rc == VINF_EM_RAW_INTERRUPT_HYPER)
1133 TRPMR0DispatchHostInterrupt(pVM);
1134
1135 ASMSetFlags(uFlags);
1136
1137 /* Fire dtrace probe and collect statistics. */
1138 VBOXVMM_R0_VMM_RETURN_TO_RING3_RC(pVCpu, CPUMQueryGuestCtxPtr(pVCpu), rc);
1139# ifdef VBOX_WITH_STATISTICS
1140 STAM_COUNTER_INC(&pVM->vmm.s.StatRunRC);
1141 vmmR0RecordRC(pVM, pVCpu, rc);
1142# endif
1143 }
1144 else
1145 pVCpu->vmm.s.iLastGZRc = rc;
1146
1147 /*
1148 * Invalidate the host CPU identifiers as we restore preemption.
1149 */
1150 pVCpu->iHostCpuSet = UINT32_MAX;
1151 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1152
1153 RTThreadPreemptRestore(&PreemptState);
1154 }
1155 /*
1156 * Invalid CPU set index or TSC delta in need of measuring.
1157 */
1158 else
1159 {
1160 RTThreadPreemptRestore(&PreemptState);
1161 if (iHostCpuSet < RTCPUSET_MAX_CPUS)
1162 {
1163 int rc = SUPR0TscDeltaMeasureBySetIndex(pVM->pSession, iHostCpuSet, 0 /*fFlags*/,
1164 2 /*cMsWaitRetry*/, 5*RT_MS_1SEC /*cMsWaitThread*/,
1165 0 /*default cTries*/);
1166 if (RT_SUCCESS(rc) || rc == VERR_CPU_OFFLINE)
1167 pVCpu->vmm.s.iLastGZRc = VINF_EM_RAW_TO_R3;
1168 else
1169 pVCpu->vmm.s.iLastGZRc = rc;
1170 }
1171 else
1172 pVCpu->vmm.s.iLastGZRc = VERR_INVALID_CPU_INDEX;
1173 }
1174
1175#else /* !VBOX_WITH_RAW_MODE */
1176 pVCpu->vmm.s.iLastGZRc = VERR_RAW_MODE_NOT_SUPPORTED;
1177#endif
1178 break;
1179 }
1180
1181 /*
1182 * Run guest code using the available hardware acceleration technology.
1183 */
1184 case VMMR0_DO_HM_RUN:
1185 {
1186 /*
1187 * Disable preemption.
1188 */
1189 Assert(!vmmR0ThreadCtxHookIsEnabled(pVCpu));
1190 RTTHREADPREEMPTSTATE PreemptState = RTTHREADPREEMPTSTATE_INITIALIZER;
1191 RTThreadPreemptDisable(&PreemptState);
1192
1193 /*
1194 * Get the host CPU identifiers, make sure they are valid and that
1195 * we've got a TSC delta for the CPU.
1196 */
1197 RTCPUID idHostCpu;
1198 uint32_t iHostCpuSet = RTMpCurSetIndexAndId(&idHostCpu);
1199 if (RT_LIKELY( iHostCpuSet < RTCPUSET_MAX_CPUS
1200 && SUPIsTscDeltaAvailableForCpuSetIndex(iHostCpuSet)))
1201 {
1202 pVCpu->iHostCpuSet = iHostCpuSet;
1203 ASMAtomicWriteU32(&pVCpu->idHostCpu, idHostCpu);
1204
1205 /*
1206 * Update the periodic preemption timer if it's active.
1207 */
1208 if (pVM->vmm.s.fUsePeriodicPreemptionTimers)
1209 GVMMR0SchedUpdatePeriodicPreemptionTimer(pVM, pVCpu->idHostCpu, TMCalcHostTimerFrequency(pVM, pVCpu));
1210 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1211
1212#ifdef VMM_R0_TOUCH_FPU
1213 /*
1214 * Make sure we've got the FPU state loaded so and we don't need to clear
1215 * CR0.TS and get out of sync with the host kernel when loading the guest
1216 * FPU state. @ref sec_cpum_fpu (CPUM.cpp) and @bugref{4053}.
1217 */
1218 CPUMR0TouchHostFpu();
1219#endif
1220 int rc;
1221 bool fPreemptRestored = false;
1222 if (!HMR0SuspendPending())
1223 {
1224 /*
1225 * Enable the context switching hook.
1226 */
1227 if (pVCpu->vmm.s.hCtxHook != NIL_RTTHREADCTXHOOK)
1228 {
1229 Assert(!RTThreadCtxHookIsEnabled(pVCpu->vmm.s.hCtxHook));
1230 int rc2 = RTThreadCtxHookEnable(pVCpu->vmm.s.hCtxHook); AssertRC(rc2);
1231 }
1232
1233 /*
1234 * Enter HM context.
1235 */
1236 rc = HMR0Enter(pVCpu);
1237 if (RT_SUCCESS(rc))
1238 {
1239 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED_HM);
1240
1241 /*
1242 * When preemption hooks are in place, enable preemption now that
1243 * we're in HM context.
1244 */
1245 if (vmmR0ThreadCtxHookIsEnabled(pVCpu))
1246 {
1247 fPreemptRestored = true;
1248 RTThreadPreemptRestore(&PreemptState);
1249 }
1250
1251 /*
1252 * Setup the longjmp machinery and execute guest code (calls HMR0RunGuestCode).
1253 */
1254 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1255 rc = vmmR0CallRing3SetJmp(&pVCpu->vmm.s.CallRing3JmpBufR0, HMR0RunGuestCode, pVM, pVCpu);
1256 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1257
1258 /*
1259 * Assert sanity on the way out. Using manual assertions code here as normal
1260 * assertions are going to panic the host since we're outside the setjmp/longjmp zone.
1261 */
1262 if (RT_UNLIKELY( VMCPU_GET_STATE(pVCpu) != VMCPUSTATE_STARTED_HM
1263 && RT_SUCCESS_NP(rc) && rc != VINF_VMM_CALL_HOST ))
1264 {
1265 pVM->vmm.s.szRing0AssertMsg1[0] = '\0';
1266 RTStrPrintf(pVM->vmm.s.szRing0AssertMsg2, sizeof(pVM->vmm.s.szRing0AssertMsg2),
1267 "Got VMCPU state %d expected %d.\n", VMCPU_GET_STATE(pVCpu), VMCPUSTATE_STARTED_HM);
1268 rc = VERR_VMM_WRONG_HM_VMCPU_STATE;
1269 }
1270 /** @todo Get rid of this. HM shouldn't disable the context hook. */
1271 else if (RT_UNLIKELY(vmmR0ThreadCtxHookIsEnabled(pVCpu)))
1272 {
1273 pVM->vmm.s.szRing0AssertMsg1[0] = '\0';
1274 RTStrPrintf(pVM->vmm.s.szRing0AssertMsg2, sizeof(pVM->vmm.s.szRing0AssertMsg2),
1275 "Thread-context hooks still enabled! VCPU=%p Id=%u rc=%d.\n", pVCpu, pVCpu->idCpu, rc);
1276 rc = VERR_INVALID_STATE;
1277 }
1278
1279 VMCPU_SET_STATE(pVCpu, VMCPUSTATE_STARTED);
1280 }
1281 STAM_COUNTER_INC(&pVM->vmm.s.StatRunRC);
1282
1283 /*
1284 * Invalidate the host CPU identifiers before we disable the context
1285 * hook / restore preemption.
1286 */
1287 pVCpu->iHostCpuSet = UINT32_MAX;
1288 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1289
1290 /*
1291 * Disable context hooks. Due to unresolved cleanup issues, we
1292 * cannot leave the hooks enabled when we return to ring-3.
1293 *
1294 * Note! At the moment HM may also have disabled the hook
1295 * when we get here, but the IPRT API handles that.
1296 */
1297 if (pVCpu->vmm.s.hCtxHook != NIL_RTTHREADCTXHOOK)
1298 {
1299 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1300 RTThreadCtxHookDisable(pVCpu->vmm.s.hCtxHook);
1301 }
1302 }
1303 /*
1304 * The system is about to go into suspend mode; go back to ring 3.
1305 */
1306 else
1307 {
1308 rc = VINF_EM_RAW_INTERRUPT;
1309 pVCpu->iHostCpuSet = UINT32_MAX;
1310 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1311 }
1312
1313 /** @todo When HM stops messing with the context hook state, we'll disable
1314 * preemption again before the RTThreadCtxHookDisable call. */
1315 if (!fPreemptRestored)
1316 RTThreadPreemptRestore(&PreemptState);
1317
1318 pVCpu->vmm.s.iLastGZRc = rc;
1319
1320 /* Fire dtrace probe and collect statistics. */
1321 VBOXVMM_R0_VMM_RETURN_TO_RING3_HM(pVCpu, CPUMQueryGuestCtxPtr(pVCpu), rc);
1322#ifdef VBOX_WITH_STATISTICS
1323 vmmR0RecordRC(pVM, pVCpu, rc);
1324#endif
1325 }
1326 /*
1327 * Invalid CPU set index or TSC delta in need of measuring.
1328 */
1329 else
1330 {
1331 pVCpu->iHostCpuSet = UINT32_MAX;
1332 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1333 RTThreadPreemptRestore(&PreemptState);
1334 if (iHostCpuSet < RTCPUSET_MAX_CPUS)
1335 {
1336 int rc = SUPR0TscDeltaMeasureBySetIndex(pVM->pSession, iHostCpuSet, 0 /*fFlags*/,
1337 2 /*cMsWaitRetry*/, 5*RT_MS_1SEC /*cMsWaitThread*/,
1338 0 /*default cTries*/);
1339 if (RT_SUCCESS(rc) || rc == VERR_CPU_OFFLINE)
1340 pVCpu->vmm.s.iLastGZRc = VINF_EM_RAW_TO_R3;
1341 else
1342 pVCpu->vmm.s.iLastGZRc = rc;
1343 }
1344 else
1345 pVCpu->vmm.s.iLastGZRc = VERR_INVALID_CPU_INDEX;
1346 }
1347 break;
1348 }
1349
1350#ifdef VBOX_WITH_NEM_R0
1351# if defined(RT_ARCH_AMD64) && defined(RT_OS_WINDOWS)
1352 case VMMR0_DO_NEM_RUN:
1353 {
1354 /*
1355 * Setup the longjmp machinery and execute guest code (calls NEMR0RunGuestCode).
1356 */
1357 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1358 int rc = vmmR0CallRing3SetJmp2(&pVCpu->vmm.s.CallRing3JmpBufR0, NEMR0RunGuestCode, pGVM, idCpu);
1359 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1360 STAM_COUNTER_INC(&pVM->vmm.s.StatRunRC);
1361
1362 pVCpu->vmm.s.iLastGZRc = rc;
1363
1364 /*
1365 * Fire dtrace probe and collect statistics.
1366 */
1367 VBOXVMM_R0_VMM_RETURN_TO_RING3_NEM(pVCpu, CPUMQueryGuestCtxPtr(pVCpu), rc);
1368# ifdef VBOX_WITH_STATISTICS
1369 vmmR0RecordRC(pVM, pVCpu, rc);
1370# endif
1371 break;
1372 }
1373# endif
1374#endif
1375
1376
1377 /*
1378 * For profiling.
1379 */
1380 case VMMR0_DO_NOP:
1381 pVCpu->vmm.s.iLastGZRc = VINF_SUCCESS;
1382 break;
1383
1384 /*
1385 * Shouldn't happen.
1386 */
1387 default:
1388 AssertMsgFailed(("%#x\n", enmOperation));
1389 pVCpu->vmm.s.iLastGZRc = VERR_NOT_SUPPORTED;
1390 break;
1391 }
1392 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1393}
1394
1395
1396/**
1397 * Validates a session or VM session argument.
1398 *
1399 * @returns true / false accordingly.
1400 * @param pVM The cross context VM structure.
1401 * @param pClaimedSession The session claim to validate.
1402 * @param pSession The session argument.
1403 */
1404DECLINLINE(bool) vmmR0IsValidSession(PVM pVM, PSUPDRVSESSION pClaimedSession, PSUPDRVSESSION pSession)
1405{
1406 /* This must be set! */
1407 if (!pSession)
1408 return false;
1409
1410 /* Only one out of the two. */
1411 if (pVM && pClaimedSession)
1412 return false;
1413 if (pVM)
1414 pClaimedSession = pVM->pSession;
1415 return pClaimedSession == pSession;
1416}
1417
1418
1419/**
1420 * VMMR0EntryEx worker function, either called directly or when ever possible
1421 * called thru a longjmp so we can exit safely on failure.
1422 *
1423 * @returns VBox status code.
1424 * @param pGVM The global (ring-0) VM structure.
1425 * @param pVM The cross context VM structure.
1426 * @param idCpu Virtual CPU ID argument. Must be NIL_VMCPUID if pVM
1427 * is NIL_RTR0PTR, and may be NIL_VMCPUID if it isn't
1428 * @param enmOperation Which operation to execute.
1429 * @param pReqHdr This points to a SUPVMMR0REQHDR packet. Optional.
1430 * The support driver validates this if it's present.
1431 * @param u64Arg Some simple constant argument.
1432 * @param pSession The session of the caller.
1433 *
1434 * @remarks Assume called with interrupts _enabled_.
1435 */
1436static int vmmR0EntryExWorker(PGVM pGVM, PVM pVM, VMCPUID idCpu, VMMR0OPERATION enmOperation,
1437 PSUPVMMR0REQHDR pReqHdr, uint64_t u64Arg, PSUPDRVSESSION pSession)
1438{
1439 /*
1440 * Validate pGVM, pVM and idCpu for consistency and validity.
1441 */
1442 if ( pGVM != NULL
1443 || pVM != NULL)
1444 {
1445 if (RT_LIKELY( RT_VALID_PTR(pGVM)
1446 && RT_VALID_PTR(pVM)
1447 && ((uintptr_t)pVM & PAGE_OFFSET_MASK) == 0))
1448 { /* likely */ }
1449 else
1450 {
1451 SUPR0Printf("vmmR0EntryExWorker: Invalid pGVM=%p and/or pVM=%p! (op=%d)\n", pGVM, pVM, enmOperation);
1452 return VERR_INVALID_POINTER;
1453 }
1454
1455 if (RT_LIKELY(pGVM->pVM == pVM))
1456 { /* likely */ }
1457 else
1458 {
1459 SUPR0Printf("vmmR0EntryExWorker: pVM mismatch: got %p, pGVM->pVM=%p\n", pVM, pGVM->pVM);
1460 return VERR_INVALID_PARAMETER;
1461 }
1462
1463 if (RT_LIKELY(idCpu == NIL_VMCPUID || idCpu < pGVM->cCpus))
1464 { /* likely */ }
1465 else
1466 {
1467 SUPR0Printf("vmmR0EntryExWorker: Invalid idCpu %#x (cCpus=%#x)\n", idCpu, pGVM->cCpus);
1468 return VERR_INVALID_PARAMETER;
1469 }
1470
1471 if (RT_LIKELY( pVM->enmVMState >= VMSTATE_CREATING
1472 && pVM->enmVMState <= VMSTATE_TERMINATED
1473 && pVM->cCpus == pGVM->cCpus
1474 && pVM->pSession == pSession
1475 && pVM->pVMR0 == pVM))
1476 { /* likely */ }
1477 else
1478 {
1479 SUPR0Printf("vmmR0EntryExWorker: Invalid pVM=%p:{.enmVMState=%d, .cCpus=%#x(==%#x), .pSession=%p(==%p), .pVMR0=%p(==%p)}! (op=%d)\n",
1480 pVM, pVM->enmVMState, pVM->cCpus, pGVM->cCpus, pVM->pSession, pSession, pVM->pVMR0, pVM, enmOperation);
1481 return VERR_INVALID_POINTER;
1482 }
1483 }
1484 else if (RT_LIKELY(idCpu == NIL_VMCPUID))
1485 { /* likely */ }
1486 else
1487 {
1488 SUPR0Printf("vmmR0EntryExWorker: Invalid idCpu=%u\n", idCpu);
1489 return VERR_INVALID_PARAMETER;
1490 }
1491
1492 /*
1493 * SMAP fun.
1494 */
1495 VMM_CHECK_SMAP_SETUP();
1496 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
1497
1498 /*
1499 * Process the request.
1500 */
1501 int rc;
1502 switch (enmOperation)
1503 {
1504 /*
1505 * GVM requests
1506 */
1507 case VMMR0_DO_GVMM_CREATE_VM:
1508 if (pGVM == NULL && pVM == NULL && u64Arg == 0 && idCpu == NIL_VMCPUID)
1509 rc = GVMMR0CreateVMReq((PGVMMCREATEVMREQ)pReqHdr, pSession);
1510 else
1511 rc = VERR_INVALID_PARAMETER;
1512 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
1513 break;
1514
1515 case VMMR0_DO_GVMM_DESTROY_VM:
1516 if (pReqHdr == NULL && u64Arg == 0)
1517 rc = GVMMR0DestroyVM(pGVM, pVM);
1518 else
1519 rc = VERR_INVALID_PARAMETER;
1520 VMM_CHECK_SMAP_CHECK(RT_NOTHING);
1521 break;
1522
1523 case VMMR0_DO_GVMM_REGISTER_VMCPU:
1524 if (pGVM != NULL && pVM != NULL)
1525 rc = GVMMR0RegisterVCpu(pGVM, pVM, idCpu);
1526 else
1527 rc = VERR_INVALID_PARAMETER;
1528 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1529 break;
1530
1531 case VMMR0_DO_GVMM_DEREGISTER_VMCPU:
1532 if (pGVM != NULL && pVM != NULL)
1533 rc = GVMMR0DeregisterVCpu(pGVM, pVM, idCpu);
1534 else
1535 rc = VERR_INVALID_PARAMETER;
1536 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1537 break;
1538
1539 case VMMR0_DO_GVMM_SCHED_HALT:
1540 if (pReqHdr)
1541 return VERR_INVALID_PARAMETER;
1542 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1543 rc = GVMMR0SchedHalt(pGVM, pVM, idCpu, u64Arg);
1544 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1545 break;
1546
1547 case VMMR0_DO_GVMM_SCHED_WAKE_UP:
1548 if (pReqHdr || u64Arg)
1549 return VERR_INVALID_PARAMETER;
1550 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1551 rc = GVMMR0SchedWakeUp(pGVM, pVM, idCpu);
1552 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1553 break;
1554
1555 case VMMR0_DO_GVMM_SCHED_POKE:
1556 if (pReqHdr || u64Arg)
1557 return VERR_INVALID_PARAMETER;
1558 rc = GVMMR0SchedPoke(pGVM, pVM, idCpu);
1559 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1560 break;
1561
1562 case VMMR0_DO_GVMM_SCHED_WAKE_UP_AND_POKE_CPUS:
1563 if (u64Arg)
1564 return VERR_INVALID_PARAMETER;
1565 rc = GVMMR0SchedWakeUpAndPokeCpusReq(pGVM, pVM, (PGVMMSCHEDWAKEUPANDPOKECPUSREQ)pReqHdr);
1566 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1567 break;
1568
1569 case VMMR0_DO_GVMM_SCHED_POLL:
1570 if (pReqHdr || u64Arg > 1)
1571 return VERR_INVALID_PARAMETER;
1572 rc = GVMMR0SchedPoll(pGVM, pVM, idCpu, !!u64Arg);
1573 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1574 break;
1575
1576 case VMMR0_DO_GVMM_QUERY_STATISTICS:
1577 if (u64Arg)
1578 return VERR_INVALID_PARAMETER;
1579 rc = GVMMR0QueryStatisticsReq(pGVM, pVM, (PGVMMQUERYSTATISTICSSREQ)pReqHdr, pSession);
1580 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1581 break;
1582
1583 case VMMR0_DO_GVMM_RESET_STATISTICS:
1584 if (u64Arg)
1585 return VERR_INVALID_PARAMETER;
1586 rc = GVMMR0ResetStatisticsReq(pGVM, pVM, (PGVMMRESETSTATISTICSSREQ)pReqHdr, pSession);
1587 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1588 break;
1589
1590 /*
1591 * Initialize the R0 part of a VM instance.
1592 */
1593 case VMMR0_DO_VMMR0_INIT:
1594 rc = vmmR0InitVM(pGVM, pVM, RT_LODWORD(u64Arg), RT_HIDWORD(u64Arg));
1595 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1596 break;
1597
1598 /*
1599 * Does EMT specific ring-0 init.
1600 */
1601 case VMMR0_DO_VMMR0_INIT_EMT:
1602 rc = vmmR0InitVMEmt(pGVM, pVM, idCpu);
1603 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1604 break;
1605
1606 /*
1607 * Terminate the R0 part of a VM instance.
1608 */
1609 case VMMR0_DO_VMMR0_TERM:
1610 rc = VMMR0TermVM(pGVM, pVM, 0 /*idCpu*/);
1611 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1612 break;
1613
1614 /*
1615 * Attempt to enable hm mode and check the current setting.
1616 */
1617 case VMMR0_DO_HM_ENABLE:
1618 rc = HMR0EnableAllCpus(pVM);
1619 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1620 break;
1621
1622 /*
1623 * Setup the hardware accelerated session.
1624 */
1625 case VMMR0_DO_HM_SETUP_VM:
1626 rc = HMR0SetupVM(pVM);
1627 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1628 break;
1629
1630 /*
1631 * Switch to RC to execute Hypervisor function.
1632 */
1633 case VMMR0_DO_CALL_HYPERVISOR:
1634 {
1635#ifdef VBOX_WITH_RAW_MODE
1636 /*
1637 * Validate input / context.
1638 */
1639 if (RT_UNLIKELY(idCpu != 0))
1640 return VERR_INVALID_CPU_ID;
1641 if (RT_UNLIKELY(pVM->cCpus != 1))
1642 return VERR_INVALID_PARAMETER;
1643 PVMCPU pVCpu = &pVM->aCpus[idCpu];
1644# ifndef VBOX_WITH_2X_4GB_ADDR_SPACE_IN_R0
1645 if (RT_UNLIKELY(!PGMGetHyperCR3(pVCpu)))
1646 return VERR_PGM_NO_CR3_SHADOW_ROOT;
1647# endif
1648 if (RT_FAILURE(g_rcRawModeUsability))
1649 return g_rcRawModeUsability;
1650
1651 /*
1652 * Disable interrupts.
1653 */
1654 RTCCUINTREG fFlags = ASMIntDisableFlags();
1655
1656 /*
1657 * Get the host CPU identifiers, make sure they are valid and that
1658 * we've got a TSC delta for the CPU.
1659 */
1660 RTCPUID idHostCpu;
1661 uint32_t iHostCpuSet = RTMpCurSetIndexAndId(&idHostCpu);
1662 if (RT_UNLIKELY(iHostCpuSet >= RTCPUSET_MAX_CPUS))
1663 {
1664 ASMSetFlags(fFlags);
1665 return VERR_INVALID_CPU_INDEX;
1666 }
1667 if (RT_UNLIKELY(!SUPIsTscDeltaAvailableForCpuSetIndex(iHostCpuSet)))
1668 {
1669 ASMSetFlags(fFlags);
1670 rc = SUPR0TscDeltaMeasureBySetIndex(pVM->pSession, iHostCpuSet, 0 /*fFlags*/,
1671 2 /*cMsWaitRetry*/, 5*RT_MS_1SEC /*cMsWaitThread*/,
1672 0 /*default cTries*/);
1673 if (RT_FAILURE(rc) && rc != VERR_CPU_OFFLINE)
1674 {
1675 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1676 return rc;
1677 }
1678 }
1679
1680 /*
1681 * Commit the CPU identifiers.
1682 */
1683# ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
1684 CPUMR0SetLApic(pVCpu, iHostCpuSet);
1685# endif
1686 pVCpu->iHostCpuSet = iHostCpuSet;
1687 ASMAtomicWriteU32(&pVCpu->idHostCpu, idHostCpu);
1688
1689 /*
1690 * We might need to disable VT-x if the active switcher turns off paging.
1691 */
1692 bool fVTxDisabled;
1693 rc = HMR0EnterSwitcher(pVM, pVM->vmm.s.enmSwitcher, &fVTxDisabled);
1694 if (RT_SUCCESS(rc))
1695 {
1696 /*
1697 * Go through the wormhole...
1698 */
1699 rc = pVM->vmm.s.pfnR0ToRawMode(pVM);
1700
1701 /*
1702 * Re-enable VT-x before we dispatch any pending host interrupts.
1703 */
1704 HMR0LeaveSwitcher(pVM, fVTxDisabled);
1705
1706 if ( rc == VINF_EM_RAW_INTERRUPT
1707 || rc == VINF_EM_RAW_INTERRUPT_HYPER)
1708 TRPMR0DispatchHostInterrupt(pVM);
1709 }
1710
1711 /*
1712 * Invalidate the host CPU identifiers as we restore interrupts.
1713 */
1714 pVCpu->iHostCpuSet = UINT32_MAX;
1715 ASMAtomicWriteU32(&pVCpu->idHostCpu, NIL_RTCPUID);
1716 ASMSetFlags(fFlags);
1717
1718#else /* !VBOX_WITH_RAW_MODE */
1719 rc = VERR_RAW_MODE_NOT_SUPPORTED;
1720#endif
1721 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1722 break;
1723 }
1724
1725 /*
1726 * PGM wrappers.
1727 */
1728 case VMMR0_DO_PGM_ALLOCATE_HANDY_PAGES:
1729 if (idCpu == NIL_VMCPUID)
1730 return VERR_INVALID_CPU_ID;
1731 rc = PGMR0PhysAllocateHandyPages(pGVM, pVM, idCpu);
1732 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1733 break;
1734
1735 case VMMR0_DO_PGM_FLUSH_HANDY_PAGES:
1736 if (idCpu == NIL_VMCPUID)
1737 return VERR_INVALID_CPU_ID;
1738 rc = PGMR0PhysFlushHandyPages(pGVM, pVM, idCpu);
1739 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1740 break;
1741
1742 case VMMR0_DO_PGM_ALLOCATE_LARGE_HANDY_PAGE:
1743 if (idCpu == NIL_VMCPUID)
1744 return VERR_INVALID_CPU_ID;
1745 rc = PGMR0PhysAllocateLargeHandyPage(pGVM, pVM, idCpu);
1746 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1747 break;
1748
1749 case VMMR0_DO_PGM_PHYS_SETUP_IOMMU:
1750 if (idCpu != 0)
1751 return VERR_INVALID_CPU_ID;
1752 rc = PGMR0PhysSetupIoMmu(pGVM, pVM);
1753 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1754 break;
1755
1756 /*
1757 * GMM wrappers.
1758 */
1759 case VMMR0_DO_GMM_INITIAL_RESERVATION:
1760 if (u64Arg)
1761 return VERR_INVALID_PARAMETER;
1762 rc = GMMR0InitialReservationReq(pGVM, pVM, idCpu, (PGMMINITIALRESERVATIONREQ)pReqHdr);
1763 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1764 break;
1765
1766 case VMMR0_DO_GMM_UPDATE_RESERVATION:
1767 if (u64Arg)
1768 return VERR_INVALID_PARAMETER;
1769 rc = GMMR0UpdateReservationReq(pGVM, pVM, idCpu, (PGMMUPDATERESERVATIONREQ)pReqHdr);
1770 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1771 break;
1772
1773 case VMMR0_DO_GMM_ALLOCATE_PAGES:
1774 if (u64Arg)
1775 return VERR_INVALID_PARAMETER;
1776 rc = GMMR0AllocatePagesReq(pGVM, pVM, idCpu, (PGMMALLOCATEPAGESREQ)pReqHdr);
1777 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1778 break;
1779
1780 case VMMR0_DO_GMM_FREE_PAGES:
1781 if (u64Arg)
1782 return VERR_INVALID_PARAMETER;
1783 rc = GMMR0FreePagesReq(pGVM, pVM, idCpu, (PGMMFREEPAGESREQ)pReqHdr);
1784 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1785 break;
1786
1787 case VMMR0_DO_GMM_FREE_LARGE_PAGE:
1788 if (u64Arg)
1789 return VERR_INVALID_PARAMETER;
1790 rc = GMMR0FreeLargePageReq(pGVM, pVM, idCpu, (PGMMFREELARGEPAGEREQ)pReqHdr);
1791 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1792 break;
1793
1794 case VMMR0_DO_GMM_QUERY_HYPERVISOR_MEM_STATS:
1795 if (u64Arg)
1796 return VERR_INVALID_PARAMETER;
1797 rc = GMMR0QueryHypervisorMemoryStatsReq((PGMMMEMSTATSREQ)pReqHdr);
1798 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1799 break;
1800
1801 case VMMR0_DO_GMM_QUERY_MEM_STATS:
1802 if (idCpu == NIL_VMCPUID)
1803 return VERR_INVALID_CPU_ID;
1804 if (u64Arg)
1805 return VERR_INVALID_PARAMETER;
1806 rc = GMMR0QueryMemoryStatsReq(pGVM, pVM, idCpu, (PGMMMEMSTATSREQ)pReqHdr);
1807 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1808 break;
1809
1810 case VMMR0_DO_GMM_BALLOONED_PAGES:
1811 if (u64Arg)
1812 return VERR_INVALID_PARAMETER;
1813 rc = GMMR0BalloonedPagesReq(pGVM, pVM, idCpu, (PGMMBALLOONEDPAGESREQ)pReqHdr);
1814 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1815 break;
1816
1817 case VMMR0_DO_GMM_MAP_UNMAP_CHUNK:
1818 if (u64Arg)
1819 return VERR_INVALID_PARAMETER;
1820 rc = GMMR0MapUnmapChunkReq(pGVM, pVM, (PGMMMAPUNMAPCHUNKREQ)pReqHdr);
1821 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1822 break;
1823
1824 case VMMR0_DO_GMM_SEED_CHUNK:
1825 if (pReqHdr)
1826 return VERR_INVALID_PARAMETER;
1827 rc = GMMR0SeedChunk(pGVM, pVM, idCpu, (RTR3PTR)u64Arg);
1828 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1829 break;
1830
1831 case VMMR0_DO_GMM_REGISTER_SHARED_MODULE:
1832 if (idCpu == NIL_VMCPUID)
1833 return VERR_INVALID_CPU_ID;
1834 if (u64Arg)
1835 return VERR_INVALID_PARAMETER;
1836 rc = GMMR0RegisterSharedModuleReq(pGVM, pVM, idCpu, (PGMMREGISTERSHAREDMODULEREQ)pReqHdr);
1837 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1838 break;
1839
1840 case VMMR0_DO_GMM_UNREGISTER_SHARED_MODULE:
1841 if (idCpu == NIL_VMCPUID)
1842 return VERR_INVALID_CPU_ID;
1843 if (u64Arg)
1844 return VERR_INVALID_PARAMETER;
1845 rc = GMMR0UnregisterSharedModuleReq(pGVM, pVM, idCpu, (PGMMUNREGISTERSHAREDMODULEREQ)pReqHdr);
1846 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1847 break;
1848
1849 case VMMR0_DO_GMM_RESET_SHARED_MODULES:
1850 if (idCpu == NIL_VMCPUID)
1851 return VERR_INVALID_CPU_ID;
1852 if ( u64Arg
1853 || pReqHdr)
1854 return VERR_INVALID_PARAMETER;
1855 rc = GMMR0ResetSharedModules(pGVM, pVM, idCpu);
1856 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1857 break;
1858
1859#ifdef VBOX_WITH_PAGE_SHARING
1860 case VMMR0_DO_GMM_CHECK_SHARED_MODULES:
1861 {
1862 if (idCpu == NIL_VMCPUID)
1863 return VERR_INVALID_CPU_ID;
1864 if ( u64Arg
1865 || pReqHdr)
1866 return VERR_INVALID_PARAMETER;
1867 rc = GMMR0CheckSharedModules(pGVM, pVM, idCpu);
1868 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1869 break;
1870 }
1871#endif
1872
1873#if defined(VBOX_STRICT) && HC_ARCH_BITS == 64
1874 case VMMR0_DO_GMM_FIND_DUPLICATE_PAGE:
1875 if (u64Arg)
1876 return VERR_INVALID_PARAMETER;
1877 rc = GMMR0FindDuplicatePageReq(pGVM, pVM, (PGMMFINDDUPLICATEPAGEREQ)pReqHdr);
1878 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1879 break;
1880#endif
1881
1882 case VMMR0_DO_GMM_QUERY_STATISTICS:
1883 if (u64Arg)
1884 return VERR_INVALID_PARAMETER;
1885 rc = GMMR0QueryStatisticsReq(pGVM, pVM, (PGMMQUERYSTATISTICSSREQ)pReqHdr);
1886 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1887 break;
1888
1889 case VMMR0_DO_GMM_RESET_STATISTICS:
1890 if (u64Arg)
1891 return VERR_INVALID_PARAMETER;
1892 rc = GMMR0ResetStatisticsReq(pGVM, pVM, (PGMMRESETSTATISTICSSREQ)pReqHdr);
1893 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1894 break;
1895
1896 /*
1897 * A quick GCFGM mock-up.
1898 */
1899 /** @todo GCFGM with proper access control, ring-3 management interface and all that. */
1900 case VMMR0_DO_GCFGM_SET_VALUE:
1901 case VMMR0_DO_GCFGM_QUERY_VALUE:
1902 {
1903 if (pGVM || pVM || !pReqHdr || u64Arg || idCpu != NIL_VMCPUID)
1904 return VERR_INVALID_PARAMETER;
1905 PGCFGMVALUEREQ pReq = (PGCFGMVALUEREQ)pReqHdr;
1906 if (pReq->Hdr.cbReq != sizeof(*pReq))
1907 return VERR_INVALID_PARAMETER;
1908 if (enmOperation == VMMR0_DO_GCFGM_SET_VALUE)
1909 {
1910 rc = GVMMR0SetConfig(pReq->pSession, &pReq->szName[0], pReq->u64Value);
1911 //if (rc == VERR_CFGM_VALUE_NOT_FOUND)
1912 // rc = GMMR0SetConfig(pReq->pSession, &pReq->szName[0], pReq->u64Value);
1913 }
1914 else
1915 {
1916 rc = GVMMR0QueryConfig(pReq->pSession, &pReq->szName[0], &pReq->u64Value);
1917 //if (rc == VERR_CFGM_VALUE_NOT_FOUND)
1918 // rc = GMMR0QueryConfig(pReq->pSession, &pReq->szName[0], &pReq->u64Value);
1919 }
1920 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1921 break;
1922 }
1923
1924 /*
1925 * PDM Wrappers.
1926 */
1927 case VMMR0_DO_PDM_DRIVER_CALL_REQ_HANDLER:
1928 {
1929 if (!pReqHdr || u64Arg || idCpu != NIL_VMCPUID)
1930 return VERR_INVALID_PARAMETER;
1931 rc = PDMR0DriverCallReqHandler(pGVM, pVM, (PPDMDRIVERCALLREQHANDLERREQ)pReqHdr);
1932 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1933 break;
1934 }
1935
1936 case VMMR0_DO_PDM_DEVICE_CALL_REQ_HANDLER:
1937 {
1938 if (!pReqHdr || u64Arg || idCpu != NIL_VMCPUID)
1939 return VERR_INVALID_PARAMETER;
1940 rc = PDMR0DeviceCallReqHandler(pGVM, pVM, (PPDMDEVICECALLREQHANDLERREQ)pReqHdr);
1941 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1942 break;
1943 }
1944
1945 /*
1946 * Requests to the internal networking service.
1947 */
1948 case VMMR0_DO_INTNET_OPEN:
1949 {
1950 PINTNETOPENREQ pReq = (PINTNETOPENREQ)pReqHdr;
1951 if (u64Arg || !pReq || !vmmR0IsValidSession(pVM, pReq->pSession, pSession) || idCpu != NIL_VMCPUID)
1952 return VERR_INVALID_PARAMETER;
1953 rc = IntNetR0OpenReq(pSession, pReq);
1954 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1955 break;
1956 }
1957
1958 case VMMR0_DO_INTNET_IF_CLOSE:
1959 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFCLOSEREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1960 return VERR_INVALID_PARAMETER;
1961 rc = IntNetR0IfCloseReq(pSession, (PINTNETIFCLOSEREQ)pReqHdr);
1962 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1963 break;
1964
1965
1966 case VMMR0_DO_INTNET_IF_GET_BUFFER_PTRS:
1967 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFGETBUFFERPTRSREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1968 return VERR_INVALID_PARAMETER;
1969 rc = IntNetR0IfGetBufferPtrsReq(pSession, (PINTNETIFGETBUFFERPTRSREQ)pReqHdr);
1970 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1971 break;
1972
1973 case VMMR0_DO_INTNET_IF_SET_PROMISCUOUS_MODE:
1974 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFSETPROMISCUOUSMODEREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1975 return VERR_INVALID_PARAMETER;
1976 rc = IntNetR0IfSetPromiscuousModeReq(pSession, (PINTNETIFSETPROMISCUOUSMODEREQ)pReqHdr);
1977 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1978 break;
1979
1980 case VMMR0_DO_INTNET_IF_SET_MAC_ADDRESS:
1981 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFSETMACADDRESSREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1982 return VERR_INVALID_PARAMETER;
1983 rc = IntNetR0IfSetMacAddressReq(pSession, (PINTNETIFSETMACADDRESSREQ)pReqHdr);
1984 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1985 break;
1986
1987 case VMMR0_DO_INTNET_IF_SET_ACTIVE:
1988 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFSETACTIVEREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1989 return VERR_INVALID_PARAMETER;
1990 rc = IntNetR0IfSetActiveReq(pSession, (PINTNETIFSETACTIVEREQ)pReqHdr);
1991 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1992 break;
1993
1994 case VMMR0_DO_INTNET_IF_SEND:
1995 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFSENDREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
1996 return VERR_INVALID_PARAMETER;
1997 rc = IntNetR0IfSendReq(pSession, (PINTNETIFSENDREQ)pReqHdr);
1998 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
1999 break;
2000
2001 case VMMR0_DO_INTNET_IF_WAIT:
2002 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFWAITREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
2003 return VERR_INVALID_PARAMETER;
2004 rc = IntNetR0IfWaitReq(pSession, (PINTNETIFWAITREQ)pReqHdr);
2005 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2006 break;
2007
2008 case VMMR0_DO_INTNET_IF_ABORT_WAIT:
2009 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PINTNETIFWAITREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
2010 return VERR_INVALID_PARAMETER;
2011 rc = IntNetR0IfAbortWaitReq(pSession, (PINTNETIFABORTWAITREQ)pReqHdr);
2012 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2013 break;
2014
2015#ifdef VBOX_WITH_PCI_PASSTHROUGH
2016 /*
2017 * Requests to host PCI driver service.
2018 */
2019 case VMMR0_DO_PCIRAW_REQ:
2020 if (u64Arg || !pReqHdr || !vmmR0IsValidSession(pVM, ((PPCIRAWSENDREQ)pReqHdr)->pSession, pSession) || idCpu != NIL_VMCPUID)
2021 return VERR_INVALID_PARAMETER;
2022 rc = PciRawR0ProcessReq(pGVM, pVM, pSession, (PPCIRAWSENDREQ)pReqHdr);
2023 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2024 break;
2025#endif
2026
2027 /*
2028 * NEM requests.
2029 */
2030#ifdef VBOX_WITH_NEM_R0
2031# if defined(RT_ARCH_AMD64) && defined(RT_OS_WINDOWS)
2032 case VMMR0_DO_NEM_INIT_VM:
2033 if (u64Arg || pReqHdr || idCpu != 0)
2034 return VERR_INVALID_PARAMETER;
2035 rc = NEMR0InitVM(pGVM, pVM);
2036 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2037 break;
2038
2039 case VMMR0_DO_NEM_INIT_VM_PART_2:
2040 if (u64Arg || pReqHdr || idCpu != 0)
2041 return VERR_INVALID_PARAMETER;
2042 rc = NEMR0InitVMPart2(pGVM, pVM);
2043 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2044 break;
2045
2046 case VMMR0_DO_NEM_MAP_PAGES:
2047 if (u64Arg || pReqHdr || idCpu == NIL_VMCPUID)
2048 return VERR_INVALID_PARAMETER;
2049 rc = NEMR0MapPages(pGVM, pVM, idCpu);
2050 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2051 break;
2052
2053 case VMMR0_DO_NEM_UNMAP_PAGES:
2054 if (u64Arg || pReqHdr || idCpu == NIL_VMCPUID)
2055 return VERR_INVALID_PARAMETER;
2056 rc = NEMR0UnmapPages(pGVM, pVM, idCpu);
2057 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2058 break;
2059
2060 case VMMR0_DO_NEM_EXPORT_STATE:
2061 if (u64Arg || pReqHdr || idCpu == NIL_VMCPUID)
2062 return VERR_INVALID_PARAMETER;
2063 rc = NEMR0ExportState(pGVM, pVM, idCpu);
2064 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2065 break;
2066
2067 case VMMR0_DO_NEM_IMPORT_STATE:
2068 if (pReqHdr || idCpu == NIL_VMCPUID)
2069 return VERR_INVALID_PARAMETER;
2070 rc = NEMR0ImportState(pGVM, pVM, idCpu, u64Arg);
2071 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2072 break;
2073
2074 case VMMR0_DO_NEM_QUERY_CPU_TICK:
2075 if (u64Arg || pReqHdr || idCpu == NIL_VMCPUID)
2076 return VERR_INVALID_PARAMETER;
2077 rc = NEMR0QueryCpuTick(pGVM, pVM, idCpu);
2078 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2079 break;
2080
2081 case VMMR0_DO_NEM_RESUME_CPU_TICK_ON_ALL:
2082 if (pReqHdr || idCpu == NIL_VMCPUID)
2083 return VERR_INVALID_PARAMETER;
2084 rc = NEMR0ResumeCpuTickOnAll(pGVM, pVM, idCpu, u64Arg);
2085 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2086 break;
2087
2088 case VMMR0_DO_NEM_UPDATE_STATISTICS:
2089 if (u64Arg || pReqHdr)
2090 return VERR_INVALID_PARAMETER;
2091 rc = NEMR0UpdateStatistics(pGVM, pVM, idCpu);
2092 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2093 break;
2094
2095# if 1 && defined(DEBUG_bird)
2096 case VMMR0_DO_NEM_EXPERIMENT:
2097 if (pReqHdr)
2098 return VERR_INVALID_PARAMETER;
2099 rc = NEMR0DoExperiment(pGVM, pVM, idCpu, u64Arg);
2100 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2101 break;
2102# endif
2103# endif
2104#endif
2105
2106 /*
2107 * For profiling.
2108 */
2109 case VMMR0_DO_NOP:
2110 case VMMR0_DO_SLOW_NOP:
2111 return VINF_SUCCESS;
2112
2113 /*
2114 * For testing Ring-0 APIs invoked in this environment.
2115 */
2116 case VMMR0_DO_TESTS:
2117 /** @todo make new test */
2118 return VINF_SUCCESS;
2119
2120
2121#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS)
2122 case VMMR0_DO_TEST_SWITCHER3264:
2123 if (idCpu == NIL_VMCPUID)
2124 return VERR_INVALID_CPU_ID;
2125 rc = HMR0TestSwitcher3264(pVM);
2126 VMM_CHECK_SMAP_CHECK2(pVM, RT_NOTHING);
2127 break;
2128#endif
2129 default:
2130 /*
2131 * We're returning VERR_NOT_SUPPORT here so we've got something else
2132 * than -1 which the interrupt gate glue code might return.
2133 */
2134 Log(("operation %#x is not supported\n", enmOperation));
2135 return VERR_NOT_SUPPORTED;
2136 }
2137 return rc;
2138}
2139
2140
2141/**
2142 * Argument for vmmR0EntryExWrapper containing the arguments for VMMR0EntryEx.
2143 */
2144typedef struct VMMR0ENTRYEXARGS
2145{
2146 PGVM pGVM;
2147 PVM pVM;
2148 VMCPUID idCpu;
2149 VMMR0OPERATION enmOperation;
2150 PSUPVMMR0REQHDR pReq;
2151 uint64_t u64Arg;
2152 PSUPDRVSESSION pSession;
2153} VMMR0ENTRYEXARGS;
2154/** Pointer to a vmmR0EntryExWrapper argument package. */
2155typedef VMMR0ENTRYEXARGS *PVMMR0ENTRYEXARGS;
2156
2157/**
2158 * This is just a longjmp wrapper function for VMMR0EntryEx calls.
2159 *
2160 * @returns VBox status code.
2161 * @param pvArgs The argument package
2162 */
2163static DECLCALLBACK(int) vmmR0EntryExWrapper(void *pvArgs)
2164{
2165 return vmmR0EntryExWorker(((PVMMR0ENTRYEXARGS)pvArgs)->pGVM,
2166 ((PVMMR0ENTRYEXARGS)pvArgs)->pVM,
2167 ((PVMMR0ENTRYEXARGS)pvArgs)->idCpu,
2168 ((PVMMR0ENTRYEXARGS)pvArgs)->enmOperation,
2169 ((PVMMR0ENTRYEXARGS)pvArgs)->pReq,
2170 ((PVMMR0ENTRYEXARGS)pvArgs)->u64Arg,
2171 ((PVMMR0ENTRYEXARGS)pvArgs)->pSession);
2172}
2173
2174
2175/**
2176 * The Ring 0 entry point, called by the support library (SUP).
2177 *
2178 * @returns VBox status code.
2179 * @param pGVM The global (ring-0) VM structure.
2180 * @param pVM The cross context VM structure.
2181 * @param idCpu Virtual CPU ID argument. Must be NIL_VMCPUID if pVM
2182 * is NIL_RTR0PTR, and may be NIL_VMCPUID if it isn't
2183 * @param enmOperation Which operation to execute.
2184 * @param pReq Pointer to the SUPVMMR0REQHDR packet. Optional.
2185 * @param u64Arg Some simple constant argument.
2186 * @param pSession The session of the caller.
2187 * @remarks Assume called with interrupts _enabled_.
2188 */
2189VMMR0DECL(int) VMMR0EntryEx(PGVM pGVM, PVM pVM, VMCPUID idCpu, VMMR0OPERATION enmOperation,
2190 PSUPVMMR0REQHDR pReq, uint64_t u64Arg, PSUPDRVSESSION pSession)
2191{
2192 /*
2193 * Requests that should only happen on the EMT thread will be
2194 * wrapped in a setjmp so we can assert without causing trouble.
2195 */
2196 if ( pVM != NULL
2197 && pGVM != NULL
2198 && idCpu < pGVM->cCpus
2199 && pVM->pVMR0 != NULL)
2200 {
2201 switch (enmOperation)
2202 {
2203 /* These might/will be called before VMMR3Init. */
2204 case VMMR0_DO_GMM_INITIAL_RESERVATION:
2205 case VMMR0_DO_GMM_UPDATE_RESERVATION:
2206 case VMMR0_DO_GMM_ALLOCATE_PAGES:
2207 case VMMR0_DO_GMM_FREE_PAGES:
2208 case VMMR0_DO_GMM_BALLOONED_PAGES:
2209 /* On the mac we might not have a valid jmp buf, so check these as well. */
2210 case VMMR0_DO_VMMR0_INIT:
2211 case VMMR0_DO_VMMR0_TERM:
2212 {
2213 PGVMCPU pGVCpu = &pGVM->aCpus[idCpu];
2214 PVMCPU pVCpu = &pVM->aCpus[idCpu];
2215 RTNATIVETHREAD hNativeThread = RTThreadNativeSelf();
2216 if (RT_LIKELY( pGVCpu->hEMT == hNativeThread
2217 && pVCpu->hNativeThreadR0 == hNativeThread))
2218 {
2219 if (!pVCpu->vmm.s.CallRing3JmpBufR0.pvSavedStack)
2220 break;
2221
2222 /** @todo validate this EMT claim... GVM knows. */
2223 VMMR0ENTRYEXARGS Args;
2224 Args.pGVM = pGVM;
2225 Args.pVM = pVM;
2226 Args.idCpu = idCpu;
2227 Args.enmOperation = enmOperation;
2228 Args.pReq = pReq;
2229 Args.u64Arg = u64Arg;
2230 Args.pSession = pSession;
2231 return vmmR0CallRing3SetJmpEx(&pVCpu->vmm.s.CallRing3JmpBufR0, vmmR0EntryExWrapper, &Args);
2232 }
2233 return VERR_VM_THREAD_NOT_EMT;
2234 }
2235
2236 default:
2237 break;
2238 }
2239 }
2240 return vmmR0EntryExWorker(pGVM, pVM, idCpu, enmOperation, pReq, u64Arg, pSession);
2241}
2242
2243
2244/**
2245 * Checks whether we've armed the ring-0 long jump machinery.
2246 *
2247 * @returns @c true / @c false
2248 * @param pVCpu The cross context virtual CPU structure.
2249 * @thread EMT
2250 * @sa VMMIsLongJumpArmed
2251 */
2252VMMR0_INT_DECL(bool) VMMR0IsLongJumpArmed(PVMCPU pVCpu)
2253{
2254#ifdef RT_ARCH_X86
2255 return pVCpu->vmm.s.CallRing3JmpBufR0.eip
2256 && !pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call;
2257#else
2258 return pVCpu->vmm.s.CallRing3JmpBufR0.rip
2259 && !pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call;
2260#endif
2261}
2262
2263
2264/**
2265 * Checks whether we've done a ring-3 long jump.
2266 *
2267 * @returns @c true / @c false
2268 * @param pVCpu The cross context virtual CPU structure.
2269 * @thread EMT
2270 */
2271VMMR0_INT_DECL(bool) VMMR0IsInRing3LongJump(PVMCPU pVCpu)
2272{
2273 return pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call;
2274}
2275
2276
2277/**
2278 * Internal R0 logger worker: Flush logger.
2279 *
2280 * @param pLogger The logger instance to flush.
2281 * @remark This function must be exported!
2282 */
2283VMMR0DECL(void) vmmR0LoggerFlush(PRTLOGGER pLogger)
2284{
2285#ifdef LOG_ENABLED
2286 /*
2287 * Convert the pLogger into a VM handle and 'call' back to Ring-3.
2288 * (This is a bit paranoid code.)
2289 */
2290 PVMMR0LOGGER pR0Logger = (PVMMR0LOGGER)((uintptr_t)pLogger - RT_UOFFSETOF(VMMR0LOGGER, Logger));
2291 if ( !VALID_PTR(pR0Logger)
2292 || !VALID_PTR(pR0Logger + 1)
2293 || pLogger->u32Magic != RTLOGGER_MAGIC)
2294 {
2295# ifdef DEBUG
2296 SUPR0Printf("vmmR0LoggerFlush: pLogger=%p!\n", pLogger);
2297# endif
2298 return;
2299 }
2300 if (pR0Logger->fFlushingDisabled)
2301 return; /* quietly */
2302
2303 PVM pVM = pR0Logger->pVM;
2304 if ( !VALID_PTR(pVM)
2305 || pVM->pVMR0 != pVM)
2306 {
2307# ifdef DEBUG
2308 SUPR0Printf("vmmR0LoggerFlush: pVM=%p! pVMR0=%p! pLogger=%p\n", pVM, pVM->pVMR0, pLogger);
2309# endif
2310 return;
2311 }
2312
2313 PVMCPU pVCpu = VMMGetCpu(pVM);
2314 if (pVCpu)
2315 {
2316 /*
2317 * Check that the jump buffer is armed.
2318 */
2319# ifdef RT_ARCH_X86
2320 if ( !pVCpu->vmm.s.CallRing3JmpBufR0.eip
2321 || pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call)
2322# else
2323 if ( !pVCpu->vmm.s.CallRing3JmpBufR0.rip
2324 || pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call)
2325# endif
2326 {
2327# ifdef DEBUG
2328 SUPR0Printf("vmmR0LoggerFlush: Jump buffer isn't armed!\n");
2329# endif
2330 return;
2331 }
2332 VMMRZCallRing3(pVM, pVCpu, VMMCALLRING3_VMM_LOGGER_FLUSH, 0);
2333 }
2334# ifdef DEBUG
2335 else
2336 SUPR0Printf("vmmR0LoggerFlush: invalid VCPU context!\n");
2337# endif
2338#else
2339 NOREF(pLogger);
2340#endif /* LOG_ENABLED */
2341}
2342
2343#ifdef LOG_ENABLED
2344
2345/**
2346 * Disables flushing of the ring-0 debug log.
2347 *
2348 * @param pVCpu The cross context virtual CPU structure.
2349 */
2350VMMR0_INT_DECL(void) VMMR0LogFlushDisable(PVMCPU pVCpu)
2351{
2352 if (pVCpu->vmm.s.pR0LoggerR0)
2353 pVCpu->vmm.s.pR0LoggerR0->fFlushingDisabled = true;
2354 if (pVCpu->vmm.s.pR0RelLoggerR0)
2355 pVCpu->vmm.s.pR0RelLoggerR0->fFlushingDisabled = true;
2356}
2357
2358
2359/**
2360 * Enables flushing of the ring-0 debug log.
2361 *
2362 * @param pVCpu The cross context virtual CPU structure.
2363 */
2364VMMR0_INT_DECL(void) VMMR0LogFlushEnable(PVMCPU pVCpu)
2365{
2366 if (pVCpu->vmm.s.pR0LoggerR0)
2367 pVCpu->vmm.s.pR0LoggerR0->fFlushingDisabled = false;
2368 if (pVCpu->vmm.s.pR0RelLoggerR0)
2369 pVCpu->vmm.s.pR0RelLoggerR0->fFlushingDisabled = false;
2370}
2371
2372
2373/**
2374 * Checks if log flushing is disabled or not.
2375 *
2376 * @param pVCpu The cross context virtual CPU structure.
2377 */
2378VMMR0_INT_DECL(bool) VMMR0IsLogFlushDisabled(PVMCPU pVCpu)
2379{
2380 if (pVCpu->vmm.s.pR0LoggerR0)
2381 return pVCpu->vmm.s.pR0LoggerR0->fFlushingDisabled;
2382 if (pVCpu->vmm.s.pR0RelLoggerR0)
2383 return pVCpu->vmm.s.pR0RelLoggerR0->fFlushingDisabled;
2384 return true;
2385}
2386
2387#endif /* LOG_ENABLED */
2388
2389/**
2390 * Override RTLogRelGetDefaultInstanceEx so we can do LogRel to VBox.log from EMTs in ring-0.
2391 */
2392DECLEXPORT(PRTLOGGER) RTLogRelGetDefaultInstanceEx(uint32_t fFlagsAndGroup)
2393{
2394 PGVMCPU pGVCpu = GVMMR0GetGVCpuByEMT(NIL_RTNATIVETHREAD);
2395 if (pGVCpu)
2396 {
2397 PVMCPU pVCpu = pGVCpu->pVCpu;
2398 if (RT_VALID_PTR(pVCpu))
2399 {
2400 PVMMR0LOGGER pVmmLogger = pVCpu->vmm.s.pR0RelLoggerR0;
2401 if (RT_VALID_PTR(pVmmLogger))
2402 {
2403 if ( pVmmLogger->fCreated
2404 && pVmmLogger->pVM == pGVCpu->pVM)
2405 {
2406 if (pVmmLogger->Logger.fFlags & RTLOGFLAGS_DISABLED)
2407 return NULL;
2408 uint16_t const fFlags = RT_LO_U16(fFlagsAndGroup);
2409 uint16_t const iGroup = RT_HI_U16(fFlagsAndGroup);
2410 if ( iGroup != UINT16_MAX
2411 && ( ( pVmmLogger->Logger.afGroups[iGroup < pVmmLogger->Logger.cGroups ? iGroup : 0]
2412 & (fFlags | (uint32_t)RTLOGGRPFLAGS_ENABLED))
2413 != (fFlags | (uint32_t)RTLOGGRPFLAGS_ENABLED)))
2414 return NULL;
2415 return &pVmmLogger->Logger;
2416 }
2417 }
2418 }
2419 }
2420 return SUPR0GetDefaultLogRelInstanceEx(fFlagsAndGroup);
2421}
2422
2423
2424/**
2425 * Jump back to ring-3 if we're the EMT and the longjmp is armed.
2426 *
2427 * @returns true if the breakpoint should be hit, false if it should be ignored.
2428 */
2429DECLEXPORT(bool) RTCALL RTAssertShouldPanic(void)
2430{
2431#if 0
2432 return true;
2433#else
2434 PVM pVM = GVMMR0GetVMByEMT(NIL_RTNATIVETHREAD);
2435 if (pVM)
2436 {
2437 PVMCPU pVCpu = VMMGetCpu(pVM);
2438
2439 if (pVCpu)
2440 {
2441#ifdef RT_ARCH_X86
2442 if ( pVCpu->vmm.s.CallRing3JmpBufR0.eip
2443 && !pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call)
2444#else
2445 if ( pVCpu->vmm.s.CallRing3JmpBufR0.rip
2446 && !pVCpu->vmm.s.CallRing3JmpBufR0.fInRing3Call)
2447#endif
2448 {
2449 int rc = VMMRZCallRing3(pVM, pVCpu, VMMCALLRING3_VM_R0_ASSERTION, 0);
2450 return RT_FAILURE_NP(rc);
2451 }
2452 }
2453 }
2454#ifdef RT_OS_LINUX
2455 return true;
2456#else
2457 return false;
2458#endif
2459#endif
2460}
2461
2462
2463/**
2464 * Override this so we can push it up to ring-3.
2465 *
2466 * @param pszExpr Expression. Can be NULL.
2467 * @param uLine Location line number.
2468 * @param pszFile Location file name.
2469 * @param pszFunction Location function name.
2470 */
2471DECLEXPORT(void) RTCALL RTAssertMsg1Weak(const char *pszExpr, unsigned uLine, const char *pszFile, const char *pszFunction)
2472{
2473 /*
2474 * To the log.
2475 */
2476 LogAlways(("\n!!R0-Assertion Failed!!\n"
2477 "Expression: %s\n"
2478 "Location : %s(%d) %s\n",
2479 pszExpr, pszFile, uLine, pszFunction));
2480
2481 /*
2482 * To the global VMM buffer.
2483 */
2484 PVM pVM = GVMMR0GetVMByEMT(NIL_RTNATIVETHREAD);
2485 if (pVM)
2486 RTStrPrintf(pVM->vmm.s.szRing0AssertMsg1, sizeof(pVM->vmm.s.szRing0AssertMsg1),
2487 "\n!!R0-Assertion Failed!!\n"
2488 "Expression: %.*s\n"
2489 "Location : %s(%d) %s\n",
2490 sizeof(pVM->vmm.s.szRing0AssertMsg1) / 4 * 3, pszExpr,
2491 pszFile, uLine, pszFunction);
2492
2493 /*
2494 * Continue the normal way.
2495 */
2496 RTAssertMsg1(pszExpr, uLine, pszFile, pszFunction);
2497}
2498
2499
2500/**
2501 * Callback for RTLogFormatV which writes to the ring-3 log port.
2502 * See PFNLOGOUTPUT() for details.
2503 */
2504static DECLCALLBACK(size_t) rtLogOutput(void *pv, const char *pachChars, size_t cbChars)
2505{
2506 for (size_t i = 0; i < cbChars; i++)
2507 {
2508 LogAlways(("%c", pachChars[i])); NOREF(pachChars);
2509 }
2510
2511 NOREF(pv);
2512 return cbChars;
2513}
2514
2515
2516/**
2517 * Override this so we can push it up to ring-3.
2518 *
2519 * @param pszFormat The format string.
2520 * @param va Arguments.
2521 */
2522DECLEXPORT(void) RTCALL RTAssertMsg2WeakV(const char *pszFormat, va_list va)
2523{
2524 va_list vaCopy;
2525
2526 /*
2527 * Push the message to the loggers.
2528 */
2529 PRTLOGGER pLog = RTLogGetDefaultInstance(); /* Don't initialize it here... */
2530 if (pLog)
2531 {
2532 va_copy(vaCopy, va);
2533 RTLogFormatV(rtLogOutput, pLog, pszFormat, vaCopy);
2534 va_end(vaCopy);
2535 }
2536 pLog = RTLogRelGetDefaultInstance();
2537 if (pLog)
2538 {
2539 va_copy(vaCopy, va);
2540 RTLogFormatV(rtLogOutput, pLog, pszFormat, vaCopy);
2541 va_end(vaCopy);
2542 }
2543
2544 /*
2545 * Push it to the global VMM buffer.
2546 */
2547 PVM pVM = GVMMR0GetVMByEMT(NIL_RTNATIVETHREAD);
2548 if (pVM)
2549 {
2550 va_copy(vaCopy, va);
2551 RTStrPrintfV(pVM->vmm.s.szRing0AssertMsg2, sizeof(pVM->vmm.s.szRing0AssertMsg2), pszFormat, vaCopy);
2552 va_end(vaCopy);
2553 }
2554
2555 /*
2556 * Continue the normal way.
2557 */
2558 RTAssertMsg2V(pszFormat, va);
2559}
2560
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette