VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMAll/HMAll.cpp@ 55302

Last change on this file since 55302 was 55129, checked in by vboxsync, 10 years ago

VMM/GIM: Allow dynamic enabling of #UD traps and per-VCPU hypercalls.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 15.2 KB
Line 
1/* $Id: HMAll.cpp 55129 2015-04-08 11:31:47Z vboxsync $ */
2/** @file
3 * HM - All contexts.
4 */
5
6/*
7 * Copyright (C) 2006-2014 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#define LOG_GROUP LOG_GROUP_HM
23#include <VBox/vmm/hm.h>
24#include <VBox/vmm/pgm.h>
25#include "HMInternal.h"
26#include <VBox/vmm/vm.h>
27#include <VBox/vmm/hm_vmx.h>
28#include <VBox/vmm/hm_svm.h>
29#include <VBox/err.h>
30#include <VBox/log.h>
31#include <iprt/param.h>
32#include <iprt/assert.h>
33#include <iprt/asm.h>
34#include <iprt/string.h>
35#include <iprt/thread.h>
36#include <iprt/x86.h>
37#include <iprt/asm-amd64-x86.h>
38
39
40/**
41 * Checks whether HM (VT-x/AMD-V) is being used by this VM.
42 *
43 * @retval @c true if used.
44 * @retval @c false if software virtualization (raw-mode) is used.
45 * @param pVM The cross context VM structure.
46 * @sa HMIsEnabled, HMR3IsEnabled
47 * @internal
48 */
49VMMDECL(bool) HMIsEnabledNotMacro(PVM pVM)
50{
51 Assert(pVM->fHMEnabledFixed);
52 return pVM->fHMEnabled;
53}
54
55
56/**
57 * Queues a page for invalidation
58 *
59 * @returns VBox status code.
60 * @param pVCpu Pointer to the VMCPU.
61 * @param GCVirt Page to invalidate
62 */
63static void hmQueueInvlPage(PVMCPU pVCpu, RTGCPTR GCVirt)
64{
65 /* Nothing to do if a TLB flush is already pending */
66 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
67 return;
68#if 1
69 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
70 NOREF(GCVirt);
71#else
72 /* Be very careful when activating this code! */
73 if (iPage == RT_ELEMENTS(pVCpu->hm.s.TlbShootdown.aPages))
74 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
75 else
76 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_SHOOTDOWN);
77#endif
78}
79
80
81/**
82 * Invalidates a guest page
83 *
84 * @returns VBox status code.
85 * @param pVCpu Pointer to the VMCPU.
86 * @param GCVirt Page to invalidate
87 */
88VMM_INT_DECL(int) HMInvalidatePage(PVMCPU pVCpu, RTGCPTR GCVirt)
89{
90 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
91#ifdef IN_RING0
92 PVM pVM = pVCpu->CTX_SUFF(pVM);
93 if (pVM->hm.s.vmx.fSupported)
94 return VMXR0InvalidatePage(pVM, pVCpu, GCVirt);
95
96 Assert(pVM->hm.s.svm.fSupported);
97 return SVMR0InvalidatePage(pVM, pVCpu, GCVirt);
98
99#else
100 hmQueueInvlPage(pVCpu, GCVirt);
101 return VINF_SUCCESS;
102#endif
103}
104
105
106/**
107 * Flushes the guest TLB.
108 *
109 * @returns VBox status code.
110 * @param pVCpu Pointer to the VMCPU.
111 */
112VMM_INT_DECL(int) HMFlushTLB(PVMCPU pVCpu)
113{
114 LogFlow(("HMFlushTLB\n"));
115
116 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
117 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbManual);
118 return VINF_SUCCESS;
119}
120
121
122#ifdef IN_RING0
123/**
124 * Dummy RTMpOnSpecific handler since RTMpPokeCpu couldn't be used.
125 *
126 */
127static DECLCALLBACK(void) hmFlushHandler(RTCPUID idCpu, void *pvUser1, void *pvUser2)
128{
129 NOREF(idCpu); NOREF(pvUser1); NOREF(pvUser2);
130 return;
131}
132
133/**
134 * Wrapper for RTMpPokeCpu to deal with VERR_NOT_SUPPORTED.
135 */
136static void hmR0PokeCpu(PVMCPU pVCpu, RTCPUID idHostCpu)
137{
138 uint32_t cWorldSwitchExits = ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits);
139
140 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatPoke, x);
141 int rc = RTMpPokeCpu(idHostCpu);
142 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatPoke, x);
143
144 /* Not implemented on some platforms (Darwin, Linux kernel < 2.6.19); fall
145 back to a less efficient implementation (broadcast). */
146 if (rc == VERR_NOT_SUPPORTED)
147 {
148 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
149 /* synchronous. */
150 RTMpOnSpecific(idHostCpu, hmFlushHandler, 0, 0);
151 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
152 }
153 else
154 {
155 if (rc == VINF_SUCCESS)
156 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
157 else
158 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPokeFailed, z);
159
160/** @todo If more than one CPU is going to be poked, we could optimize this
161 * operation by poking them first and wait afterwards. Would require
162 * recording who to poke and their current cWorldSwitchExits values,
163 * that's something not suitable for stack... So, pVCpu->hm.s.something
164 * then. */
165 /* Spin until the VCPU has switched back (poking is async). */
166 while ( ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush)
167 && cWorldSwitchExits == ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits))
168 ASMNopPause();
169
170 if (rc == VINF_SUCCESS)
171 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
172 else
173 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPokeFailed, z);
174 }
175}
176#endif /* IN_RING0 */
177
178
179#ifndef IN_RC
180/**
181 * Poke an EMT so it can perform the appropriate TLB shootdowns.
182 *
183 * @param pVCpu The handle of the virtual CPU to poke.
184 * @param fAccountFlushStat Whether to account the call to
185 * StatTlbShootdownFlush or StatTlbShootdown.
186 */
187static void hmPokeCpuForTlbFlush(PVMCPU pVCpu, bool fAccountFlushStat)
188{
189 if (ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush))
190 {
191 if (fAccountFlushStat)
192 STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdownFlush);
193 else
194 STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdown);
195#ifdef IN_RING0
196 RTCPUID idHostCpu = pVCpu->hm.s.idEnteredCpu;
197 if (idHostCpu != NIL_RTCPUID)
198 hmR0PokeCpu(pVCpu, idHostCpu);
199#else
200 VMR3NotifyCpuFFU(pVCpu->pUVCpu, VMNOTIFYFF_FLAGS_POKE);
201#endif
202 }
203 else
204 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
205}
206
207
208/**
209 * Invalidates a guest page on all VCPUs.
210 *
211 * @returns VBox status code.
212 * @param pVM Pointer to the VM.
213 * @param GCVirt Page to invalidate
214 */
215VMM_INT_DECL(int) HMInvalidatePageOnAllVCpus(PVM pVM, RTGCPTR GCPtr)
216{
217 VMCPUID idCurCpu = VMMGetCpuId(pVM);
218 STAM_COUNTER_INC(&pVM->aCpus[idCurCpu].hm.s.StatFlushPage);
219
220 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
221 {
222 PVMCPU pVCpu = &pVM->aCpus[idCpu];
223
224 /* Nothing to do if a TLB flush is already pending; the VCPU should
225 have already been poked if it were active. */
226 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
227 continue;
228
229 if (pVCpu->idCpu == idCurCpu)
230 HMInvalidatePage(pVCpu, GCPtr);
231 else
232 {
233 hmQueueInvlPage(pVCpu, GCPtr);
234 hmPokeCpuForTlbFlush(pVCpu, false /* fAccountFlushStat */);
235 }
236 }
237
238 return VINF_SUCCESS;
239}
240
241
242/**
243 * Flush the TLBs of all VCPUs.
244 *
245 * @returns VBox status code.
246 * @param pVM Pointer to the VM.
247 */
248VMM_INT_DECL(int) HMFlushTLBOnAllVCpus(PVM pVM)
249{
250 if (pVM->cCpus == 1)
251 return HMFlushTLB(&pVM->aCpus[0]);
252
253 VMCPUID idThisCpu = VMMGetCpuId(pVM);
254
255 STAM_COUNTER_INC(&pVM->aCpus[idThisCpu].hm.s.StatFlushTlb);
256
257 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
258 {
259 PVMCPU pVCpu = &pVM->aCpus[idCpu];
260
261 /* Nothing to do if a TLB flush is already pending; the VCPU should
262 have already been poked if it were active. */
263 if (!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
264 {
265 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
266 if (idThisCpu != idCpu)
267 hmPokeCpuForTlbFlush(pVCpu, true /* fAccountFlushStat */);
268 }
269 }
270
271 return VINF_SUCCESS;
272}
273#endif /* !IN_RC */
274
275/**
276 * Checks if nested paging is enabled.
277 *
278 * @returns true if nested paging is active, false otherwise.
279 * @param pVM Pointer to the VM.
280 *
281 * @remarks Works before hmR3InitFinalizeR0.
282 */
283VMM_INT_DECL(bool) HMIsNestedPagingActive(PVM pVM)
284{
285 return HMIsEnabled(pVM) && pVM->hm.s.fNestedPaging;
286}
287
288
289/**
290 * Checks if both nested paging and unhampered guest execution are enabled.
291 *
292 * The almost complete guest execution in harware is only applicable to VT-x.
293 *
294 * @returns true if we have both enabled, otherwise false.
295 * @param pVM Pointer to the VM.
296 *
297 * @remarks Works before hmR3InitFinalizeR0.
298 */
299VMM_INT_DECL(bool) HMAreNestedPagingAndFullGuestExecEnabled(PVM pVM)
300{
301 return HMIsEnabled(pVM)
302 && pVM->hm.s.fNestedPaging
303 && ( pVM->hm.s.vmx.fUnrestrictedGuest
304 || pVM->hm.s.svm.fSupported);
305}
306
307
308/**
309 * Checks if this VM is long-mode capable.
310 *
311 * @returns true if long mode is allowed, false otherwise.
312 * @param pUVM The user mode VM handle.
313 */
314VMM_INT_DECL(bool) HMIsLongModeAllowed(PVM pVM)
315{
316 return HMIsEnabled(pVM) && pVM->hm.s.fAllow64BitGuests;
317}
318
319
320/**
321 * Checks if MSR bitmaps are available. It is assumed that when it's available
322 * it will be used as well.
323 *
324 * @returns true if MSR bitmaps are available, false otherwise.
325 * @param pVM Pointer to the VM.
326 */
327VMM_INT_DECL(bool) HMAreMsrBitmapsAvailable(PVM pVM)
328{
329 if (HMIsEnabled(pVM))
330 {
331 if (pVM->hm.s.svm.fSupported)
332 return true;
333
334 if ( pVM->hm.s.vmx.fSupported
335 && (pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_MSR_BITMAPS))
336 {
337 return true;
338 }
339 }
340 return false;
341}
342
343
344/**
345 * Return the shadow paging mode for nested paging/ept
346 *
347 * @returns shadow paging mode
348 * @param pVM Pointer to the VM.
349 */
350VMM_INT_DECL(PGMMODE) HMGetShwPagingMode(PVM pVM)
351{
352 Assert(HMIsNestedPagingActive(pVM));
353 if (pVM->hm.s.svm.fSupported)
354 return PGMMODE_NESTED;
355
356 Assert(pVM->hm.s.vmx.fSupported);
357 return PGMMODE_EPT;
358}
359
360/**
361 * Invalidates a guest page by physical address
362 *
363 * NOTE: Assumes the current instruction references this physical page though a virtual address!!
364 *
365 * @returns VBox status code.
366 * @param pVM Pointer to the VM.
367 * @param GCPhys Page to invalidate
368 */
369VMM_INT_DECL(int) HMInvalidatePhysPage(PVM pVM, RTGCPHYS GCPhys)
370{
371 if (!HMIsNestedPagingActive(pVM))
372 return VINF_SUCCESS;
373
374#ifdef IN_RING0
375 if (pVM->hm.s.vmx.fSupported)
376 {
377 VMCPUID idThisCpu = VMMGetCpuId(pVM);
378
379 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
380 {
381 PVMCPU pVCpu = &pVM->aCpus[idCpu];
382
383 if (idThisCpu == idCpu)
384 {
385 /** @todo r=ramshankar: Intel does not support flushing by guest physical
386 * address either. See comment in VMXR0InvalidatePhysPage(). Fix this. */
387 VMXR0InvalidatePhysPage(pVM, pVCpu, GCPhys);
388 }
389 else
390 {
391 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
392 hmPokeCpuForTlbFlush(pVCpu, true /*fAccountFlushStat*/);
393 }
394 }
395 return VINF_SUCCESS;
396 }
397
398 /* AMD-V doesn't support invalidation with guest physical addresses; see
399 comment in SVMR0InvalidatePhysPage. */
400 Assert(pVM->hm.s.svm.fSupported);
401#else
402 NOREF(GCPhys);
403#endif
404
405 HMFlushTLBOnAllVCpus(pVM);
406 return VINF_SUCCESS;
407}
408
409/**
410 * Checks if an interrupt event is currently pending.
411 *
412 * @returns Interrupt event pending state.
413 * @param pVM Pointer to the VM.
414 */
415VMM_INT_DECL(bool) HMHasPendingIrq(PVM pVM)
416{
417 PVMCPU pVCpu = VMMGetCpu(pVM);
418 return !!pVCpu->hm.s.Event.fPending;
419}
420
421
422/**
423 * Return the PAE PDPE entries.
424 *
425 * @returns Pointer to the PAE PDPE array.
426 * @param pVCpu Pointer to the VMCPU.
427 */
428VMM_INT_DECL(PX86PDPE) HMGetPaePdpes(PVMCPU pVCpu)
429{
430 return &pVCpu->hm.s.aPdpes[0];
431}
432
433
434/**
435 * Checks if the current AMD CPU is subject to erratum 170 "In SVM mode,
436 * incorrect code bytes may be fetched after a world-switch".
437 *
438 * @param pu32Family Where to store the CPU family (can be NULL).
439 * @param pu32Model Where to store the CPU model (can be NULL).
440 * @param pu32Stepping Where to store the CPU stepping (can be NULL).
441 * @returns true if the erratum applies, false otherwise.
442 */
443VMM_INT_DECL(int) HMAmdIsSubjectToErratum170(uint32_t *pu32Family, uint32_t *pu32Model, uint32_t *pu32Stepping)
444{
445 /*
446 * Erratum 170 which requires a forced TLB flush for each world switch:
447 * See AMD spec. "Revision Guide for AMD NPT Family 0Fh Processors".
448 *
449 * All BH-G1/2 and DH-G1/2 models include a fix:
450 * Athlon X2: 0x6b 1/2
451 * 0x68 1/2
452 * Athlon 64: 0x7f 1
453 * 0x6f 2
454 * Sempron: 0x7f 1/2
455 * 0x6f 2
456 * 0x6c 2
457 * 0x7c 2
458 * Turion 64: 0x68 2
459 */
460 uint32_t u32Dummy;
461 uint32_t u32Version, u32Family, u32Model, u32Stepping, u32BaseFamily;
462 ASMCpuId(1, &u32Version, &u32Dummy, &u32Dummy, &u32Dummy);
463 u32BaseFamily = (u32Version >> 8) & 0xf;
464 u32Family = u32BaseFamily + (u32BaseFamily == 0xf ? ((u32Version >> 20) & 0x7f) : 0);
465 u32Model = ((u32Version >> 4) & 0xf);
466 u32Model = u32Model | ((u32BaseFamily == 0xf ? (u32Version >> 16) & 0x0f : 0) << 4);
467 u32Stepping = u32Version & 0xf;
468
469 bool fErratumApplies = false;
470 if ( u32Family == 0xf
471 && !((u32Model == 0x68 || u32Model == 0x6b || u32Model == 0x7f) && u32Stepping >= 1)
472 && !((u32Model == 0x6f || u32Model == 0x6c || u32Model == 0x7c) && u32Stepping >= 2))
473 {
474 fErratumApplies = true;
475 }
476
477 if (pu32Family)
478 *pu32Family = u32Family;
479 if (pu32Model)
480 *pu32Model = u32Model;
481 if (pu32Stepping)
482 *pu32Stepping = u32Stepping;
483
484 return fErratumApplies;
485}
486
487
488/**
489 * Sets or clears the single instruction flag.
490 *
491 * When set, HM will try its best to return to ring-3 after executing a single
492 * instruction. This can be used for debugging. See also
493 * EMR3HmSingleInstruction.
494 *
495 * @returns The old flag state.
496 * @param pVCpu Pointer to the cross context CPU structure of
497 * the calling EMT.
498 * @param fEnable The new flag state.
499 */
500VMM_INT_DECL(bool) HMSetSingleInstruction(PVMCPU pVCpu, bool fEnable)
501{
502 VMCPU_ASSERT_EMT(pVCpu);
503 bool fOld = pVCpu->hm.s.fSingleInstruction;
504 pVCpu->hm.s.fSingleInstruction = fEnable;
505 return fOld;
506}
507
508
509/**
510 * Notifies HM that paravirtualized hypercalls are now enabled.
511 *
512 * @param pVCpu Pointer to the VMCPU.
513 */
514VMM_INT_DECL(void) HMHypercallsEnable(PVMCPU pVCpu)
515{
516 pVCpu->hm.s.fHypercallsEnabled = true;
517}
518
519
520/**
521 * Notifies HM that paravirtualized hypercalls are now disabled.
522 *
523 * @param pVCpu Pointer to the VMCPU.
524 */
525VMM_INT_DECL(void) HMHypercallsDisable(PVMCPU pVCpu)
526{
527 pVCpu->hm.s.fHypercallsEnabled = false;
528}
529
530
531/**
532 * Notifies HM that GIM provider wants to trap #UD.
533 *
534 * @param pVCpu Pointer to the VMCPU.
535 */
536VMM_INT_DECL(void) HMTrapXcptUDForGIMEnable(PVMCPU pVCpu)
537{
538 pVCpu->hm.s.fGIMTrapXcptUD = true;
539 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_XCPT_INTERCEPTS);
540}
541
542
543/**
544 * Notifies HM that GIM provider no longer wants to trap #UD.
545 *
546 * @param pVCpu Pointer to the VMCPU.
547 */
548VMM_INT_DECL(void) HMTrapXcptUDForGIMDisable(PVMCPU pVCpu)
549{
550 pVCpu->hm.s.fGIMTrapXcptUD = false;
551 HMCPU_CF_SET(pVCpu, HM_CHANGED_GUEST_XCPT_INTERCEPTS);
552}
553
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette