VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMAll/HMAll.cpp@ 52343

Last change on this file since 52343 was 51981, checked in by vboxsync, 11 years ago

VMM/GIM, VMM/HM: Add support for Hyper-V hypervisor capabilities reporting through CPUID. Updated saved states as well, will break old states.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 14.8 KB
Line 
1/* $Id: HMAll.cpp 51981 2014-07-11 06:16:19Z vboxsync $ */
2/** @file
3 * HM - All contexts.
4 */
5
6/*
7 * Copyright (C) 2006-2014 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#define LOG_GROUP LOG_GROUP_HM
23#include <VBox/vmm/hm.h>
24#include <VBox/vmm/pgm.h>
25#include "HMInternal.h"
26#include <VBox/vmm/vm.h>
27#include <VBox/vmm/hm_vmx.h>
28#include <VBox/vmm/hm_svm.h>
29#include <VBox/err.h>
30#include <VBox/log.h>
31#include <iprt/param.h>
32#include <iprt/assert.h>
33#include <iprt/asm.h>
34#include <iprt/string.h>
35#include <iprt/thread.h>
36#include <iprt/x86.h>
37#include <iprt/asm-amd64-x86.h>
38
39
40/**
41 * Checks whether HM (VT-x/AMD-V) is being used by this VM.
42 *
43 * @retval @c true if used.
44 * @retval @c false if software virtualization (raw-mode) is used.
45 * @param pVM The cross context VM structure.
46 * @sa HMIsEnabled, HMR3IsEnabled
47 * @internal
48 */
49VMMDECL(bool) HMIsEnabledNotMacro(PVM pVM)
50{
51 Assert(pVM->fHMEnabledFixed);
52 return pVM->fHMEnabled;
53}
54
55
56/**
57 * Queues a page for invalidation
58 *
59 * @returns VBox status code.
60 * @param pVCpu Pointer to the VMCPU.
61 * @param GCVirt Page to invalidate
62 */
63static void hmQueueInvlPage(PVMCPU pVCpu, RTGCPTR GCVirt)
64{
65 /* Nothing to do if a TLB flush is already pending */
66 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
67 return;
68#if 1
69 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
70 NOREF(GCVirt);
71#else
72 /* Be very careful when activating this code! */
73 if (iPage == RT_ELEMENTS(pVCpu->hm.s.TlbShootdown.aPages))
74 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
75 else
76 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_SHOOTDOWN);
77#endif
78}
79
80
81/**
82 * Invalidates a guest page
83 *
84 * @returns VBox status code.
85 * @param pVCpu Pointer to the VMCPU.
86 * @param GCVirt Page to invalidate
87 */
88VMM_INT_DECL(int) HMInvalidatePage(PVMCPU pVCpu, RTGCPTR GCVirt)
89{
90 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
91#ifdef IN_RING0
92 PVM pVM = pVCpu->CTX_SUFF(pVM);
93 if (pVM->hm.s.vmx.fSupported)
94 return VMXR0InvalidatePage(pVM, pVCpu, GCVirt);
95
96 Assert(pVM->hm.s.svm.fSupported);
97 return SVMR0InvalidatePage(pVM, pVCpu, GCVirt);
98
99#else
100 hmQueueInvlPage(pVCpu, GCVirt);
101 return VINF_SUCCESS;
102#endif
103}
104
105
106/**
107 * Flushes the guest TLB.
108 *
109 * @returns VBox status code.
110 * @param pVCpu Pointer to the VMCPU.
111 */
112VMM_INT_DECL(int) HMFlushTLB(PVMCPU pVCpu)
113{
114 LogFlow(("HMFlushTLB\n"));
115
116 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
117 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbManual);
118 return VINF_SUCCESS;
119}
120
121
122#ifdef IN_RING0
123/**
124 * Dummy RTMpOnSpecific handler since RTMpPokeCpu couldn't be used.
125 *
126 */
127static DECLCALLBACK(void) hmFlushHandler(RTCPUID idCpu, void *pvUser1, void *pvUser2)
128{
129 NOREF(idCpu); NOREF(pvUser1); NOREF(pvUser2);
130 return;
131}
132
133/**
134 * Wrapper for RTMpPokeCpu to deal with VERR_NOT_SUPPORTED.
135 */
136static void hmR0PokeCpu(PVMCPU pVCpu, RTCPUID idHostCpu)
137{
138 uint32_t cWorldSwitchExits = ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits);
139
140 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatPoke, x);
141 int rc = RTMpPokeCpu(idHostCpu);
142 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatPoke, x);
143
144 /* Not implemented on some platforms (Darwin, Linux kernel < 2.6.19); fall
145 back to a less efficient implementation (broadcast). */
146 if (rc == VERR_NOT_SUPPORTED)
147 {
148 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
149 /* synchronous. */
150 RTMpOnSpecific(idHostCpu, hmFlushHandler, 0, 0);
151 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
152 }
153 else
154 {
155 if (rc == VINF_SUCCESS)
156 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
157 else
158 STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPokeFailed, z);
159
160/** @todo If more than one CPU is going to be poked, we could optimize this
161 * operation by poking them first and wait afterwards. Would require
162 * recording who to poke and their current cWorldSwitchExits values,
163 * that's something not suitable for stack... So, pVCpu->hm.s.something
164 * then. */
165 /* Spin until the VCPU has switched back (poking is async). */
166 while ( ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush)
167 && cWorldSwitchExits == ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits))
168 ASMNopPause();
169
170 if (rc == VINF_SUCCESS)
171 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
172 else
173 STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPokeFailed, z);
174 }
175}
176#endif /* IN_RING0 */
177
178
179#ifndef IN_RC
180/**
181 * Poke an EMT so it can perform the appropriate TLB shootdowns.
182 *
183 * @param pVCpu The handle of the virtual CPU to poke.
184 * @param fAccountFlushStat Whether to account the call to
185 * StatTlbShootdownFlush or StatTlbShootdown.
186 */
187static void hmPokeCpuForTlbFlush(PVMCPU pVCpu, bool fAccountFlushStat)
188{
189 if (ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush))
190 {
191 if (fAccountFlushStat)
192 STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdownFlush);
193 else
194 STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdown);
195#ifdef IN_RING0
196 RTCPUID idHostCpu = pVCpu->hm.s.idEnteredCpu;
197 if (idHostCpu != NIL_RTCPUID)
198 hmR0PokeCpu(pVCpu, idHostCpu);
199#else
200 VMR3NotifyCpuFFU(pVCpu->pUVCpu, VMNOTIFYFF_FLAGS_POKE);
201#endif
202 }
203 else
204 STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
205}
206
207
208/**
209 * Invalidates a guest page on all VCPUs.
210 *
211 * @returns VBox status code.
212 * @param pVM Pointer to the VM.
213 * @param GCVirt Page to invalidate
214 */
215VMM_INT_DECL(int) HMInvalidatePageOnAllVCpus(PVM pVM, RTGCPTR GCPtr)
216{
217 VMCPUID idCurCpu = VMMGetCpuId(pVM);
218 STAM_COUNTER_INC(&pVM->aCpus[idCurCpu].hm.s.StatFlushPage);
219
220 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
221 {
222 PVMCPU pVCpu = &pVM->aCpus[idCpu];
223
224 /* Nothing to do if a TLB flush is already pending; the VCPU should
225 have already been poked if it were active. */
226 if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
227 continue;
228
229 if (pVCpu->idCpu == idCurCpu)
230 HMInvalidatePage(pVCpu, GCPtr);
231 else
232 {
233 hmQueueInvlPage(pVCpu, GCPtr);
234 hmPokeCpuForTlbFlush(pVCpu, false /* fAccountFlushStat */);
235 }
236 }
237
238 return VINF_SUCCESS;
239}
240
241
242/**
243 * Flush the TLBs of all VCPUs.
244 *
245 * @returns VBox status code.
246 * @param pVM Pointer to the VM.
247 */
248VMM_INT_DECL(int) HMFlushTLBOnAllVCpus(PVM pVM)
249{
250 if (pVM->cCpus == 1)
251 return HMFlushTLB(&pVM->aCpus[0]);
252
253 VMCPUID idThisCpu = VMMGetCpuId(pVM);
254
255 STAM_COUNTER_INC(&pVM->aCpus[idThisCpu].hm.s.StatFlushTlb);
256
257 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
258 {
259 PVMCPU pVCpu = &pVM->aCpus[idCpu];
260
261 /* Nothing to do if a TLB flush is already pending; the VCPU should
262 have already been poked if it were active. */
263 if (!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
264 {
265 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
266 if (idThisCpu != idCpu)
267 hmPokeCpuForTlbFlush(pVCpu, true /* fAccountFlushStat */);
268 }
269 }
270
271 return VINF_SUCCESS;
272}
273#endif /* !IN_RC */
274
275/**
276 * Checks if nested paging is enabled.
277 *
278 * @returns true if nested paging is active, false otherwise.
279 * @param pVM Pointer to the VM.
280 */
281VMM_INT_DECL(bool) HMIsNestedPagingActive(PVM pVM)
282{
283 return HMIsEnabled(pVM) && pVM->hm.s.fNestedPaging;
284}
285
286
287/**
288 * Checks if MSR bitmaps are available. It is assumed that when it's available
289 * it will be used as well.
290 *
291 * @returns true if MSR bitmaps are available, false otherwise.
292 * @param pVM Pointer to the VM.
293 */
294VMM_INT_DECL(bool) HMAreMsrBitmapsAvailable(PVM pVM)
295{
296 if (HMIsEnabled(pVM))
297 {
298 if (pVM->hm.s.svm.fSupported)
299 return true;
300
301 if ( pVM->hm.s.vmx.fSupported
302 && (pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_MSR_BITMAPS))
303 {
304 return true;
305 }
306 }
307 return false;
308}
309
310
311/**
312 * Return the shadow paging mode for nested paging/ept
313 *
314 * @returns shadow paging mode
315 * @param pVM Pointer to the VM.
316 */
317VMM_INT_DECL(PGMMODE) HMGetShwPagingMode(PVM pVM)
318{
319 Assert(HMIsNestedPagingActive(pVM));
320 if (pVM->hm.s.svm.fSupported)
321 return PGMMODE_NESTED;
322
323 Assert(pVM->hm.s.vmx.fSupported);
324 return PGMMODE_EPT;
325}
326
327/**
328 * Invalidates a guest page by physical address
329 *
330 * NOTE: Assumes the current instruction references this physical page though a virtual address!!
331 *
332 * @returns VBox status code.
333 * @param pVM Pointer to the VM.
334 * @param GCPhys Page to invalidate
335 */
336VMM_INT_DECL(int) HMInvalidatePhysPage(PVM pVM, RTGCPHYS GCPhys)
337{
338 if (!HMIsNestedPagingActive(pVM))
339 return VINF_SUCCESS;
340
341#ifdef IN_RING0
342 if (pVM->hm.s.vmx.fSupported)
343 {
344 VMCPUID idThisCpu = VMMGetCpuId(pVM);
345
346 for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
347 {
348 PVMCPU pVCpu = &pVM->aCpus[idCpu];
349
350 if (idThisCpu == idCpu)
351 {
352 /** @todo r=ramshankar: Intel does not support flushing by guest physical
353 * address either. See comment in VMXR0InvalidatePhysPage(). Fix this. */
354 VMXR0InvalidatePhysPage(pVM, pVCpu, GCPhys);
355 }
356 else
357 {
358 VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
359 hmPokeCpuForTlbFlush(pVCpu, true /*fAccountFlushStat*/);
360 }
361 }
362 return VINF_SUCCESS;
363 }
364
365 /* AMD-V doesn't support invalidation with guest physical addresses; see
366 comment in SVMR0InvalidatePhysPage. */
367 Assert(pVM->hm.s.svm.fSupported);
368#else
369 NOREF(GCPhys);
370#endif
371
372 HMFlushTLBOnAllVCpus(pVM);
373 return VINF_SUCCESS;
374}
375
376/**
377 * Checks if an interrupt event is currently pending.
378 *
379 * @returns Interrupt event pending state.
380 * @param pVM Pointer to the VM.
381 */
382VMM_INT_DECL(bool) HMHasPendingIrq(PVM pVM)
383{
384 PVMCPU pVCpu = VMMGetCpu(pVM);
385 return !!pVCpu->hm.s.Event.fPending;
386}
387
388
389/**
390 * Return the PAE PDPE entries.
391 *
392 * @returns Pointer to the PAE PDPE array.
393 * @param pVCpu Pointer to the VMCPU.
394 */
395VMM_INT_DECL(PX86PDPE) HMGetPaePdpes(PVMCPU pVCpu)
396{
397 return &pVCpu->hm.s.aPdpes[0];
398}
399
400
401/**
402 * Checks if the current AMD CPU is subject to erratum 170 "In SVM mode,
403 * incorrect code bytes may be fetched after a world-switch".
404 *
405 * @param pu32Family Where to store the CPU family (can be NULL).
406 * @param pu32Model Where to store the CPU model (can be NULL).
407 * @param pu32Stepping Where to store the CPU stepping (can be NULL).
408 * @returns true if the erratum applies, false otherwise.
409 */
410VMM_INT_DECL(int) HMAmdIsSubjectToErratum170(uint32_t *pu32Family, uint32_t *pu32Model, uint32_t *pu32Stepping)
411{
412 /*
413 * Erratum 170 which requires a forced TLB flush for each world switch:
414 * See AMD spec. "Revision Guide for AMD NPT Family 0Fh Processors".
415 *
416 * All BH-G1/2 and DH-G1/2 models include a fix:
417 * Athlon X2: 0x6b 1/2
418 * 0x68 1/2
419 * Athlon 64: 0x7f 1
420 * 0x6f 2
421 * Sempron: 0x7f 1/2
422 * 0x6f 2
423 * 0x6c 2
424 * 0x7c 2
425 * Turion 64: 0x68 2
426 */
427 uint32_t u32Dummy;
428 uint32_t u32Version, u32Family, u32Model, u32Stepping, u32BaseFamily;
429 ASMCpuId(1, &u32Version, &u32Dummy, &u32Dummy, &u32Dummy);
430 u32BaseFamily = (u32Version >> 8) & 0xf;
431 u32Family = u32BaseFamily + (u32BaseFamily == 0xf ? ((u32Version >> 20) & 0x7f) : 0);
432 u32Model = ((u32Version >> 4) & 0xf);
433 u32Model = u32Model | ((u32BaseFamily == 0xf ? (u32Version >> 16) & 0x0f : 0) << 4);
434 u32Stepping = u32Version & 0xf;
435
436 bool fErratumApplies = false;
437 if ( u32Family == 0xf
438 && !((u32Model == 0x68 || u32Model == 0x6b || u32Model == 0x7f) && u32Stepping >= 1)
439 && !((u32Model == 0x6f || u32Model == 0x6c || u32Model == 0x7c) && u32Stepping >= 2))
440 {
441 fErratumApplies = true;
442 }
443
444 if (pu32Family)
445 *pu32Family = u32Family;
446 if (pu32Model)
447 *pu32Model = u32Model;
448 if (pu32Stepping)
449 *pu32Stepping = u32Stepping;
450
451 return fErratumApplies;
452}
453
454
455/**
456 * Sets or clears the single instruction flag.
457 *
458 * When set, HM will try its best to return to ring-3 after executing a single
459 * instruction. This can be used for debugging. See also
460 * EMR3HmSingleInstruction.
461 *
462 * @returns The old flag state.
463 * @param pVCpu Pointer to the cross context CPU structure of
464 * the calling EMT.
465 * @param fEnable The new flag state.
466 */
467VMM_INT_DECL(bool) HMSetSingleInstruction(PVMCPU pVCpu, bool fEnable)
468{
469 VMCPU_ASSERT_EMT(pVCpu);
470 bool fOld = pVCpu->hm.s.fSingleInstruction;
471 pVCpu->hm.s.fSingleInstruction = fEnable;
472 return fOld;
473}
474
475
476/**
477 * Patches the instructions necessary for making a hypercall to the hypervisor.
478 * Used by GIM.
479 *
480 * @returns VBox status code.
481 * @param pVM Pointer to the VM.
482 * @param pvBuf The buffer in the hypercall page(s) to be patched.
483 * @param cbBuf The size of the buffer.
484 * @param pcbWritten Where to store the number of bytes patched. This
485 * is reliably updated only when this function returns
486 * VINF_SUCCESS.
487 */
488VMM_INT_DECL(int) HMPatchHypercall(PVM pVM, void *pvBuf, size_t cbBuf, size_t *pcbWritten)
489{
490 AssertReturn(pvBuf, VERR_INVALID_POINTER);
491 AssertReturn(pcbWritten, VERR_INVALID_POINTER);
492 AssertReturn(HMIsEnabled(pVM), VERR_HM_IPE_5);
493
494 if (pVM->hm.s.vmx.fSupported)
495 {
496 uint8_t abHypercall[] = { 0x0F, 0x01, 0xC1 }; /* VMCALL */
497 if (RT_LIKELY(cbBuf >= sizeof(abHypercall)))
498 {
499 memcpy(pvBuf, abHypercall, sizeof(abHypercall));
500 *pcbWritten = sizeof(abHypercall);
501 return VINF_SUCCESS;
502 }
503 return VERR_BUFFER_OVERFLOW;
504 }
505 else
506 {
507 Assert(pVM->hm.s.svm.fSupported);
508 uint8_t abHypercall[] = { 0x0F, 0x01, 0xD9 }; /* VMMCALL */
509 if (RT_LIKELY(cbBuf >= sizeof(abHypercall)))
510 {
511 memcpy(pvBuf, abHypercall, sizeof(abHypercall));
512 *pcbWritten = sizeof(abHypercall);
513 return VINF_SUCCESS;
514 }
515 return VERR_BUFFER_OVERFLOW;
516 }
517}
518
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette