HMAll.cpp@ 52343

Last change on this file since 52343 was 51981, checked in by vboxsync, 11 years ago
VMM/GIM, VMM/HM: Add support for Hyper-V hypervisor capabilities reporting through CPUID. Updated saved states as well, will break old states.
Property svn:eol-style set to `native` Property svn:keywords set to `Author Date Id Revision`
File size: 14.8 KB

Line
1	/* $Id: HMAll.cpp 51981 2014-07-11 06:16:19Z vboxsync $ */
2	/** @file
3	* HM - All contexts.
4	*/
5
6	/*
7	* Copyright (C) 2006-2014 Oracle Corporation
8	*
9	* This file is part of VirtualBox Open Source Edition (OSE), as
10	* available from http://www.virtualbox.org. This file is free software;
11	* you can redistribute it and/or modify it under the terms of the GNU
12	* General Public License (GPL) as published by the Free Software
13	* Foundation, in version 2 as it comes in the "COPYING" file of the
14	* VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15	* hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16	*/
17
18
19	/*******************************************************************************
20	* Header Files *
21	*******************************************************************************/
22	#define LOG_GROUP LOG_GROUP_HM
23	#include <VBox/vmm/hm.h>
24	#include <VBox/vmm/pgm.h>
25	#include "HMInternal.h"
26	#include <VBox/vmm/vm.h>
27	#include <VBox/vmm/hm_vmx.h>
28	#include <VBox/vmm/hm_svm.h>
29	#include <VBox/err.h>
30	#include <VBox/log.h>
31	#include <iprt/param.h>
32	#include <iprt/assert.h>
33	#include <iprt/asm.h>
34	#include <iprt/string.h>
35	#include <iprt/thread.h>
36	#include <iprt/x86.h>
37	#include <iprt/asm-amd64-x86.h>
38
39
40	/**
41	* Checks whether HM (VT-x/AMD-V) is being used by this VM.
42	*
43	* @retval @c true if used.
44	* @retval @c false if software virtualization (raw-mode) is used.
45	* @param pVM The cross context VM structure.
46	* @sa HMIsEnabled, HMR3IsEnabled
47	* @internal
48	*/
49	VMMDECL(bool) HMIsEnabledNotMacro(PVM pVM)
50	{
51	Assert(pVM->fHMEnabledFixed);
52	return pVM->fHMEnabled;
53	}
54
55
56	/**
57	* Queues a page for invalidation
58	*
59	* @returns VBox status code.
60	* @param pVCpu Pointer to the VMCPU.
61	* @param GCVirt Page to invalidate
62	*/
63	static void hmQueueInvlPage(PVMCPU pVCpu, RTGCPTR GCVirt)
64	{
65	/* Nothing to do if a TLB flush is already pending */
66	if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
67	return;
68	#if 1
69	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
70	NOREF(GCVirt);
71	#else
72	/* Be very careful when activating this code! */
73	if (iPage == RT_ELEMENTS(pVCpu->hm.s.TlbShootdown.aPages))
74	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
75	else
76	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_SHOOTDOWN);
77	#endif
78	}
79
80
81	/**
82	* Invalidates a guest page
83	*
84	* @returns VBox status code.
85	* @param pVCpu Pointer to the VMCPU.
86	* @param GCVirt Page to invalidate
87	*/
88	VMM_INT_DECL(int) HMInvalidatePage(PVMCPU pVCpu, RTGCPTR GCVirt)
89	{
90	STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
91	#ifdef IN_RING0
92	PVM pVM = pVCpu->CTX_SUFF(pVM);
93	if (pVM->hm.s.vmx.fSupported)
94	return VMXR0InvalidatePage(pVM, pVCpu, GCVirt);
95
96	Assert(pVM->hm.s.svm.fSupported);
97	return SVMR0InvalidatePage(pVM, pVCpu, GCVirt);
98
99	#else
100	hmQueueInvlPage(pVCpu, GCVirt);
101	return VINF_SUCCESS;
102	#endif
103	}
104
105
106	/**
107	* Flushes the guest TLB.
108	*
109	* @returns VBox status code.
110	* @param pVCpu Pointer to the VMCPU.
111	*/
112	VMM_INT_DECL(int) HMFlushTLB(PVMCPU pVCpu)
113	{
114	LogFlow(("HMFlushTLB\n"));
115
116	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
117	STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushTlbManual);
118	return VINF_SUCCESS;
119	}
120
121
122	#ifdef IN_RING0
123	/**
124	* Dummy RTMpOnSpecific handler since RTMpPokeCpu couldn't be used.
125	*
126	*/
127	static DECLCALLBACK(void) hmFlushHandler(RTCPUID idCpu, void pvUser1, void pvUser2)
128	{
129	NOREF(idCpu); NOREF(pvUser1); NOREF(pvUser2);
130	return;
131	}
132
133	/**
134	* Wrapper for RTMpPokeCpu to deal with VERR_NOT_SUPPORTED.
135	*/
136	static void hmR0PokeCpu(PVMCPU pVCpu, RTCPUID idHostCpu)
137	{
138	uint32_t cWorldSwitchExits = ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits);
139
140	STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatPoke, x);
141	int rc = RTMpPokeCpu(idHostCpu);
142	STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatPoke, x);
143
144	/* Not implemented on some platforms (Darwin, Linux kernel < 2.6.19); fall
145	back to a less efficient implementation (broadcast). */
146	if (rc == VERR_NOT_SUPPORTED)
147	{
148	STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
149	/* synchronous. */
150	RTMpOnSpecific(idHostCpu, hmFlushHandler, 0, 0);
151	STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
152	}
153	else
154	{
155	if (rc == VINF_SUCCESS)
156	STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPoke, z);
157	else
158	STAM_PROFILE_ADV_START(&pVCpu->hm.s.StatSpinPokeFailed, z);
159
160	/** @todo If more than one CPU is going to be poked, we could optimize this
161	* operation by poking them first and wait afterwards. Would require
162	* recording who to poke and their current cWorldSwitchExits values,
163	* that's something not suitable for stack... So, pVCpu->hm.s.something
164	* then. */
165	/* Spin until the VCPU has switched back (poking is async). */
166	while ( ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush)
167	&& cWorldSwitchExits == ASMAtomicUoReadU32(&pVCpu->hm.s.cWorldSwitchExits))
168	ASMNopPause();
169
170	if (rc == VINF_SUCCESS)
171	STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPoke, z);
172	else
173	STAM_PROFILE_ADV_STOP(&pVCpu->hm.s.StatSpinPokeFailed, z);
174	}
175	}
176	#endif /* IN_RING0 */
177
178
179	#ifndef IN_RC
180	/**
181	* Poke an EMT so it can perform the appropriate TLB shootdowns.
182	*
183	* @param pVCpu The handle of the virtual CPU to poke.
184	* @param fAccountFlushStat Whether to account the call to
185	* StatTlbShootdownFlush or StatTlbShootdown.
186	*/
187	static void hmPokeCpuForTlbFlush(PVMCPU pVCpu, bool fAccountFlushStat)
188	{
189	if (ASMAtomicUoReadBool(&pVCpu->hm.s.fCheckedTLBFlush))
190	{
191	if (fAccountFlushStat)
192	STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdownFlush);
193	else
194	STAM_COUNTER_INC(&pVCpu->hm.s.StatTlbShootdown);
195	#ifdef IN_RING0
196	RTCPUID idHostCpu = pVCpu->hm.s.idEnteredCpu;
197	if (idHostCpu != NIL_RTCPUID)
198	hmR0PokeCpu(pVCpu, idHostCpu);
199	#else
200	VMR3NotifyCpuFFU(pVCpu->pUVCpu, VMNOTIFYFF_FLAGS_POKE);
201	#endif
202	}
203	else
204	STAM_COUNTER_INC(&pVCpu->hm.s.StatFlushPageManual);
205	}
206
207
208	/**
209	* Invalidates a guest page on all VCPUs.
210	*
211	* @returns VBox status code.
212	* @param pVM Pointer to the VM.
213	* @param GCVirt Page to invalidate
214	*/
215	VMM_INT_DECL(int) HMInvalidatePageOnAllVCpus(PVM pVM, RTGCPTR GCPtr)
216	{
217	VMCPUID idCurCpu = VMMGetCpuId(pVM);
218	STAM_COUNTER_INC(&pVM->aCpus[idCurCpu].hm.s.StatFlushPage);
219
220	for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
221	{
222	PVMCPU pVCpu = &pVM->aCpus[idCpu];
223
224	/* Nothing to do if a TLB flush is already pending; the VCPU should
225	have already been poked if it were active. */
226	if (VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
227	continue;
228
229	if (pVCpu->idCpu == idCurCpu)
230	HMInvalidatePage(pVCpu, GCPtr);
231	else
232	{
233	hmQueueInvlPage(pVCpu, GCPtr);
234	hmPokeCpuForTlbFlush(pVCpu, false /* fAccountFlushStat */);
235	}
236	}
237
238	return VINF_SUCCESS;
239	}
240
241
242	/**
243	* Flush the TLBs of all VCPUs.
244	*
245	* @returns VBox status code.
246	* @param pVM Pointer to the VM.
247	*/
248	VMM_INT_DECL(int) HMFlushTLBOnAllVCpus(PVM pVM)
249	{
250	if (pVM->cCpus == 1)
251	return HMFlushTLB(&pVM->aCpus[0]);
252
253	VMCPUID idThisCpu = VMMGetCpuId(pVM);
254
255	STAM_COUNTER_INC(&pVM->aCpus[idThisCpu].hm.s.StatFlushTlb);
256
257	for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
258	{
259	PVMCPU pVCpu = &pVM->aCpus[idCpu];
260
261	/* Nothing to do if a TLB flush is already pending; the VCPU should
262	have already been poked if it were active. */
263	if (!VMCPU_FF_IS_SET(pVCpu, VMCPU_FF_TLB_FLUSH))
264	{
265	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
266	if (idThisCpu != idCpu)
267	hmPokeCpuForTlbFlush(pVCpu, true /* fAccountFlushStat */);
268	}
269	}
270
271	return VINF_SUCCESS;
272	}
273	#endif /* !IN_RC */
274
275	/**
276	* Checks if nested paging is enabled.
277	*
278	* @returns true if nested paging is active, false otherwise.
279	* @param pVM Pointer to the VM.
280	*/
281	VMM_INT_DECL(bool) HMIsNestedPagingActive(PVM pVM)
282	{
283	return HMIsEnabled(pVM) && pVM->hm.s.fNestedPaging;
284	}
285
286
287	/**
288	* Checks if MSR bitmaps are available. It is assumed that when it's available
289	* it will be used as well.
290	*
291	* @returns true if MSR bitmaps are available, false otherwise.
292	* @param pVM Pointer to the VM.
293	*/
294	VMM_INT_DECL(bool) HMAreMsrBitmapsAvailable(PVM pVM)
295	{
296	if (HMIsEnabled(pVM))
297	{
298	if (pVM->hm.s.svm.fSupported)
299	return true;
300
301	if ( pVM->hm.s.vmx.fSupported
302	&& (pVM->hm.s.vmx.Msrs.VmxProcCtls.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_MSR_BITMAPS))
303	{
304	return true;
305	}
306	}
307	return false;
308	}
309
310
311	/**
312	* Return the shadow paging mode for nested paging/ept
313	*
314	* @returns shadow paging mode
315	* @param pVM Pointer to the VM.
316	*/
317	VMM_INT_DECL(PGMMODE) HMGetShwPagingMode(PVM pVM)
318	{
319	Assert(HMIsNestedPagingActive(pVM));
320	if (pVM->hm.s.svm.fSupported)
321	return PGMMODE_NESTED;
322
323	Assert(pVM->hm.s.vmx.fSupported);
324	return PGMMODE_EPT;
325	}
326
327	/**
328	* Invalidates a guest page by physical address
329	*
330	* NOTE: Assumes the current instruction references this physical page though a virtual address!!
331	*
332	* @returns VBox status code.
333	* @param pVM Pointer to the VM.
334	* @param GCPhys Page to invalidate
335	*/
336	VMM_INT_DECL(int) HMInvalidatePhysPage(PVM pVM, RTGCPHYS GCPhys)
337	{
338	if (!HMIsNestedPagingActive(pVM))
339	return VINF_SUCCESS;
340
341	#ifdef IN_RING0
342	if (pVM->hm.s.vmx.fSupported)
343	{
344	VMCPUID idThisCpu = VMMGetCpuId(pVM);
345
346	for (VMCPUID idCpu = 0; idCpu < pVM->cCpus; idCpu++)
347	{
348	PVMCPU pVCpu = &pVM->aCpus[idCpu];
349
350	if (idThisCpu == idCpu)
351	{
352	/** @todo r=ramshankar: Intel does not support flushing by guest physical
353	* address either. See comment in VMXR0InvalidatePhysPage(). Fix this. */
354	VMXR0InvalidatePhysPage(pVM, pVCpu, GCPhys);
355	}
356	else
357	{
358	VMCPU_FF_SET(pVCpu, VMCPU_FF_TLB_FLUSH);
359	hmPokeCpuForTlbFlush(pVCpu, true /fAccountFlushStat/);
360	}
361	}
362	return VINF_SUCCESS;
363	}
364
365	/* AMD-V doesn't support invalidation with guest physical addresses; see
366	comment in SVMR0InvalidatePhysPage. */
367	Assert(pVM->hm.s.svm.fSupported);
368	#else
369	NOREF(GCPhys);
370	#endif
371
372	HMFlushTLBOnAllVCpus(pVM);
373	return VINF_SUCCESS;
374	}
375
376	/**
377	* Checks if an interrupt event is currently pending.
378	*
379	* @returns Interrupt event pending state.
380	* @param pVM Pointer to the VM.
381	*/
382	VMM_INT_DECL(bool) HMHasPendingIrq(PVM pVM)
383	{
384	PVMCPU pVCpu = VMMGetCpu(pVM);
385	return !!pVCpu->hm.s.Event.fPending;
386	}
387
388
389	/**
390	* Return the PAE PDPE entries.
391	*
392	* @returns Pointer to the PAE PDPE array.
393	* @param pVCpu Pointer to the VMCPU.
394	*/
395	VMM_INT_DECL(PX86PDPE) HMGetPaePdpes(PVMCPU pVCpu)
396	{
397	return &pVCpu->hm.s.aPdpes[0];
398	}
399
400
401	/**
402	* Checks if the current AMD CPU is subject to erratum 170 "In SVM mode,
403	* incorrect code bytes may be fetched after a world-switch".
404	*
405	* @param pu32Family Where to store the CPU family (can be NULL).
406	* @param pu32Model Where to store the CPU model (can be NULL).
407	* @param pu32Stepping Where to store the CPU stepping (can be NULL).
408	* @returns true if the erratum applies, false otherwise.
409	*/
410	VMM_INT_DECL(int) HMAmdIsSubjectToErratum170(uint32_t pu32Family, uint32_t pu32Model, uint32_t *pu32Stepping)
411	{
412	/*
413	* Erratum 170 which requires a forced TLB flush for each world switch:
414	* See AMD spec. "Revision Guide for AMD NPT Family 0Fh Processors".
415	*
416	* All BH-G1/2 and DH-G1/2 models include a fix:
417	* Athlon X2: 0x6b 1/2
418	* 0x68 1/2
419	* Athlon 64: 0x7f 1
420	* 0x6f 2
421	* Sempron: 0x7f 1/2
422	* 0x6f 2
423	* 0x6c 2
424	* 0x7c 2
425	* Turion 64: 0x68 2
426	*/
427	uint32_t u32Dummy;
428	uint32_t u32Version, u32Family, u32Model, u32Stepping, u32BaseFamily;
429	ASMCpuId(1, &u32Version, &u32Dummy, &u32Dummy, &u32Dummy);
430	u32BaseFamily = (u32Version >> 8) & 0xf;
431	u32Family = u32BaseFamily + (u32BaseFamily == 0xf ? ((u32Version >> 20) & 0x7f) : 0);
432	u32Model = ((u32Version >> 4) & 0xf);
433	u32Model = u32Model \| ((u32BaseFamily == 0xf ? (u32Version >> 16) & 0x0f : 0) << 4);
434	u32Stepping = u32Version & 0xf;
435
436	bool fErratumApplies = false;
437	if ( u32Family == 0xf
438	&& !((u32Model == 0x68 \|\| u32Model == 0x6b \|\| u32Model == 0x7f) && u32Stepping >= 1)
439	&& !((u32Model == 0x6f \|\| u32Model == 0x6c \|\| u32Model == 0x7c) && u32Stepping >= 2))
440	{
441	fErratumApplies = true;
442	}
443
444	if (pu32Family)
445	*pu32Family = u32Family;
446	if (pu32Model)
447	*pu32Model = u32Model;
448	if (pu32Stepping)
449	*pu32Stepping = u32Stepping;
450
451	return fErratumApplies;
452	}
453
454
455	/**
456	* Sets or clears the single instruction flag.
457	*
458	* When set, HM will try its best to return to ring-3 after executing a single
459	* instruction. This can be used for debugging. See also
460	* EMR3HmSingleInstruction.
461	*
462	* @returns The old flag state.
463	* @param pVCpu Pointer to the cross context CPU structure of
464	* the calling EMT.
465	* @param fEnable The new flag state.
466	*/
467	VMM_INT_DECL(bool) HMSetSingleInstruction(PVMCPU pVCpu, bool fEnable)
468	{
469	VMCPU_ASSERT_EMT(pVCpu);
470	bool fOld = pVCpu->hm.s.fSingleInstruction;
471	pVCpu->hm.s.fSingleInstruction = fEnable;
472	return fOld;
473	}
474
475
476	/**
477	* Patches the instructions necessary for making a hypercall to the hypervisor.
478	* Used by GIM.
479	*
480	* @returns VBox status code.
481	* @param pVM Pointer to the VM.
482	* @param pvBuf The buffer in the hypercall page(s) to be patched.
483	* @param cbBuf The size of the buffer.
484	* @param pcbWritten Where to store the number of bytes patched. This
485	* is reliably updated only when this function returns
486	* VINF_SUCCESS.
487	*/
488	VMM_INT_DECL(int) HMPatchHypercall(PVM pVM, void pvBuf, size_t cbBuf, size_t pcbWritten)
489	{
490	AssertReturn(pvBuf, VERR_INVALID_POINTER);
491	AssertReturn(pcbWritten, VERR_INVALID_POINTER);
492	AssertReturn(HMIsEnabled(pVM), VERR_HM_IPE_5);
493
494	if (pVM->hm.s.vmx.fSupported)
495	{
496	uint8_t abHypercall[] = { 0x0F, 0x01, 0xC1 }; /* VMCALL */
497	if (RT_LIKELY(cbBuf >= sizeof(abHypercall)))
498	{
499	memcpy(pvBuf, abHypercall, sizeof(abHypercall));
500	*pcbWritten = sizeof(abHypercall);
501	return VINF_SUCCESS;
502	}
503	return VERR_BUFFER_OVERFLOW;
504	}
505	else
506	{
507	Assert(pVM->hm.s.svm.fSupported);
508	uint8_t abHypercall[] = { 0x0F, 0x01, 0xD9 }; /* VMMCALL */
509	if (RT_LIKELY(cbBuf >= sizeof(abHypercall)))
510	{
511	memcpy(pvBuf, abHypercall, sizeof(abHypercall));
512	*pcbWritten = sizeof(abHypercall);
513	return VINF_SUCCESS;
514	}
515	return VERR_BUFFER_OVERFLOW;
516	}
517	}
518

Note: See TracBrowser for help on using the repository browser.

source: vbox/trunk/src/VBox/VMM/VMMAll/HMAll.cpp@ 52343

Download in other formats: