VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR0/CPUMR0.cpp@ 21134

Last change on this file since 21134 was 20997, checked in by vboxsync, 16 years ago

HWACCM,CPUM: Fix for 64-bit Windows trashing guest XMM registers - VMX part.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id
File size: 16.7 KB
Line 
1/* $Id: CPUMR0.cpp 20997 2009-06-26 22:23:04Z vboxsync $ */
2/** @file
3 * CPUM - Host Context Ring 0.
4 */
5
6/*
7 * Copyright (C) 2006-2007 Sun Microsystems, Inc.
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa
18 * Clara, CA 95054 USA or visit http://www.sun.com if you need
19 * additional information or have any questions.
20 */
21
22
23/*******************************************************************************
24* Header Files *
25*******************************************************************************/
26#define LOG_GROUP LOG_GROUP_CPUM
27#include <VBox/cpum.h>
28#include "CPUMInternal.h"
29#include <VBox/vm.h>
30#include <VBox/x86.h>
31#include <VBox/err.h>
32#include <VBox/log.h>
33#include <VBox/hwaccm.h>
34#include <iprt/assert.h>
35#include <iprt/asm.h>
36
37
38
39/**
40 * Does Ring-0 CPUM initialization.
41 *
42 * This is mainly to check that the Host CPU mode is compatible
43 * with VBox.
44 *
45 * @returns VBox status code.
46 * @param pVM The VM to operate on.
47 */
48VMMR0DECL(int) CPUMR0Init(PVM pVM)
49{
50 LogFlow(("CPUMR0Init: %p\n", pVM));
51
52 /*
53 * Check CR0 & CR4 flags.
54 */
55 uint32_t u32CR0 = ASMGetCR0();
56 if ((u32CR0 & (X86_CR0_PE | X86_CR0_PG)) != (X86_CR0_PE | X86_CR0_PG)) /* a bit paranoid perhaps.. */
57 {
58 Log(("CPUMR0Init: PE or PG not set. cr0=%#x\n", u32CR0));
59 return VERR_UNSUPPORTED_CPU_MODE;
60 }
61
62 /*
63 * Check for sysenter if it's used.
64 */
65 if (ASMHasCpuId())
66 {
67 uint32_t u32CpuVersion;
68 uint32_t u32Dummy;
69 uint32_t u32Features;
70 ASMCpuId(1, &u32CpuVersion, &u32Dummy, &u32Dummy, &u32Features);
71 uint32_t u32Family = u32CpuVersion >> 8;
72 uint32_t u32Model = (u32CpuVersion >> 4) & 0xF;
73 uint32_t u32Stepping = u32CpuVersion & 0xF;
74
75 /*
76 * Intel docs claim you should test both the flag and family, model & stepping.
77 * Some Pentium Pro cpus have the SEP cpuid flag set, but don't support it.
78 */
79 if ( (u32Features & X86_CPUID_FEATURE_EDX_SEP)
80 && !(u32Family == 6 && u32Model < 3 && u32Stepping < 3))
81 {
82 /*
83 * Read the MSR and see if it's in use or not.
84 */
85 uint32_t u32 = ASMRdMsr_Low(MSR_IA32_SYSENTER_CS);
86 if (u32)
87 {
88 for (unsigned i=0;i<pVM->cCPUs;i++)
89 pVM->aCpus[i].cpum.s.fUseFlags |= CPUM_USE_SYSENTER;
90
91 Log(("CPUMR0Init: host uses sysenter cs=%08x%08x\n", ASMRdMsr_High(MSR_IA32_SYSENTER_CS), u32));
92 }
93 }
94
95 /** @todo check for AMD and syscall!!!!!! */
96 }
97
98
99 /*
100 * Check if debug registers are armed.
101 * This ASSUMES that DR7.GD is not set, or that it's handled transparently!
102 */
103 uint32_t u32DR7 = ASMGetDR7();
104 if (u32DR7 & X86_DR7_ENABLED_MASK)
105 {
106 for (unsigned i=0;i<pVM->cCPUs;i++)
107 pVM->aCpus[i].cpum.s.fUseFlags |= CPUM_USE_DEBUG_REGS_HOST;
108 Log(("CPUMR0Init: host uses debug registers (dr7=%x)\n", u32DR7));
109 }
110
111 return VINF_SUCCESS;
112}
113
114
115/**
116 * Lazily sync in the FPU/XMM state
117 *
118 * @returns VBox status code.
119 * @param pVM VM handle.
120 * @param pVCpu VMCPU handle.
121 * @param pCtx CPU context
122 */
123VMMR0DECL(int) CPUMR0LoadGuestFPU(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
124{
125 Assert(pVM->cpum.s.CPUFeatures.edx.u1FXSR);
126 Assert(ASMGetCR4() & X86_CR4_OSFSXR);
127
128 /* If the FPU state has already been loaded, then it's a guest trap. */
129 if (pVCpu->cpum.s.fUseFlags & CPUM_USED_FPU)
130 {
131 Assert( ((pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS)) == (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS))
132 || ((pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS)) == (X86_CR0_MP | X86_CR0_TS)));
133 return VINF_EM_RAW_GUEST_TRAP;
134 }
135
136 /*
137 * There are two basic actions:
138 * 1. Save host fpu and restore guest fpu.
139 * 2. Generate guest trap.
140 *
141 * When entering the hypervisor we'll always enable MP (for proper wait
142 * trapping) and TS (for intercepting all fpu/mmx/sse stuff). The EM flag
143 * is taken from the guest OS in order to get proper SSE handling.
144 *
145 *
146 * Actions taken depending on the guest CR0 flags:
147 *
148 * 3 2 1
149 * TS | EM | MP | FPUInstr | WAIT :: VMM Action
150 * ------------------------------------------------------------------------
151 * 0 | 0 | 0 | Exec | Exec :: Clear TS & MP, Save HC, Load GC.
152 * 0 | 0 | 1 | Exec | Exec :: Clear TS, Save HC, Load GC.
153 * 0 | 1 | 0 | #NM | Exec :: Clear TS & MP, Save HC, Load GC.
154 * 0 | 1 | 1 | #NM | Exec :: Clear TS, Save HC, Load GC.
155 * 1 | 0 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already cleared.)
156 * 1 | 0 | 1 | #NM | #NM :: Go to guest taking trap there.
157 * 1 | 1 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already set.)
158 * 1 | 1 | 1 | #NM | #NM :: Go to guest taking trap there.
159 */
160
161 switch (pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS))
162 {
163 case X86_CR0_MP | X86_CR0_TS:
164 case X86_CR0_MP | X86_CR0_EM | X86_CR0_TS:
165 return VINF_EM_RAW_GUEST_TRAP;
166 default:
167 break;
168 }
169
170#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
171 if (CPUMIsGuestInLongModeEx(pCtx))
172 {
173 Assert(!(pVCpu->cpum.s.fUseFlags & CPUM_SYNC_FPU_STATE));
174
175 /* Save the host state and record the fact (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM). */
176 cpumR0SaveHostFPUState(&pVCpu->cpum.s);
177
178 /* Restore the state on entry as we need to be in 64 bits mode to access the full state. */
179 pVCpu->cpum.s.fUseFlags |= CPUM_SYNC_FPU_STATE;
180 }
181 else
182#endif
183 {
184#ifndef CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE
185# if defined(VBOX_WITH_HYBRID_32BIT_KERNEL) || defined(VBOX_WITH_KERNEL_USING_XMM) /** @todo remove the #else here and move cpumHandleLazyFPUAsm back to VMMGC after branching out 3.0!!. */
186 /** @todo Move the FFXR handling down into
187 * cpumR0SaveHostRestoreguestFPUState to optimize the
188 * VBOX_WITH_KERNEL_USING_XMM handling. */
189 /* Clear MSR_K6_EFER_FFXSR or else we'll be unable to save/restore the XMM state with fxsave/fxrstor. */
190 uint64_t SavedEFER = 0;
191 if (pVM->cpum.s.CPUFeaturesExt.edx & X86_CPUID_AMD_FEATURE_EDX_FFXSR)
192 {
193 SavedEFER = ASMRdMsr(MSR_K6_EFER);
194 if (SavedEFER & MSR_K6_EFER_FFXSR)
195 {
196 ASMWrMsr(MSR_K6_EFER, SavedEFER & ~MSR_K6_EFER_FFXSR);
197 pVCpu->cpum.s.fUseFlags |= CPUM_MANUAL_XMM_RESTORE;
198 }
199 }
200
201 /* Do the job and record that we've switched FPU state. */
202 cpumR0SaveHostRestoreGuestFPUState(&pVCpu->cpum.s);
203
204 /* Restore EFER. */
205 if (pVCpu->cpum.s.fUseFlags & CPUM_MANUAL_XMM_RESTORE)
206 ASMWrMsr(MSR_K6_EFER, SavedEFER);
207
208# else
209 uint64_t oldMsrEFERHost = 0;
210 uint32_t oldCR0 = ASMGetCR0();
211
212 /* Clear MSR_K6_EFER_FFXSR or else we'll be unable to save/restore the XMM state with fxsave/fxrstor. */
213 if (pVM->cpum.s.CPUFeaturesExt.edx & X86_CPUID_AMD_FEATURE_EDX_FFXSR)
214 {
215 /** @todo Do we really need to read this every time?? The host could change this on the fly though.
216 * bird: what about starting by skipping the ASMWrMsr below if we didn't
217 * change anything? Ditto for the stuff in CPUMR0SaveGuestFPU. */
218 oldMsrEFERHost = ASMRdMsr(MSR_K6_EFER);
219 if (oldMsrEFERHost & MSR_K6_EFER_FFXSR)
220 {
221 ASMWrMsr(MSR_K6_EFER, oldMsrEFERHost & ~MSR_K6_EFER_FFXSR);
222 pVCpu->cpum.s.fUseFlags |= CPUM_MANUAL_XMM_RESTORE;
223 }
224 }
225
226 /* If we sync the FPU/XMM state on-demand, then we can continue execution as if nothing has happened. */
227 int rc = CPUMHandleLazyFPU(pVCpu);
228 AssertRC(rc);
229 Assert(CPUMIsGuestFPUStateActive(pVCpu));
230
231 /* Restore EFER MSR */
232 if (pVCpu->cpum.s.fUseFlags & CPUM_MANUAL_XMM_RESTORE)
233 ASMWrMsr(MSR_K6_EFER, oldMsrEFERHost);
234
235 /* CPUMHandleLazyFPU could have changed CR0; restore it. */
236 ASMSetCR0(oldCR0);
237# endif
238
239#else /* CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE */
240
241 /*
242 * Save the FPU control word and MXCSR, so we can restore the state properly afterwards.
243 * We don't want the guest to be able to trigger floating point/SSE exceptions on the host.
244 */
245 pVCpu->cpum.s.Host.fpu.FCW = CPUMGetFCW();
246 if (pVM->cpum.s.CPUFeatures.edx.u1SSE)
247 pVCpu->cpum.s.Host.fpu.MXCSR = CPUMGetMXCSR();
248
249 cpumR0LoadFPU(pCtx);
250
251 /*
252 * The MSR_K6_EFER_FFXSR feature is AMD only so far, but check the cpuid just in case Intel adds it in the future.
253 *
254 * MSR_K6_EFER_FFXSR changes the behaviour of fxsave and fxrstore: the XMM state isn't saved/restored
255 */
256 if (pVM->cpum.s.CPUFeaturesExt.edx & X86_CPUID_AMD_FEATURE_EDX_FFXSR)
257 {
258 /** @todo Do we really need to read this every time?? The host could change this on the fly though. */
259 uint64_t msrEFERHost = ASMRdMsr(MSR_K6_EFER);
260
261 if (msrEFERHost & MSR_K6_EFER_FFXSR)
262 {
263 /* fxrstor doesn't restore the XMM state! */
264 cpumR0LoadXMM(pCtx);
265 pVCpu->cpum.s.fUseFlags |= CPUM_MANUAL_XMM_RESTORE;
266 }
267 }
268
269#endif /* CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE */
270 }
271
272 Assert((pVCpu->cpum.s.fUseFlags & (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM)) == (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM));
273 return VINF_SUCCESS;
274}
275
276
277/**
278 * Save guest FPU/XMM state
279 *
280 * @returns VBox status code.
281 * @param pVM VM handle.
282 * @param pVCpu VMCPU handle.
283 * @param pCtx CPU context
284 */
285VMMR0DECL(int) CPUMR0SaveGuestFPU(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
286{
287 Assert(pVM->cpum.s.CPUFeatures.edx.u1FXSR);
288 Assert(ASMGetCR4() & X86_CR4_OSFSXR);
289 AssertReturn((pVCpu->cpum.s.fUseFlags & CPUM_USED_FPU), VINF_SUCCESS);
290
291#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
292 if (CPUMIsGuestInLongModeEx(pCtx))
293 {
294 if (!(pVCpu->cpum.s.fUseFlags & CPUM_SYNC_FPU_STATE))
295 {
296 HWACCMR0SaveFPUState(pVM, pVCpu, pCtx);
297 cpumR0RestoreHostFPUState(&pVCpu->cpum.s);
298 }
299 /* else nothing to do; we didn't perform a world switch */
300 }
301 else
302#endif
303 {
304#ifndef CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE
305# ifdef VBOX_WITH_KERNEL_USING_XMM
306 /*
307 * We've already saved the XMM registers in the assembly wrapper, so
308 * we have to save them before saving the entire FPU state and put them
309 * back afterwards.
310 */
311 /** @todo This could be skipped if MSR_K6_EFER_FFXSR is set, but
312 * I'm not able to test such an optimization tonight.
313 * We could just all this in assembly. */
314 uint128_t aGuestXmmRegs[16];
315 memcpy(&aGuestXmmRegs[0], &pVCpu->cpum.s.Guest.fpu.aXMM[0], sizeof(aGuestXmmRegs));
316# endif
317
318 /* Clear MSR_K6_EFER_FFXSR or else we'll be unable to save/restore the XMM state with fxsave/fxrstor. */
319 uint64_t oldMsrEFERHost = 0;
320 if (pVCpu->cpum.s.fUseFlags & CPUM_MANUAL_XMM_RESTORE)
321 {
322 oldMsrEFERHost = ASMRdMsr(MSR_K6_EFER);
323 ASMWrMsr(MSR_K6_EFER, oldMsrEFERHost & ~MSR_K6_EFER_FFXSR);
324 }
325 cpumR0SaveGuestRestoreHostFPUState(&pVCpu->cpum.s);
326
327 /* Restore EFER MSR */
328 if (pVCpu->cpum.s.fUseFlags & CPUM_MANUAL_XMM_RESTORE)
329 ASMWrMsr(MSR_K6_EFER, oldMsrEFERHost | MSR_K6_EFER_FFXSR);
330
331# ifdef VBOX_WITH_KERNEL_USING_XMM
332 memcpy(&pVCpu->cpum.s.Guest.fpu.aXMM[0], &aGuestXmmRegs[0], sizeof(aGuestXmmRegs));
333# endif
334
335#else /* CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE */
336# ifdef VBOX_WITH_KERNEL_USING_XMM
337# error "Fix all the NM_TRAPS_IN_KERNEL_MODE code path. I'm not going to fix unused code now."
338# endif
339 cpumR0SaveFPU(pCtx);
340 if (pVCpu->cpum.s.fUseFlags & CPUM_MANUAL_XMM_RESTORE)
341 {
342 /* fxsave doesn't save the XMM state! */
343 cpumR0SaveXMM(pCtx);
344 }
345
346 /*
347 * Restore the original FPU control word and MXCSR.
348 * We don't want the guest to be able to trigger floating point/SSE exceptions on the host.
349 */
350 cpumR0SetFCW(pVCpu->cpum.s.Host.fpu.FCW);
351 if (pVM->cpum.s.CPUFeatures.edx.u1SSE)
352 cpumR0SetMXCSR(pVCpu->cpum.s.Host.fpu.MXCSR);
353#endif /* CPUM_CAN_HANDLE_NM_TRAPS_IN_KERNEL_MODE */
354 }
355
356 pVCpu->cpum.s.fUseFlags &= ~(CPUM_USED_FPU | CPUM_SYNC_FPU_STATE | CPUM_MANUAL_XMM_RESTORE);
357 return VINF_SUCCESS;
358}
359
360
361/**
362 * Save guest debug state
363 *
364 * @returns VBox status code.
365 * @param pVM VM handle.
366 * @param pVCpu VMCPU handle.
367 * @param pCtx CPU context
368 * @param fDR6 Include DR6 or not
369 */
370VMMR0DECL(int) CPUMR0SaveGuestDebugState(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, bool fDR6)
371{
372 Assert(pVCpu->cpum.s.fUseFlags & CPUM_USE_DEBUG_REGS);
373
374 /* Save the guest's debug state. The caller is responsible for DR7. */
375#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
376 if (CPUMIsGuestInLongModeEx(pCtx))
377 {
378 if (!(pVCpu->cpum.s.fUseFlags & CPUM_SYNC_DEBUG_STATE))
379 {
380 uint64_t dr6 = pCtx->dr[6];
381
382 HWACCMR0SaveDebugState(pVM, pVCpu, pCtx);
383 if (!fDR6) /* dr6 was already up-to-date */
384 pCtx->dr[6] = dr6;
385 }
386 }
387 else
388#endif
389 {
390#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
391 cpumR0SaveDRx(&pCtx->dr[0]);
392#else
393 pCtx->dr[0] = ASMGetDR0();
394 pCtx->dr[1] = ASMGetDR1();
395 pCtx->dr[2] = ASMGetDR2();
396 pCtx->dr[3] = ASMGetDR3();
397#endif
398 if (fDR6)
399 pCtx->dr[6] = ASMGetDR6();
400 }
401
402 /*
403 * Restore the host's debug state. DR0-3, DR6 and only then DR7!
404 * DR7 contains 0x400 right now.
405 */
406#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
407 AssertCompile((uintptr_t)&pVCpu->cpum.s.Host.dr3 - (uintptr_t)&pVCpu->cpum.s.Host.dr0 == sizeof(uint64_t) * 3);
408 cpumR0LoadDRx(&pVCpu->cpum.s.Host.dr0);
409#else
410 ASMSetDR0(pVCpu->cpum.s.Host.dr0);
411 ASMSetDR1(pVCpu->cpum.s.Host.dr1);
412 ASMSetDR2(pVCpu->cpum.s.Host.dr2);
413 ASMSetDR3(pVCpu->cpum.s.Host.dr3);
414#endif
415 ASMSetDR6(pVCpu->cpum.s.Host.dr6);
416 ASMSetDR7(pVCpu->cpum.s.Host.dr7);
417
418 pVCpu->cpum.s.fUseFlags &= ~CPUM_USE_DEBUG_REGS;
419 return VINF_SUCCESS;
420}
421
422
423/**
424 * Lazily sync in the debug state
425 *
426 * @returns VBox status code.
427 * @param pVM VM handle.
428 * @param pVCpu VMCPU handle.
429 * @param pCtx CPU context
430 * @param fDR6 Include DR6 or not
431 */
432VMMR0DECL(int) CPUMR0LoadGuestDebugState(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx, bool fDR6)
433{
434 /* Save the host state. */
435#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
436 AssertCompile((uintptr_t)&pVCpu->cpum.s.Host.dr3 - (uintptr_t)&pVCpu->cpum.s.Host.dr0 == sizeof(uint64_t) * 3);
437 cpumR0SaveDRx(&pVCpu->cpum.s.Host.dr0);
438#else
439 pVCpu->cpum.s.Host.dr0 = ASMGetDR0();
440 pVCpu->cpum.s.Host.dr1 = ASMGetDR1();
441 pVCpu->cpum.s.Host.dr2 = ASMGetDR2();
442 pVCpu->cpum.s.Host.dr3 = ASMGetDR3();
443#endif
444 pVCpu->cpum.s.Host.dr6 = ASMGetDR6();
445 /** @todo dr7 might already have been changed to 0x400; don't care right now as it's harmless. */
446 pVCpu->cpum.s.Host.dr7 = ASMGetDR7();
447 /* Make sure DR7 is harmless or else we could trigger breakpoints when restoring dr0-3 (!) */
448 ASMSetDR7(X86_DR7_INIT_VAL);
449
450 /* Activate the guest state DR0-3; DR7 is left to the caller. */
451#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
452 if (CPUMIsGuestInLongModeEx(pCtx))
453 {
454 /* Restore the state on entry as we need to be in 64 bits mode to access the full state. */
455 pVCpu->cpum.s.fUseFlags |= CPUM_SYNC_DEBUG_STATE;
456 }
457 else
458#endif
459 {
460#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
461 cpumR0LoadDRx(&pCtx->dr[0]);
462#else
463 ASMSetDR0(pCtx->dr[0]);
464 ASMSetDR1(pCtx->dr[1]);
465 ASMSetDR2(pCtx->dr[2]);
466 ASMSetDR3(pCtx->dr[3]);
467#endif
468 if (fDR6)
469 ASMSetDR6(pCtx->dr[6]);
470 }
471
472 pVCpu->cpum.s.fUseFlags |= CPUM_USE_DEBUG_REGS;
473 return VINF_SUCCESS;
474}
475
476
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette