VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR0/CPUMR0.cpp@ 49152

Last change on this file since 49152 was 49019, checked in by vboxsync, 11 years ago

VMM: FPU cleanup.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id Revision
File size: 32.7 KB
Line 
1/* $Id: CPUMR0.cpp 49019 2013-10-10 08:45:11Z vboxsync $ */
2/** @file
3 * CPUM - Host Context Ring 0.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*******************************************************************************
20* Header Files *
21*******************************************************************************/
22#define LOG_GROUP LOG_GROUP_CPUM
23#include <VBox/vmm/cpum.h>
24#include "CPUMInternal.h"
25#include <VBox/vmm/vm.h>
26#include <VBox/err.h>
27#include <VBox/log.h>
28#include <VBox/vmm/hm.h>
29#include <iprt/assert.h>
30#include <iprt/asm-amd64-x86.h>
31#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
32# include <iprt/mem.h>
33# include <iprt/memobj.h>
34# include <VBox/apic.h>
35#endif
36#include <iprt/x86.h>
37
38
39/*******************************************************************************
40* Structures and Typedefs *
41*******************************************************************************/
42#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
43/**
44 * Local APIC mappings.
45 */
46typedef struct CPUMHOSTLAPIC
47{
48 /** Indicates that the entry is in use and have valid data. */
49 bool fEnabled;
50 /** Whether it's operating in X2APIC mode (EXTD). */
51 bool fX2Apic;
52 /** The APIC version number. */
53 uint32_t uVersion;
54 /** Has APIC_REG_LVT_THMR. Not used. */
55 uint32_t fHasThermal;
56 /** The physical address of the APIC registers. */
57 RTHCPHYS PhysBase;
58 /** The memory object entering the physical address. */
59 RTR0MEMOBJ hMemObj;
60 /** The mapping object for hMemObj. */
61 RTR0MEMOBJ hMapObj;
62 /** The mapping address APIC registers.
63 * @remarks Different CPUs may use the same physical address to map their
64 * APICs, so this pointer is only valid when on the CPU owning the
65 * APIC. */
66 void *pv;
67} CPUMHOSTLAPIC;
68#endif
69
70
71/*******************************************************************************
72* Global Variables *
73*******************************************************************************/
74#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
75static CPUMHOSTLAPIC g_aLApics[RTCPUSET_MAX_CPUS];
76#endif
77
78
79/*******************************************************************************
80* Internal Functions *
81*******************************************************************************/
82#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
83static int cpumR0MapLocalApics(void);
84static void cpumR0UnmapLocalApics(void);
85#endif
86static int cpumR0SaveHostDebugState(PVMCPU pVCpu);
87
88
89/**
90 * Does the Ring-0 CPU initialization once during module load.
91 * XXX Host-CPU hot-plugging?
92 */
93VMMR0_INT_DECL(int) CPUMR0ModuleInit(void)
94{
95 int rc = VINF_SUCCESS;
96#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
97 rc = cpumR0MapLocalApics();
98#endif
99 return rc;
100}
101
102
103/**
104 * Terminate the module.
105 */
106VMMR0_INT_DECL(int) CPUMR0ModuleTerm(void)
107{
108#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
109 cpumR0UnmapLocalApics();
110#endif
111 return VINF_SUCCESS;
112}
113
114
115/**
116 * Check the CPUID features of this particular CPU and disable relevant features
117 * for the guest which do not exist on this CPU. We have seen systems where the
118 * X86_CPUID_FEATURE_ECX_MONITOR feature flag is only set on some host CPUs, see
119 * @bugref{5436}.
120 *
121 * @note This function might be called simultaneously on more than one CPU!
122 *
123 * @param idCpu The identifier for the CPU the function is called on.
124 * @param pvUser1 Pointer to the VM structure.
125 * @param pvUser2 Ignored.
126 */
127static DECLCALLBACK(void) cpumR0CheckCpuid(RTCPUID idCpu, void *pvUser1, void *pvUser2)
128{
129 struct
130 {
131 uint32_t uLeave; /* leave to check */
132 uint32_t ecx; /* which bits in ecx to unify between CPUs */
133 uint32_t edx; /* which bits in edx to unify between CPUs */
134 } aCpuidUnify[]
135 =
136 {
137 { 0x00000001, X86_CPUID_FEATURE_ECX_CX16
138 | X86_CPUID_FEATURE_ECX_MONITOR,
139 X86_CPUID_FEATURE_EDX_CX8 }
140 };
141 PVM pVM = (PVM)pvUser1;
142 PCPUM pCPUM = &pVM->cpum.s;
143 for (uint32_t i = 0; i < RT_ELEMENTS(aCpuidUnify); i++)
144 {
145 uint32_t uLeave = aCpuidUnify[i].uLeave;
146 uint32_t eax, ebx, ecx, edx;
147
148 ASMCpuId_Idx_ECX(uLeave, 0, &eax, &ebx, &ecx, &edx);
149 PCPUMCPUID paLeaves;
150 if (uLeave < 0x80000000)
151 paLeaves = &pCPUM->aGuestCpuIdStd[uLeave - 0x00000000];
152 else if (uLeave < 0xc0000000)
153 paLeaves = &pCPUM->aGuestCpuIdExt[uLeave - 0x80000000];
154 else
155 paLeaves = &pCPUM->aGuestCpuIdCentaur[uLeave - 0xc0000000];
156 /* unify important bits */
157 ASMAtomicAndU32(&paLeaves->ecx, ecx | ~aCpuidUnify[i].ecx);
158 ASMAtomicAndU32(&paLeaves->edx, edx | ~aCpuidUnify[i].edx);
159 }
160}
161
162
163/**
164 * Does Ring-0 CPUM initialization.
165 *
166 * This is mainly to check that the Host CPU mode is compatible
167 * with VBox.
168 *
169 * @returns VBox status code.
170 * @param pVM Pointer to the VM.
171 */
172VMMR0_INT_DECL(int) CPUMR0InitVM(PVM pVM)
173{
174 LogFlow(("CPUMR0Init: %p\n", pVM));
175
176 /*
177 * Check CR0 & CR4 flags.
178 */
179 uint32_t u32CR0 = ASMGetCR0();
180 if ((u32CR0 & (X86_CR0_PE | X86_CR0_PG)) != (X86_CR0_PE | X86_CR0_PG)) /* a bit paranoid perhaps.. */
181 {
182 Log(("CPUMR0Init: PE or PG not set. cr0=%#x\n", u32CR0));
183 return VERR_UNSUPPORTED_CPU_MODE;
184 }
185
186 /*
187 * Check for sysenter and syscall usage.
188 */
189 if (ASMHasCpuId())
190 {
191 /*
192 * SYSENTER/SYSEXIT
193 *
194 * Intel docs claim you should test both the flag and family, model &
195 * stepping because some Pentium Pro CPUs have the SEP cpuid flag set,
196 * but don't support it. AMD CPUs may support this feature in legacy
197 * mode, they've banned it from long mode. Since we switch to 32-bit
198 * mode when entering raw-mode context the feature would become
199 * accessible again on AMD CPUs, so we have to check regardless of
200 * host bitness.
201 */
202 uint32_t u32CpuVersion;
203 uint32_t u32Dummy;
204 uint32_t fFeatures;
205 ASMCpuId(1, &u32CpuVersion, &u32Dummy, &u32Dummy, &fFeatures);
206 uint32_t const u32Family = u32CpuVersion >> 8;
207 uint32_t const u32Model = (u32CpuVersion >> 4) & 0xF;
208 uint32_t const u32Stepping = u32CpuVersion & 0xF;
209 if ( (fFeatures & X86_CPUID_FEATURE_EDX_SEP)
210 && ( u32Family != 6 /* (> pentium pro) */
211 || u32Model >= 3
212 || u32Stepping >= 3
213 || !ASMIsIntelCpu())
214 )
215 {
216 /*
217 * Read the MSR and see if it's in use or not.
218 */
219 uint32_t u32 = ASMRdMsr_Low(MSR_IA32_SYSENTER_CS);
220 if (u32)
221 {
222 pVM->cpum.s.fHostUseFlags |= CPUM_USE_SYSENTER;
223 Log(("CPUMR0Init: host uses sysenter cs=%08x%08x\n", ASMRdMsr_High(MSR_IA32_SYSENTER_CS), u32));
224 }
225 }
226
227 /*
228 * SYSCALL/SYSRET
229 *
230 * This feature is indicated by the SEP bit returned in EDX by CPUID
231 * function 0x80000001. Intel CPUs only supports this feature in
232 * long mode. Since we're not running 64-bit guests in raw-mode there
233 * are no issues with 32-bit intel hosts.
234 */
235 uint32_t cExt = 0;
236 ASMCpuId(0x80000000, &cExt, &u32Dummy, &u32Dummy, &u32Dummy);
237 if (ASMIsValidExtRange(cExt))
238 {
239 uint32_t fExtFeaturesEDX = ASMCpuId_EDX(0x80000001);
240 if (fExtFeaturesEDX & X86_CPUID_EXT_FEATURE_EDX_SYSCALL)
241 {
242#ifdef RT_ARCH_X86
243# ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
244 if (fExtFeaturesEDX & X86_CPUID_EXT_FEATURE_EDX_LONG_MODE)
245# else
246 if (!ASMIsIntelCpu())
247# endif
248#endif
249 {
250 uint64_t fEfer = ASMRdMsr(MSR_K6_EFER);
251 if (fEfer & MSR_K6_EFER_SCE)
252 {
253 pVM->cpum.s.fHostUseFlags |= CPUM_USE_SYSCALL;
254 Log(("CPUMR0Init: host uses syscall\n"));
255 }
256 }
257 }
258 }
259
260 RTMpOnAll(cpumR0CheckCpuid, pVM, NULL);
261 }
262
263
264 /*
265 * Check if debug registers are armed.
266 * This ASSUMES that DR7.GD is not set, or that it's handled transparently!
267 */
268 uint32_t u32DR7 = ASMGetDR7();
269 if (u32DR7 & X86_DR7_ENABLED_MASK)
270 {
271 for (VMCPUID i = 0; i < pVM->cCpus; i++)
272 pVM->aCpus[i].cpum.s.fUseFlags |= CPUM_USE_DEBUG_REGS_HOST;
273 Log(("CPUMR0Init: host uses debug registers (dr7=%x)\n", u32DR7));
274 }
275
276 return VINF_SUCCESS;
277}
278
279
280/**
281 * Trap handler for device-not-available fault (#NM).
282 * Device not available, FP or (F)WAIT instruction.
283 *
284 * @returns VBox status code.
285 * @retval VINF_SUCCESS if the guest FPU state is loaded.
286 * @retval VINF_EM_RAW_GUEST_TRAP if it is a guest trap.
287 *
288 * @param pVM Pointer to the VM.
289 * @param pVCpu Pointer to the VMCPU.
290 * @param pCtx Pointer to the guest-CPU context.
291 */
292VMMR0_INT_DECL(int) CPUMR0Trap07Handler(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
293{
294 Assert(pVM->cpum.s.CPUFeatures.edx.u1FXSR);
295 Assert(ASMGetCR4() & X86_CR4_OSFSXR);
296
297 /* If the FPU state has already been loaded, then it's a guest trap. */
298 if (CPUMIsGuestFPUStateActive(pVCpu))
299 {
300 Assert( ((pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS)) == (X86_CR0_MP | X86_CR0_TS))
301 || ((pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS)) == (X86_CR0_MP | X86_CR0_TS | X86_CR0_EM)));
302 return VINF_EM_RAW_GUEST_TRAP;
303 }
304
305 /*
306 * There are two basic actions:
307 * 1. Save host fpu and restore guest fpu.
308 * 2. Generate guest trap.
309 *
310 * When entering the hypervisor we'll always enable MP (for proper wait
311 * trapping) and TS (for intercepting all fpu/mmx/sse stuff). The EM flag
312 * is taken from the guest OS in order to get proper SSE handling.
313 *
314 *
315 * Actions taken depending on the guest CR0 flags:
316 *
317 * 3 2 1
318 * TS | EM | MP | FPUInstr | WAIT :: VMM Action
319 * ------------------------------------------------------------------------
320 * 0 | 0 | 0 | Exec | Exec :: Clear TS & MP, Save HC, Load GC.
321 * 0 | 0 | 1 | Exec | Exec :: Clear TS, Save HC, Load GC.
322 * 0 | 1 | 0 | #NM | Exec :: Clear TS & MP, Save HC, Load GC.
323 * 0 | 1 | 1 | #NM | Exec :: Clear TS, Save HC, Load GC.
324 * 1 | 0 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already cleared.)
325 * 1 | 0 | 1 | #NM | #NM :: Go to guest taking trap there.
326 * 1 | 1 | 0 | #NM | Exec :: Clear MP, Save HC, Load GC. (EM is already set.)
327 * 1 | 1 | 1 | #NM | #NM :: Go to guest taking trap there.
328 */
329
330 switch (pCtx->cr0 & (X86_CR0_MP | X86_CR0_EM | X86_CR0_TS))
331 {
332 case X86_CR0_MP | X86_CR0_TS:
333 case X86_CR0_MP | X86_CR0_TS | X86_CR0_EM:
334 return VINF_EM_RAW_GUEST_TRAP;
335 default:
336 break;
337 }
338
339 return CPUMR0LoadGuestFPU(pVM, pVCpu, pCtx);
340}
341
342
343/**
344 * Saves the host-FPU/XMM state and loads the guest-FPU state into the CPU.
345 *
346 * @returns VBox status code.
347 *
348 * @param pVM Pointer to the VM.
349 * @param pVCpu Pointer to the VMCPU.
350 * @param pCtx Pointer to the guest-CPU context.
351 */
352VMMR0_INT_DECL(int) CPUMR0LoadGuestFPU(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
353{
354 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
355#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
356 if (CPUMIsGuestInLongModeEx(pCtx))
357 {
358 Assert(!(pVCpu->cpum.s.fUseFlags & CPUM_SYNC_FPU_STATE));
359
360 /* Save the host state and record the fact (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM). */
361 cpumR0SaveHostFPUState(&pVCpu->cpum.s);
362
363 /* Restore the state on entry as we need to be in 64-bit mode to access the full state. */
364 pVCpu->cpum.s.fUseFlags |= CPUM_SYNC_FPU_STATE;
365 }
366 else
367#endif
368 {
369 Assert(!(pVCpu->cpum.s.fUseFlags & CPUM_USED_MANUAL_XMM_RESTORE));
370 /** @todo Move the FFXR handling down into
371 * cpumR0SaveHostRestoreGuestFPUState to optimize the
372 * VBOX_WITH_KERNEL_USING_XMM handling. */
373 /* Clear MSR_K6_EFER_FFXSR or else we'll be unable to save/restore the XMM state with fxsave/fxrstor. */
374 uint64_t uHostEfer = 0;
375 bool fRestoreEfer = false;
376 if (pVM->cpum.s.CPUFeaturesExt.edx & X86_CPUID_AMD_FEATURE_EDX_FFXSR)
377 {
378 uHostEfer = ASMRdMsr(MSR_K6_EFER);
379 if (uHostEfer & MSR_K6_EFER_FFXSR)
380 {
381 ASMWrMsr(MSR_K6_EFER, uHostEfer & ~MSR_K6_EFER_FFXSR);
382 pVCpu->cpum.s.fUseFlags |= CPUM_USED_MANUAL_XMM_RESTORE;
383 fRestoreEfer = true;
384 }
385 }
386
387 /* Do the job and record that we've switched FPU state. */
388 cpumR0SaveHostRestoreGuestFPUState(&pVCpu->cpum.s);
389
390 /* Restore EFER. */
391 if (fRestoreEfer)
392 ASMWrMsr(MSR_K6_EFER, uHostEfer);
393 }
394
395 Assert((pVCpu->cpum.s.fUseFlags & (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM)) == (CPUM_USED_FPU | CPUM_USED_FPU_SINCE_REM));
396 return VINF_SUCCESS;
397}
398
399
400/**
401 * Save guest FPU/XMM state
402 *
403 * @returns VBox status code.
404 * @param pVM Pointer to the VM.
405 * @param pVCpu Pointer to the VMCPU.
406 * @param pCtx Pointer to the guest CPU context.
407 */
408VMMR0_INT_DECL(int) CPUMR0SaveGuestFPU(PVM pVM, PVMCPU pVCpu, PCPUMCTX pCtx)
409{
410 Assert(pVM->cpum.s.CPUFeatures.edx.u1FXSR);
411 Assert(ASMGetCR4() & X86_CR4_OSFSXR);
412 AssertReturn((pVCpu->cpum.s.fUseFlags & CPUM_USED_FPU), VINF_SUCCESS);
413 NOREF(pCtx);
414
415#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
416 if (CPUMIsGuestInLongModeEx(pCtx))
417 {
418 if (!(pVCpu->cpum.s.fUseFlags & CPUM_SYNC_FPU_STATE))
419 {
420 HMR0SaveFPUState(pVM, pVCpu, pCtx);
421 cpumR0RestoreHostFPUState(&pVCpu->cpum.s);
422 }
423 /* else nothing to do; we didn't perform a world switch */
424 }
425 else
426#endif
427 {
428#ifdef VBOX_WITH_KERNEL_USING_XMM
429 /*
430 * We've already saved the XMM registers in the assembly wrapper, so
431 * we have to save them before saving the entire FPU state and put them
432 * back afterwards.
433 */
434 /** @todo This could be skipped if MSR_K6_EFER_FFXSR is set, but
435 * I'm not able to test such an optimization tonight.
436 * We could just all this in assembly. */
437 uint128_t aGuestXmmRegs[16];
438 memcpy(&aGuestXmmRegs[0], &pVCpu->cpum.s.Guest.fpu.aXMM[0], sizeof(aGuestXmmRegs));
439#endif
440
441 /* Clear MSR_K6_EFER_FFXSR or else we'll be unable to save/restore the XMM state with fxsave/fxrstor. */
442 uint64_t uHostEfer = 0;
443 bool fRestoreEfer = false;
444 if (pVCpu->cpum.s.fUseFlags & CPUM_USED_MANUAL_XMM_RESTORE)
445 {
446 uHostEfer = ASMRdMsr(MSR_K6_EFER);
447 if (uHostEfer & MSR_K6_EFER_FFXSR)
448 {
449 ASMWrMsr(MSR_K6_EFER, uHostEfer & ~MSR_K6_EFER_FFXSR);
450 fRestoreEfer = true;
451 }
452 }
453
454 cpumR0SaveGuestRestoreHostFPUState(&pVCpu->cpum.s);
455
456 /* Restore EFER MSR */
457 if (fRestoreEfer)
458 ASMWrMsr(MSR_K6_EFER, uHostEfer | MSR_K6_EFER_FFXSR);
459
460#ifdef VBOX_WITH_KERNEL_USING_XMM
461 memcpy(&pVCpu->cpum.s.Guest.fpu.aXMM[0], &aGuestXmmRegs[0], sizeof(aGuestXmmRegs));
462#endif
463 }
464
465 pVCpu->cpum.s.fUseFlags &= ~(CPUM_USED_FPU | CPUM_SYNC_FPU_STATE | CPUM_USED_MANUAL_XMM_RESTORE);
466 return VINF_SUCCESS;
467}
468
469
470/**
471 * Saves the host debug state, setting CPUM_USED_HOST_DEBUG_STATE and loading
472 * DR7 with safe values.
473 *
474 * @returns VBox status code.
475 * @param pVCpu Pointer to the VMCPU.
476 */
477static int cpumR0SaveHostDebugState(PVMCPU pVCpu)
478{
479 /*
480 * Save the host state.
481 */
482#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
483 AssertCompile((uintptr_t)&pVCpu->cpum.s.Host.dr3 - (uintptr_t)&pVCpu->cpum.s.Host.dr0 == sizeof(uint64_t) * 3);
484 cpumR0SaveDRx(&pVCpu->cpum.s.Host.dr0);
485#else
486 pVCpu->cpum.s.Host.dr0 = ASMGetDR0();
487 pVCpu->cpum.s.Host.dr1 = ASMGetDR1();
488 pVCpu->cpum.s.Host.dr2 = ASMGetDR2();
489 pVCpu->cpum.s.Host.dr3 = ASMGetDR3();
490#endif
491 pVCpu->cpum.s.Host.dr6 = ASMGetDR6();
492 /** @todo dr7 might already have been changed to 0x400; don't care right now as it's harmless. */
493 pVCpu->cpum.s.Host.dr7 = ASMGetDR7();
494
495 /* Preemption paranoia. */
496 ASMAtomicOrU32(&pVCpu->cpum.s.fUseFlags, CPUM_USED_DEBUG_REGS_HOST);
497
498 /*
499 * Make sure DR7 is harmless or else we could trigger breakpoints when
500 * load guest or hypervisor DRx values later.
501 */
502 if (pVCpu->cpum.s.Host.dr7 != X86_DR7_INIT_VAL)
503 ASMSetDR7(X86_DR7_INIT_VAL);
504
505 return VINF_SUCCESS;
506}
507
508
509/**
510 * Saves the guest DRx state residing in host registers and restore the host
511 * register values.
512 *
513 * The guest DRx state is only saved if CPUMR0LoadGuestDebugState was called,
514 * since it's assumed that we're shadowing the guest DRx register values
515 * accurately when using the combined hypervisor debug register values
516 * (CPUMR0LoadHyperDebugState).
517 *
518 * @returns true if either guest or hypervisor debug registers were loaded.
519 * @param pVCpu The cross context CPU structure for the calling EMT.
520 * @param fDr6 Whether to include DR6 or not.
521 * @thread EMT(pVCpu)
522 */
523VMMR0_INT_DECL(bool) CPUMR0DebugStateMaybeSaveGuestAndRestoreHost(PVMCPU pVCpu, bool fDr6)
524{
525 Assert(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
526 bool const fDrXLoaded = RT_BOOL(pVCpu->cpum.s.fUseFlags & (CPUM_USED_DEBUG_REGS_GUEST | CPUM_USED_DEBUG_REGS_HYPER));
527
528 /*
529 * Do we need to save the guest DRx registered loaded into host registers?
530 * (DR7 and DR6 (if fDr6 is true) are left to the caller.)
531 */
532 if (pVCpu->cpum.s.fUseFlags & CPUM_USED_DEBUG_REGS_GUEST)
533 {
534#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
535 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.s.Guest))
536 {
537 uint64_t uDr6 = pVCpu->cpum.s.Guest.dr[6];
538 HMR0SaveDebugState(pVCpu->CTX_SUFF(pVM), pVCpu, &pVCpu->cpum.s.Guest);
539 if (!fDr6)
540 pVCpu->cpum.s.Guest.dr[6] = uDr6;
541 }
542 else
543#endif
544 {
545#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
546 cpumR0SaveDRx(&pVCpu->cpum.s.Guest.dr[0]);
547#else
548 pVCpu->cpum.s.Guest.dr[0] = ASMGetDR0();
549 pVCpu->cpum.s.Guest.dr[1] = ASMGetDR1();
550 pVCpu->cpum.s.Guest.dr[2] = ASMGetDR2();
551 pVCpu->cpum.s.Guest.dr[3] = ASMGetDR3();
552#endif
553 if (fDr6)
554 pVCpu->cpum.s.Guest.dr[6] = ASMGetDR6();
555 }
556 }
557 ASMAtomicAndU32(&pVCpu->cpum.s.fUseFlags, ~( CPUM_USED_DEBUG_REGS_GUEST | CPUM_USED_DEBUG_REGS_HYPER
558 | CPUM_SYNC_DEBUG_REGS_GUEST | CPUM_SYNC_DEBUG_REGS_HYPER));
559
560 /*
561 * Restore the host's debug state. DR0-3, DR6 and only then DR7!
562 */
563 if (pVCpu->cpum.s.fUseFlags & CPUM_USED_DEBUG_REGS_HOST)
564 {
565 /* A bit of paranoia first... */
566 uint64_t uCurDR7 = ASMGetDR7();
567 if (uCurDR7 != X86_DR7_INIT_VAL)
568 ASMSetDR7(X86_DR7_INIT_VAL);
569
570#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
571 AssertCompile((uintptr_t)&pVCpu->cpum.s.Host.dr3 - (uintptr_t)&pVCpu->cpum.s.Host.dr0 == sizeof(uint64_t) * 3);
572 cpumR0LoadDRx(&pVCpu->cpum.s.Host.dr0);
573#else
574 ASMSetDR0(pVCpu->cpum.s.Host.dr0);
575 ASMSetDR1(pVCpu->cpum.s.Host.dr1);
576 ASMSetDR2(pVCpu->cpum.s.Host.dr2);
577 ASMSetDR3(pVCpu->cpum.s.Host.dr3);
578#endif
579 /** @todo consider only updating if they differ, esp. DR6. Need to figure how
580 * expensive DRx reads are over DRx writes. */
581 ASMSetDR6(pVCpu->cpum.s.Host.dr6);
582 ASMSetDR7(pVCpu->cpum.s.Host.dr7);
583
584 ASMAtomicAndU32(&pVCpu->cpum.s.fUseFlags, ~CPUM_USED_DEBUG_REGS_HOST);
585 }
586
587 return fDrXLoaded;
588}
589
590
591/**
592 * Saves the guest DRx state if it resides host registers.
593 *
594 * This does NOT clear any use flags, so the host registers remains loaded with
595 * the guest DRx state upon return. The purpose is only to make sure the values
596 * in the CPU context structure is up to date.
597 *
598 * @returns true if the host registers contains guest values, false if not.
599 * @param pVCpu The cross context CPU structure for the calling EMT.
600 * @param fDr6 Whether to include DR6 or not.
601 * @thread EMT(pVCpu)
602 */
603VMMR0_INT_DECL(bool) CPUMR0DebugStateMaybeSaveGuest(PVMCPU pVCpu, bool fDr6)
604{
605 /*
606 * Do we need to save the guest DRx registered loaded into host registers?
607 * (DR7 and DR6 (if fDr6 is true) are left to the caller.)
608 */
609 if (pVCpu->cpum.s.fUseFlags & CPUM_USED_DEBUG_REGS_GUEST)
610 {
611#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
612 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.s.Guest))
613 {
614 uint64_t uDr6 = pVCpu->cpum.s.Guest.dr[6];
615 HMR0SaveDebugState(pVCpu->CTX_SUFF(pVM), pVCpu, &pVCpu->cpum.s.Guest);
616 if (!fDr6)
617 pVCpu->cpum.s.Guest.dr[6] = uDr6;
618 }
619 else
620#endif
621 {
622#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
623 cpumR0SaveDRx(&pVCpu->cpum.s.Guest.dr[0]);
624#else
625 pVCpu->cpum.s.Guest.dr[0] = ASMGetDR0();
626 pVCpu->cpum.s.Guest.dr[1] = ASMGetDR1();
627 pVCpu->cpum.s.Guest.dr[2] = ASMGetDR2();
628 pVCpu->cpum.s.Guest.dr[3] = ASMGetDR3();
629#endif
630 if (fDr6)
631 pVCpu->cpum.s.Guest.dr[6] = ASMGetDR6();
632 }
633 return true;
634 }
635 return false;
636}
637
638
639/**
640 * Lazily sync in the debug state.
641 *
642 * @param pVCpu The cross context CPU structure for the calling EMT.
643 * @param fDr6 Whether to include DR6 or not.
644 * @thread EMT(pVCpu)
645 */
646VMMR0_INT_DECL(void) CPUMR0LoadGuestDebugState(PVMCPU pVCpu, bool fDr6)
647{
648 /*
649 * Save the host state and disarm all host BPs.
650 */
651 cpumR0SaveHostDebugState(pVCpu);
652 Assert(ASMGetDR7() == X86_DR7_INIT_VAL);
653
654 /*
655 * Activate the guest state DR0-3.
656 * DR7 and DR6 (if fDr6 is true) are left to the caller.
657 */
658#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
659 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.s.Guest))
660 ASMAtomicOrU32(&pVCpu->cpum.s.fUseFlags, CPUM_SYNC_DEBUG_REGS_GUEST); /* Postpone it to the world switch. */
661 else
662#endif
663 {
664#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
665 cpumR0LoadDRx(&pVCpu->cpum.s.Guest.dr[0]);
666#else
667 ASMSetDR0(pVCpu->cpum.s.Guest.dr[0]);
668 ASMSetDR1(pVCpu->cpum.s.Guest.dr[1]);
669 ASMSetDR2(pVCpu->cpum.s.Guest.dr[2]);
670 ASMSetDR3(pVCpu->cpum.s.Guest.dr[3]);
671#endif
672 if (fDr6)
673 ASMSetDR6(pVCpu->cpum.s.Guest.dr[6]);
674
675 ASMAtomicOrU32(&pVCpu->cpum.s.fUseFlags, CPUM_USED_DEBUG_REGS_GUEST);
676 }
677}
678
679
680/**
681 * Lazily sync in the hypervisor debug state
682 *
683 * @returns VBox status code.
684 * @param pVCpu The cross context CPU structure for the calling EMT.
685 * @param fDr6 Whether to include DR6 or not.
686 * @thread EMT(pVCpu)
687 */
688VMMR0_INT_DECL(void) CPUMR0LoadHyperDebugState(PVMCPU pVCpu, bool fDr6)
689{
690 /*
691 * Save the host state and disarm all host BPs.
692 */
693 cpumR0SaveHostDebugState(pVCpu);
694 Assert(ASMGetDR7() == X86_DR7_INIT_VAL);
695
696 /*
697 * Make sure the hypervisor values are up to date.
698 */
699 CPUMRecalcHyperDRx(pVCpu, UINT8_MAX /* no loading, please */, true);
700
701 /*
702 * Activate the guest state DR0-3.
703 * DR7 and DR6 (if fDr6 is true) are left to the caller.
704 */
705#if HC_ARCH_BITS == 32 && defined(VBOX_WITH_64_BITS_GUESTS) && !defined(VBOX_WITH_HYBRID_32BIT_KERNEL)
706 if (CPUMIsGuestInLongModeEx(&pVCpu->cpum.s.Guest))
707 ASMAtomicOrU32(&pVCpu->cpum.s.fUseFlags, CPUM_SYNC_DEBUG_REGS_HYPER); /* Postpone it. */
708 else
709#endif
710 {
711#ifdef VBOX_WITH_HYBRID_32BIT_KERNEL
712 cpumR0LoadDRx(&pVCpu->cpum.s.Hyper.dr[0]);
713#else
714 ASMSetDR0(pVCpu->cpum.s.Hyper.dr[0]);
715 ASMSetDR1(pVCpu->cpum.s.Hyper.dr[1]);
716 ASMSetDR2(pVCpu->cpum.s.Hyper.dr[2]);
717 ASMSetDR3(pVCpu->cpum.s.Hyper.dr[3]);
718#endif
719 if (fDr6)
720 ASMSetDR6(X86_DR6_INIT_VAL);
721
722 ASMAtomicOrU32(&pVCpu->cpum.s.fUseFlags, CPUM_USED_DEBUG_REGS_HYPER);
723 }
724}
725
726#ifdef VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI
727
728/**
729 * Per-CPU callback that probes the CPU for APIC support.
730 *
731 * @param idCpu The identifier for the CPU the function is called on.
732 * @param pvUser1 Ignored.
733 * @param pvUser2 Ignored.
734 */
735static DECLCALLBACK(void) cpumR0MapLocalApicCpuProber(RTCPUID idCpu, void *pvUser1, void *pvUser2)
736{
737 NOREF(pvUser1); NOREF(pvUser2);
738 int iCpu = RTMpCpuIdToSetIndex(idCpu);
739 AssertReturnVoid(iCpu >= 0 && (unsigned)iCpu < RT_ELEMENTS(g_aLApics));
740
741 /*
742 * Check for APIC support.
743 */
744 uint32_t uMaxLeaf, u32EBX, u32ECX, u32EDX;
745 ASMCpuId(0, &uMaxLeaf, &u32EBX, &u32ECX, &u32EDX);
746 if ( ( ASMIsIntelCpuEx(u32EBX, u32ECX, u32EDX)
747 || ASMIsAmdCpuEx(u32EBX, u32ECX, u32EDX)
748 || ASMIsViaCentaurCpuEx(u32EBX, u32ECX, u32EDX))
749 && ASMIsValidStdRange(uMaxLeaf))
750 {
751 uint32_t uDummy;
752 ASMCpuId(1, &uDummy, &u32EBX, &u32ECX, &u32EDX);
753 if ( (u32EDX & X86_CPUID_FEATURE_EDX_APIC)
754 && (u32EDX & X86_CPUID_FEATURE_EDX_MSR))
755 {
756 /*
757 * Safe to access the MSR. Read it and calc the BASE (a little complicated).
758 */
759 uint64_t u64ApicBase = ASMRdMsr(MSR_IA32_APICBASE);
760 uint64_t u64Mask = MSR_IA32_APICBASE_BASE_MIN;
761
762 /* see Intel Manual: Local APIC Status and Location: MAXPHYADDR default is bit 36 */
763 uint32_t uMaxExtLeaf;
764 ASMCpuId(0x80000000, &uMaxExtLeaf, &u32EBX, &u32ECX, &u32EDX);
765 if ( uMaxExtLeaf >= UINT32_C(0x80000008)
766 && ASMIsValidExtRange(uMaxExtLeaf))
767 {
768 uint32_t u32PhysBits;
769 ASMCpuId(0x80000008, &u32PhysBits, &u32EBX, &u32ECX, &u32EDX);
770 u32PhysBits &= 0xff;
771 u64Mask = ((UINT64_C(1) << u32PhysBits) - 1) & UINT64_C(0xfffffffffffff000);
772 }
773
774 AssertCompile(sizeof(g_aLApics[iCpu].PhysBase) == sizeof(u64ApicBase));
775 g_aLApics[iCpu].PhysBase = u64ApicBase & u64Mask;
776 g_aLApics[iCpu].fEnabled = RT_BOOL(u64ApicBase & MSR_IA32_APICBASE_EN);
777 g_aLApics[iCpu].fX2Apic = (u64ApicBase & (MSR_IA32_APICBASE_EXTD | MSR_IA32_APICBASE_EN))
778 == (MSR_IA32_APICBASE_EXTD | MSR_IA32_APICBASE_EN);
779 }
780 }
781}
782
783
784
785/**
786 * Per-CPU callback that verifies our APIC expectations.
787 *
788 * @param idCpu The identifier for the CPU the function is called on.
789 * @param pvUser1 Ignored.
790 * @param pvUser2 Ignored.
791 */
792static DECLCALLBACK(void) cpumR0MapLocalApicCpuChecker(RTCPUID idCpu, void *pvUser1, void *pvUser2)
793{
794 int iCpu = RTMpCpuIdToSetIndex(idCpu);
795 AssertReturnVoid(iCpu >= 0 && (unsigned)iCpu < RT_ELEMENTS(g_aLApics));
796 if (!g_aLApics[iCpu].fEnabled)
797 return;
798
799 /*
800 * 0x0X 82489 external APIC
801 * 0x1X Local APIC
802 * 0x2X..0xFF reserved
803 */
804 uint32_t uApicVersion;
805 if (g_aLApics[iCpu].fX2Apic)
806 uApicVersion = ApicX2RegRead32(APIC_REG_VERSION);
807 else
808 uApicVersion = ApicRegRead(g_aLApics[iCpu].pv, APIC_REG_VERSION);
809 if ((APIC_REG_VERSION_GET_VER(uApicVersion) & 0xF0) == 0x10)
810 {
811 g_aLApics[iCpu].uVersion = uApicVersion;
812 g_aLApics[iCpu].fHasThermal = APIC_REG_VERSION_GET_MAX_LVT(uApicVersion) >= 5;
813
814#if 0 /* enable if you need it. */
815 if (g_aLApics[iCpu].fX2Apic)
816 SUPR0Printf("CPUM: X2APIC %02u - ver %#010x, lint0=%#07x lint1=%#07x pc=%#07x thmr=%#07x\n",
817 iCpu, uApicVersion,
818 ApicX2RegRead32(APIC_REG_LVT_LINT0), ApicX2RegRead32(APIC_REG_LVT_LINT1),
819 ApicX2RegRead32(APIC_REG_LVT_PC), ApicX2RegRead32(APIC_REG_LVT_THMR) );
820 else
821 SUPR0Printf("CPUM: APIC %02u at %RGp (mapped at %p) - ver %#010x, lint0=%#07x lint1=%#07x pc=%#07x thmr=%#07x\n",
822 iCpu, g_aLApics[iCpu].PhysBase, g_aLApics[iCpu].pv, uApicVersion,
823 ApicRegRead(g_aLApics[iCpu].pv, APIC_REG_LVT_LINT0), ApicRegRead(g_aLApics[iCpu].pv, APIC_REG_LVT_LINT1),
824 ApicRegRead(g_aLApics[iCpu].pv, APIC_REG_LVT_PC), ApicRegRead(g_aLApics[iCpu].pv, APIC_REG_LVT_THMR) );
825#endif
826 }
827 else
828 {
829 g_aLApics[iCpu].fEnabled = false;
830 g_aLApics[iCpu].fX2Apic = false;
831 SUPR0Printf("VBox/CPUM: Unsupported APIC version %#x (iCpu=%d)\n", uApicVersion, iCpu);
832 }
833}
834
835
836/**
837 * Map the MMIO page of each local APIC in the system.
838 */
839static int cpumR0MapLocalApics(void)
840{
841 /*
842 * Check that we'll always stay within the array bounds.
843 */
844 if (RTMpGetArraySize() > RT_ELEMENTS(g_aLApics))
845 {
846 LogRel(("CPUM: Too many real CPUs/cores/threads - %u, max %u\n", RTMpGetArraySize(), RT_ELEMENTS(g_aLApics)));
847 return VERR_TOO_MANY_CPUS;
848 }
849
850 /*
851 * Create mappings for all online CPUs we think have legacy APICs.
852 */
853 int rc = RTMpOnAll(cpumR0MapLocalApicCpuProber, NULL, NULL);
854
855 for (unsigned iCpu = 0; RT_SUCCESS(rc) && iCpu < RT_ELEMENTS(g_aLApics); iCpu++)
856 {
857 if (g_aLApics[iCpu].fEnabled && !g_aLApics[iCpu].fX2Apic)
858 {
859 rc = RTR0MemObjEnterPhys(&g_aLApics[iCpu].hMemObj, g_aLApics[iCpu].PhysBase,
860 PAGE_SIZE, RTMEM_CACHE_POLICY_MMIO);
861 if (RT_SUCCESS(rc))
862 {
863 rc = RTR0MemObjMapKernel(&g_aLApics[iCpu].hMapObj, g_aLApics[iCpu].hMemObj, (void *)-1,
864 PAGE_SIZE, RTMEM_PROT_READ | RTMEM_PROT_WRITE);
865 if (RT_SUCCESS(rc))
866 {
867 g_aLApics[iCpu].pv = RTR0MemObjAddress(g_aLApics[iCpu].hMapObj);
868 continue;
869 }
870 RTR0MemObjFree(g_aLApics[iCpu].hMemObj, true /* fFreeMappings */);
871 }
872 g_aLApics[iCpu].fEnabled = false;
873 }
874 g_aLApics[iCpu].pv = NULL;
875 }
876
877 /*
878 * Check the APICs.
879 */
880 if (RT_SUCCESS(rc))
881 rc = RTMpOnAll(cpumR0MapLocalApicCpuChecker, NULL, NULL);
882
883 if (RT_FAILURE(rc))
884 {
885 cpumR0UnmapLocalApics();
886 return rc;
887 }
888
889#ifdef LOG_ENABLED
890 /*
891 * Log the result (pretty useless, requires enabling CPUM in VBoxDrv
892 * and !VBOX_WITH_R0_LOGGING).
893 */
894 if (LogIsEnabled())
895 {
896 uint32_t cEnabled = 0;
897 uint32_t cX2Apics = 0;
898 for (unsigned iCpu = 0; iCpu < RT_ELEMENTS(g_aLApics); iCpu++)
899 if (g_aLApics[iCpu].fEnabled)
900 {
901 cEnabled++;
902 cX2Apics += g_aLApics[iCpu].fX2Apic;
903 }
904 Log(("CPUM: %u APICs, %u X2APICs\n", cEnabled, cX2Apics));
905 }
906#endif
907
908 return VINF_SUCCESS;
909}
910
911
912/**
913 * Unmap the Local APIC of all host CPUs.
914 */
915static void cpumR0UnmapLocalApics(void)
916{
917 for (unsigned iCpu = RT_ELEMENTS(g_aLApics); iCpu-- > 0;)
918 {
919 if (g_aLApics[iCpu].pv)
920 {
921 RTR0MemObjFree(g_aLApics[iCpu].hMapObj, true /* fFreeMappings */);
922 RTR0MemObjFree(g_aLApics[iCpu].hMemObj, true /* fFreeMappings */);
923 g_aLApics[iCpu].hMapObj = NIL_RTR0MEMOBJ;
924 g_aLApics[iCpu].hMemObj = NIL_RTR0MEMOBJ;
925 g_aLApics[iCpu].fEnabled = false;
926 g_aLApics[iCpu].fX2Apic = false;
927 g_aLApics[iCpu].pv = NULL;
928 }
929 }
930}
931
932
933/**
934 * Updates CPUMCPU::pvApicBase and CPUMCPU::fX2Apic prior to world switch.
935 *
936 * Writes the Local APIC mapping address of the current host CPU to CPUMCPU so
937 * the world switchers can access the APIC registers for the purpose of
938 * disabling and re-enabling the NMIs. Must be called with disabled preemption
939 * or disabled interrupts!
940 *
941 * @param pVCpu Pointer to the cross context CPU structure of the
942 * calling EMT.
943 * @param idHostCpu The ID of the current host CPU.
944 */
945VMMR0_INT_DECL(void) CPUMR0SetLApic(PVMCPU pVCpu, RTCPUID idHostCpu)
946{
947 int idxCpu = RTMpCpuIdToSetIndex(idHostCpu);
948 pVCpu->cpum.s.pvApicBase = g_aLApics[idxCpu].pv;
949 pVCpu->cpum.s.fX2Apic = g_aLApics[idxCpu].fX2Apic;
950// Log6(("CPUMR0SetLApic: pvApicBase=%p fX2Apic=%d\n", g_aLApics[idxCpu].pv, g_aLApics[idxCpu].fX2Apic));
951}
952
953#endif /* VBOX_WITH_VMMR0_DISABLE_LAPIC_NMI */
954
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette