VirtualBox

source: vbox/trunk/src/VBox/VMM/VMMR3/GIMKvm.cpp@ 55628

Last change on this file since 55628 was 55510, checked in by vboxsync, 10 years ago

VMM/GIM: EMT Rendezvous while updating global wall-clock struct.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 16.7 KB
Line 
1/* $Id: GIMKvm.cpp 55510 2015-04-29 10:13:15Z vboxsync $ */
2/** @file
3 * GIM - Guest Interface Manager, KVM implementation.
4 */
5
6/*
7 * Copyright (C) 2015 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18/*******************************************************************************
19* Header Files *
20*******************************************************************************/
21#define LOG_GROUP LOG_GROUP_GIM
22#include "GIMInternal.h"
23
24#include <iprt/asm-math.h>
25#include <iprt/assert.h>
26#include <iprt/err.h>
27#include <iprt/string.h>
28#include <iprt/mem.h>
29#include <iprt/spinlock.h>
30
31#include <VBox/vmm/cpum.h>
32#include <VBox/disopcode.h>
33#include <VBox/vmm/ssm.h>
34#include <VBox/vmm/vm.h>
35#include <VBox/vmm/hm.h>
36#include <VBox/vmm/pdmapi.h>
37#include <VBox/version.h>
38
39
40/*******************************************************************************
41* Defined Constants And Macros *
42*******************************************************************************/
43
44/**
45 * GIM KVM saved-state version.
46 */
47#define GIM_KVM_SAVED_STATE_VERSION UINT32_C(1)
48
49/**
50 * VBox internal struct. to passback to EMT rendezvous callback while enabling
51 * the KVM wall-clock.
52 */
53typedef struct KVMWALLCLOCKINFO
54{
55 /** Guest physical address of the wall-clock struct. */
56 RTGCPHYS GCPhysWallClock;
57} KVMWALLCLOCKINFO;
58/** Pointer to the wall-clock info. struct. */
59typedef KVMWALLCLOCKINFO *PKVMWALLCLOCKINFO;
60
61/*******************************************************************************
62* Global Variables *
63*******************************************************************************/
64#ifdef VBOX_WITH_STATISTICS
65# define GIMKVM_MSRRANGE(a_uFirst, a_uLast, a_szName) \
66 { (a_uFirst), (a_uLast), kCpumMsrRdFn_Gim, kCpumMsrWrFn_Gim, 0, 0, 0, 0, 0, a_szName, { 0 }, { 0 }, { 0 }, { 0 } }
67#else
68# define GIMKVM_MSRRANGE(a_uFirst, a_uLast, a_szName) \
69 { (a_uFirst), (a_uLast), kCpumMsrRdFn_Gim, kCpumMsrWrFn_Gim, 0, 0, 0, 0, 0, a_szName }
70#endif
71
72/**
73 * Array of MSR ranges supported by KVM.
74 */
75static CPUMMSRRANGE const g_aMsrRanges_Kvm[] =
76{
77 GIMKVM_MSRRANGE(MSR_GIM_KVM_RANGE0_START, MSR_GIM_KVM_RANGE0_END, "KVM range 0"),
78 GIMKVM_MSRRANGE(MSR_GIM_KVM_RANGE1_START, MSR_GIM_KVM_RANGE1_END, "KVM range 1")
79};
80#undef GIMKVM_MSRRANGE
81
82
83/**
84 * Initializes the KVM GIM provider.
85 *
86 * @returns VBox status code.
87 * @param pVM Pointer to the VM.
88 * @param uVersion The interface version this VM should use.
89 */
90VMMR3_INT_DECL(int) gimR3KvmInit(PVM pVM)
91{
92 AssertReturn(pVM, VERR_INVALID_PARAMETER);
93 AssertReturn(pVM->gim.s.enmProviderId == GIMPROVIDERID_KVM, VERR_INTERNAL_ERROR_5);
94
95 int rc;
96 PGIMKVM pKvm = &pVM->gim.s.u.Kvm;
97
98 /*
99 * Determine interface capabilities based on the version.
100 */
101 if (!pVM->gim.s.u32Version)
102 {
103 /* Basic features. */
104 pKvm->uBaseFeat = 0
105 | GIM_KVM_BASE_FEAT_CLOCK_OLD
106 //| GIM_KVM_BASE_FEAT_NOP_IO_DELAY
107 //| GIM_KVM_BASE_FEAT_MMU_OP
108 | GIM_KVM_BASE_FEAT_CLOCK
109 //| GIM_KVM_BASE_FEAT_ASYNC_PF
110 //| GIM_KVM_BASE_FEAT_STEAL_TIME
111 //| GIM_KVM_BASE_FEAT_PV_EOI
112 | GIM_KVM_BASE_FEAT_PV_UNHALT
113 ;
114 /* Rest of the features are determined in gimR3KvmInitCompleted(). */
115 }
116
117 /*
118 * Expose HVP (Hypervisor Present) bit to the guest.
119 */
120 CPUMSetGuestCpuIdFeature(pVM, CPUMCPUIDFEATURE_HVP);
121
122 /*
123 * Modify the standard hypervisor leaves for KVM.
124 */
125 CPUMCPUIDLEAF HyperLeaf;
126 RT_ZERO(HyperLeaf);
127 HyperLeaf.uLeaf = UINT32_C(0x40000000);
128 HyperLeaf.uEax = UINT32_C(0x40000001); /* Minimum value for KVM is 0x40000001. */
129 HyperLeaf.uEbx = 0x4B4D564B; /* 'KVMK' */
130 HyperLeaf.uEcx = 0x564B4D56; /* 'VMKV' */
131 HyperLeaf.uEdx = 0x0000004D; /* 'M000' */
132 rc = CPUMR3CpuIdInsert(pVM, &HyperLeaf);
133 AssertLogRelRCReturn(rc, rc);
134
135 /*
136 * Add KVM specific leaves.
137 */
138 HyperLeaf.uLeaf = UINT32_C(0x40000001);
139 HyperLeaf.uEax = pKvm->uBaseFeat;
140 HyperLeaf.uEbx = 0; /* Reserved */
141 HyperLeaf.uEcx = 0; /* Reserved */
142 HyperLeaf.uEdx = 0; /* Reserved */
143 rc = CPUMR3CpuIdInsert(pVM, &HyperLeaf);
144 AssertLogRelRCReturn(rc, rc);
145
146 /*
147 * Insert all MSR ranges of KVM.
148 */
149 for (unsigned i = 0; i < RT_ELEMENTS(g_aMsrRanges_Kvm); i++)
150 {
151 rc = CPUMR3MsrRangesInsert(pVM, &g_aMsrRanges_Kvm[i]);
152 AssertLogRelRCReturn(rc, rc);
153 }
154
155 /*
156 * Setup hypercall and #UD handling.
157 */
158 for (VMCPUID i = 0; i < pVM->cCpus; i++)
159 VMMHypercallsEnable(&pVM->aCpus[i]);
160
161 if (ASMIsAmdCpu())
162 {
163 pKvm->fTrapXcptUD = true;
164 pKvm->uOpCodeNative = OP_VMMCALL;
165 }
166 else
167 {
168 Assert(ASMIsIntelCpu() || ASMIsViaCentaurCpu());
169 pKvm->fTrapXcptUD = false;
170 pKvm->uOpCodeNative = OP_VMCALL;
171 }
172
173 /* We always need to trap VMCALL/VMMCALL hypercall using #UDs for raw-mode VMs. */
174 if (!HMIsEnabled(pVM))
175 pKvm->fTrapXcptUD = true;
176
177 return VINF_SUCCESS;
178}
179
180
181/**
182 * Initializes remaining bits of the KVM provider.
183 *
184 * This is called after initializing HM and almost all other VMM components.
185 *
186 * @returns VBox status code.
187 * @param pVM Pointer to the VM.
188 */
189VMMR3_INT_DECL(int) gimR3KvmInitCompleted(PVM pVM)
190{
191 if (TMR3CpuTickIsFixedRateMonotonic(pVM, true /* fWithParavirtEnabled */))
192 {
193 PGIMKVM pKvm = &pVM->gim.s.u.Kvm;
194 pKvm->uBaseFeat |= GIM_KVM_BASE_FEAT_TSC_STABLE;
195
196 CPUMCPUIDLEAF HyperLeaf;
197 RT_ZERO(HyperLeaf);
198 HyperLeaf.uLeaf = UINT32_C(0x40000001);
199 HyperLeaf.uEax = pKvm->uBaseFeat;
200 HyperLeaf.uEbx = 0;
201 HyperLeaf.uEcx = 0;
202 HyperLeaf.uEdx = 0;
203 int rc = CPUMR3CpuIdInsert(pVM, &HyperLeaf);
204 AssertLogRelRCReturn(rc, rc);
205 }
206
207 return VINF_SUCCESS;
208}
209
210
211/**
212 * Terminates the KVM GIM provider.
213 *
214 * @returns VBox status code.
215 * @param pVM Pointer to the VM.
216 */
217VMMR3_INT_DECL(int) gimR3KvmTerm(PVM pVM)
218{
219 gimR3KvmReset(pVM);
220 return VINF_SUCCESS;
221}
222
223
224/**
225 * Applies relocations to data and code managed by this component.
226 *
227 * This function will be called at init and whenever the VMM need to relocate
228 * itself inside the GC.
229 *
230 * @param pVM Pointer to the VM.
231 * @param offDelta Relocation delta relative to old location.
232 */
233VMMR3_INT_DECL(void) gimR3KvmRelocate(PVM pVM, RTGCINTPTR offDelta)
234{
235 NOREF(pVM); NOREF(offDelta);
236}
237
238
239/**
240 * This resets KVM provider MSRs and unmaps whatever KVM regions that
241 * the guest may have mapped.
242 *
243 * This is called when the VM is being reset.
244 *
245 * @param pVM Pointer to the VM.
246 * @thread EMT(0).
247 */
248VMMR3_INT_DECL(void) gimR3KvmReset(PVM pVM)
249{
250 VM_ASSERT_EMT0(pVM);
251 LogRel(("GIM: KVM: Resetting MSRs\n"));
252
253 /*
254 * Reset MSRs.
255 */
256 PGIMKVM pKvm = &pVM->gim.s.u.Kvm;
257 pKvm->u64WallClockMsr = 0;
258 for (VMCPUID iCpu = 0; iCpu < pVM->cCpus; iCpu++)
259 {
260 PGIMKVMCPU pKvmCpu = &pVM->aCpus[iCpu].gim.s.u.KvmCpu;
261 pKvmCpu->u64SystemTimeMsr = 0;
262 }
263}
264
265
266/**
267 * KVM state-save operation.
268 *
269 * @returns VBox status code.
270 * @param pVM Pointer to the VM.
271 * @param pSSM Pointer to the SSM handle.
272 */
273VMMR3_INT_DECL(int) gimR3KvmSave(PVM pVM, PSSMHANDLE pSSM)
274{
275 PCGIMKVM pcKvm = &pVM->gim.s.u.Kvm;
276
277 /*
278 * Save the KVM SSM version.
279 */
280 SSMR3PutU32(pSSM, GIM_KVM_SAVED_STATE_VERSION);
281
282 /*
283 * Save per-VCPU data.
284 */
285 for (uint32_t i = 0; i < pVM->cCpus; i++)
286 {
287 PCGIMKVMCPU pcKvmCpu = &pVM->aCpus[i].gim.s.u.KvmCpu;
288
289 /* Guest may alter flags (namely GIM_KVM_SYSTEM_TIME_FLAGS_GUEST_PAUSED bit). So re-read them from guest-memory. */
290 GIMKVMSYSTEMTIME SystemTime;
291 RT_ZERO(SystemTime);
292 if (MSR_GIM_KVM_SYSTEM_TIME_IS_ENABLED(pcKvmCpu->u64SystemTimeMsr))
293 {
294 int rc = PGMPhysSimpleReadGCPhys(pVM, &SystemTime, pcKvmCpu->GCPhysSystemTime, sizeof(GIMKVMSYSTEMTIME));
295 AssertRCReturn(rc, rc);
296 }
297
298 SSMR3PutU64(pSSM, pcKvmCpu->u64SystemTimeMsr);
299 SSMR3PutU64(pSSM, pcKvmCpu->uTsc);
300 SSMR3PutU64(pSSM, pcKvmCpu->uVirtNanoTS);
301 SSMR3PutGCPhys(pSSM, pcKvmCpu->GCPhysSystemTime);
302 SSMR3PutU32(pSSM, pcKvmCpu->u32SystemTimeVersion);
303 SSMR3PutU8(pSSM, SystemTime.fFlags);
304 }
305
306 /*
307 * Save per-VM data.
308 */
309 SSMR3PutU64(pSSM, pcKvm->u64WallClockMsr);
310 return SSMR3PutU32(pSSM, pcKvm->uBaseFeat);
311}
312
313
314/**
315 * KVM state-load operation, final pass.
316 *
317 * @returns VBox status code.
318 * @param pVM Pointer to the VM.
319 * @param pSSM Pointer to the SSM handle.
320 * @param uSSMVersion The GIM saved-state version.
321 */
322VMMR3_INT_DECL(int) gimR3KvmLoad(PVM pVM, PSSMHANDLE pSSM, uint32_t uSSMVersion)
323{
324 /*
325 * Load the KVM SSM version first.
326 */
327 uint32_t uKvmSavedStatVersion;
328 int rc = SSMR3GetU32(pSSM, &uKvmSavedStatVersion);
329 AssertRCReturn(rc, rc);
330 if (uKvmSavedStatVersion != GIM_KVM_SAVED_STATE_VERSION)
331 return SSMR3SetLoadError(pSSM, VERR_SSM_UNSUPPORTED_DATA_UNIT_VERSION, RT_SRC_POS,
332 N_("Unsupported KVM saved-state version %u (expected %u)."), uKvmSavedStatVersion,
333 GIM_KVM_SAVED_STATE_VERSION);
334
335 /*
336 * Load per-VCPU data.
337 */
338 for (uint32_t i = 0; i < pVM->cCpus; i++)
339 {
340 PVMCPU pVCpu = &pVM->aCpus[i];
341 PGIMKVMCPU pKvmCpu = &pVCpu->gim.s.u.KvmCpu;
342
343 uint8_t fSystemTimeFlags = 0;
344 SSMR3GetU64(pSSM, &pKvmCpu->u64SystemTimeMsr);
345 SSMR3GetU64(pSSM, &pKvmCpu->uTsc);
346 SSMR3GetU64(pSSM, &pKvmCpu->uVirtNanoTS);
347 SSMR3GetGCPhys(pSSM, &pKvmCpu->GCPhysSystemTime);
348 SSMR3GetU32(pSSM, &pKvmCpu->u32SystemTimeVersion);
349 SSMR3GetU8(pSSM, &fSystemTimeFlags);
350
351 /* Enable the system-time struct. if necessary. */
352 if (MSR_GIM_KVM_SYSTEM_TIME_IS_ENABLED(pKvmCpu->u64SystemTimeMsr))
353 {
354 Assert(!TMVirtualIsTicking(pVM)); /* paranoia. */
355 Assert(!TMCpuTickIsTicking(pVCpu));
356 rc = gimR3KvmEnableSystemTime(pVM, pVCpu, pKvmCpu, fSystemTimeFlags);
357 AssertRCReturn(rc, rc);
358 }
359 }
360
361 /*
362 * Load per-VM data.
363 */
364 PGIMKVM pKvm = &pVM->gim.s.u.Kvm;
365 SSMR3GetU64(pSSM, &pKvm->u64WallClockMsr);
366 rc = SSMR3GetU32(pSSM, &pKvm->uBaseFeat);
367 AssertRCReturn(rc, rc);
368
369 return VINF_SUCCESS;
370}
371
372
373/**
374 * Enables the KVM VCPU system-time structure.
375 *
376 * @returns VBox status code.
377 * @param pVM Pointer to the VM.
378 * @param pVCpu Pointer to the VMCPU.
379 * @param pKvmCpu Pointer to the GIMKVMCPU with all fields
380 * populated by the caller.
381 * @param fFlags The system-time struct. flags.
382 *
383 * @remarks Don't do any release assertions here, these can be triggered by
384 * guest R0 code.
385 */
386VMMR3_INT_DECL(int) gimR3KvmEnableSystemTime(PVM pVM, PVMCPU pVCpu, PGIMKVMCPU pKvmCpu, uint8_t fFlags)
387{
388 GIMKVMSYSTEMTIME SystemTime;
389 RT_ZERO(SystemTime);
390 SystemTime.u32Version = pKvmCpu->u32SystemTimeVersion;
391 SystemTime.u64NanoTS = pKvmCpu->uVirtNanoTS;
392 SystemTime.u64Tsc = pKvmCpu->uTsc;
393 SystemTime.fFlags = fFlags | GIM_KVM_SYSTEM_TIME_FLAGS_TSC_STABLE;
394
395 /*
396 * How the guest calculates the system time (nanoseconds):
397 *
398 * tsc = rdtsc - SysTime.u64Tsc
399 * if (SysTime.i8TscShift >= 0)
400 * tsc <<= i8TscShift;
401 * else
402 * tsc >>= -i8TscShift;
403 * time = ((tsc * SysTime.u32TscScale) >> 32) + SysTime.u64NanoTS
404 */
405 uint64_t u64TscFreq = TMCpuTicksPerSecond(pVM);
406 SystemTime.i8TscShift = 0;
407 while (u64TscFreq > 2 * RT_NS_1SEC_64)
408 {
409 u64TscFreq >>= 1;
410 SystemTime.i8TscShift--;
411 }
412 uint32_t uTscFreqLo = (uint32_t)u64TscFreq;
413 while (uTscFreqLo <= RT_NS_1SEC)
414 {
415 uTscFreqLo <<= 1;
416 SystemTime.i8TscShift++;
417 }
418 SystemTime.u32TscScale = ASMDivU64ByU32RetU32(RT_NS_1SEC_64 << 32, uTscFreqLo);
419
420 Assert(!(SystemTime.u32Version & UINT32_C(1)));
421 Assert(PGMPhysIsGCPhysNormal(pVM, pKvmCpu->GCPhysSystemTime));
422 int rc = PGMPhysSimpleWriteGCPhys(pVM, pKvmCpu->GCPhysSystemTime, &SystemTime, sizeof(GIMKVMSYSTEMTIME));
423 if (RT_SUCCESS(rc))
424 {
425 LogRel(("GIM: KVM: VCPU%3d: Enabled system-time struct. at %#RGp - u32TscScale=%#RX32 i8TscShift=%d uVersion=%#RU32 "
426 "fFlags=%#x uTsc=%#RX64 uVirtNanoTS=%#RX64\n", pVCpu->idCpu, pKvmCpu->GCPhysSystemTime, SystemTime.u32TscScale,
427 SystemTime.i8TscShift, SystemTime.u32Version, SystemTime.fFlags, pKvmCpu->uTsc, pKvmCpu->uVirtNanoTS));
428 TMR3CpuTickParavirtEnable(pVM);
429 }
430 else
431 LogRel(("GIM: KVM: VCPU%3d: Failed to write system-time struct. at %#RGp. rc=%Rrc\n", pKvmCpu->GCPhysSystemTime, rc));
432
433 return rc;
434}
435
436
437/**
438 * Disables the KVM system-time struct.
439 *
440 * @returns VBox status code.
441 * @param pVM Pointer to the VM.
442 */
443VMMR3_INT_DECL(int) gimR3KvmDisableSystemTime(PVM pVM)
444{
445 TMR3CpuTickParavirtDisable(pVM);
446 return VINF_SUCCESS;
447}
448
449
450/**
451 * @callback_method_impl{PFNVMMEMTRENDEZVOUS,
452 * Worker for gimR3KvmEnableWallClock}
453 */
454static DECLCALLBACK(VBOXSTRICTRC) gimR3KvmEnableWallClockCallback(PVM pVM, PVMCPU pVCpu, void *pvData)
455{
456 Assert(pvData);
457 PKVMWALLCLOCKINFO pWallClockInfo = (PKVMWALLCLOCKINFO)pvData;
458 RTGCPHYS GCPhysWallClock = pWallClockInfo->GCPhysWallClock;
459
460 /*
461 * Read the wall-clock version (sequence) from the guest.
462 */
463 uint32_t uVersion;
464 Assert(PGMPhysIsGCPhysNormal(pVM, GCPhysWallClock));
465 int rc = PGMPhysSimpleReadGCPhys(pVM, &uVersion, GCPhysWallClock, sizeof(uVersion));
466 if (RT_FAILURE(rc))
467 {
468 LogRel(("GIM: KVM: Failed to read wall-clock struct. version at %#RGp. rc=%Rrc\n", GCPhysWallClock, rc));
469 return rc;
470 }
471
472 /*
473 * Ensure the version is incrementally even.
474 */
475 if (!(uVersion & 1))
476 ++uVersion;
477 ++uVersion;
478
479 /*
480 * Update wall-clock guest struct. with UTC information.
481 */
482 RTTIMESPEC TimeSpec;
483 int32_t iSec;
484 int32_t iNano;
485 TMR3UtcNow(pVM, &TimeSpec);
486 RTTimeSpecGetSecondsAndNano(&TimeSpec, &iSec, &iNano);
487
488 GIMKVMWALLCLOCK WallClock;
489 RT_ZERO(WallClock);
490 AssertCompile(sizeof(uVersion) == sizeof(WallClock.u32Version));
491 WallClock.u32Version = uVersion;
492 WallClock.u32Sec = iSec;
493 WallClock.u32Nano = iNano;
494
495 /*
496 * Write out the wall-clock struct. to guest memory.
497 */
498 Assert(!(WallClock.u32Version & 1));
499 rc = PGMPhysSimpleWriteGCPhys(pVM, GCPhysWallClock, &WallClock, sizeof(GIMKVMWALLCLOCK));
500 if (RT_SUCCESS(rc))
501 {
502 LogRel(("GIM: KVM: Enabled wall-clock struct. at %#RGp - u32Sec=%u u32Nano=%u uVersion=%#RU32\n", GCPhysWallClock,
503 WallClock.u32Sec, WallClock.u32Nano, WallClock.u32Version));
504 }
505 else
506 LogRel(("GIM: KVM: Failed to write wall-clock struct. at %#RGp. rc=%Rrc\n", GCPhysWallClock, rc));
507 return rc;
508}
509
510
511/**
512 * Enables the KVM wall-clock structure.
513 *
514 * Since the wall-clock can be read by any VCPU but it is a global struct. in
515 * guest-memory, we do an EMT rendezvous here to be on the safe side. The
516 * alternative is to use an MMIO2 region and use the WallClock.u32Version field
517 * for transactional update. However, this MSR is rarely written to (typically
518 * once during bootup) it's currently not a performance issue.
519 *
520 * @returns VBox status code.
521 * @param pVM Pointer to the VM.
522 * @param GCPhysWallClock Where the guest wall-clock structure is located.
523 * @param uVersion The version (sequence number) value to use.
524 *
525 * @remarks Don't do any release assertions here, these can be triggered by
526 * guest R0 code.
527 */
528VMMR3_INT_DECL(int) gimR3KvmEnableWallClock(PVM pVM, RTGCPHYS GCPhysWallClock)
529{
530 KVMWALLCLOCKINFO WallClockInfo;
531 WallClockInfo.GCPhysWallClock = GCPhysWallClock;
532 return VMMR3EmtRendezvous(pVM, VMMEMTRENDEZVOUS_FLAGS_TYPE_ONCE, gimR3KvmEnableWallClockCallback, &WallClockInfo);
533}
534
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette