VirtualBox

source: vbox/trunk/src/VBox/HostDrivers/Support/SUPDrv.c@ 40740

Last change on this file since 40740 was 40740, checked in by vboxsync, 13 years ago

SUPDrv: Update GIP data behind a spinlock for online/offline race conditions.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 217.1 KB
Line 
1/* $Revision: 40740 $ */
2/** @file
3 * VBoxDrv - The VirtualBox Support Driver - Common code.
4 */
5
6/*
7 * Copyright (C) 2006-2011 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27/*******************************************************************************
28* Header Files *
29*******************************************************************************/
30#define LOG_GROUP LOG_GROUP_SUP_DRV
31#define SUPDRV_AGNOSTIC
32#include "SUPDrvInternal.h"
33#ifndef PAGE_SHIFT
34# include <iprt/param.h>
35#endif
36#include <iprt/asm.h>
37#include <iprt/asm-amd64-x86.h>
38#include <iprt/asm-math.h>
39#include <iprt/cpuset.h>
40#include <iprt/handletable.h>
41#include <iprt/mem.h>
42#include <iprt/mp.h>
43#include <iprt/power.h>
44#include <iprt/process.h>
45#include <iprt/semaphore.h>
46#include <iprt/spinlock.h>
47#include <iprt/thread.h>
48#include <iprt/uuid.h>
49#include <iprt/net.h>
50#include <iprt/crc.h>
51#include <iprt/string.h>
52#include <iprt/timer.h>
53#if defined(RT_OS_DARWIN) || defined(RT_OS_SOLARIS) || defined(RT_OS_FREEBSD)
54# include <iprt/rand.h>
55# include <iprt/path.h>
56#endif
57#include <iprt/x86.h>
58
59#include <VBox/param.h>
60#include <VBox/log.h>
61#include <VBox/err.h>
62#include <VBox/vmm/hwacc_svm.h>
63#include <VBox/vmm/hwacc_vmx.h>
64
65#if defined(RT_OS_SOLARIS) || defined(RT_OS_DARWIN)
66# include "dtrace/SUPDrv.h"
67#else
68# define VBOXDRV_SESSION_CREATE(pvSession, fUser) do { } while (0)
69# define VBOXDRV_SESSION_CLOSE(pvSession) do { } while (0)
70# define VBOXDRV_IOCTL_ENTRY(pvSession, uIOCtl, pvReqHdr) do { } while (0)
71# define VBOXDRV_IOCTL_RETURN(pvSession, uIOCtl, pvReqHdr, rcRet, rcReq) do { } while (0)
72#endif
73
74/*
75 * Logging assignments:
76 * Log - useful stuff, like failures.
77 * LogFlow - program flow, except the really noisy bits.
78 * Log2 - Cleanup.
79 * Log3 - Loader flow noise.
80 * Log4 - Call VMMR0 flow noise.
81 * Log5 - Native yet-to-be-defined noise.
82 * Log6 - Native ioctl flow noise.
83 *
84 * Logging requires BUILD_TYPE=debug and possibly changes to the logger
85 * instantiation in log-vbox.c(pp).
86 */
87
88
89/*******************************************************************************
90* Defined Constants And Macros *
91*******************************************************************************/
92/** The frequency by which we recalculate the u32UpdateHz and
93 * u32UpdateIntervalNS GIP members. The value must be a power of 2. */
94#define GIP_UPDATEHZ_RECALC_FREQ 0x800
95
96/** @def VBOX_SVN_REV
97 * The makefile should define this if it can. */
98#ifndef VBOX_SVN_REV
99# define VBOX_SVN_REV 0
100#endif
101
102#if 0 /* Don't start the GIP timers. Useful when debugging the IPRT timer code. */
103# define DO_NOT_START_GIP
104#endif
105
106
107/*******************************************************************************
108* Internal Functions *
109*******************************************************************************/
110static DECLCALLBACK(int) supdrvSessionObjHandleRetain(RTHANDLETABLE hHandleTable, void *pvObj, void *pvCtx, void *pvUser);
111static DECLCALLBACK(void) supdrvSessionObjHandleDelete(RTHANDLETABLE hHandleTable, uint32_t h, void *pvObj, void *pvCtx, void *pvUser);
112static int supdrvMemAdd(PSUPDRVMEMREF pMem, PSUPDRVSESSION pSession);
113static int supdrvMemRelease(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr, SUPDRVMEMREFTYPE eType);
114static int supdrvIOCtl_LdrOpen(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDROPEN pReq);
115static int supdrvIOCtl_LdrLoad(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRLOAD pReq);
116static int supdrvIOCtl_LdrFree(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRFREE pReq);
117static int supdrvIOCtl_LdrGetSymbol(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRGETSYMBOL pReq);
118static int supdrvIDC_LdrGetSymbol(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPDRVIDCREQGETSYM pReq);
119static int supdrvLdrSetVMMR0EPs(PSUPDRVDEVEXT pDevExt, void *pvVMMR0, void *pvVMMR0EntryInt, void *pvVMMR0EntryFast, void *pvVMMR0EntryEx);
120static void supdrvLdrUnsetVMMR0EPs(PSUPDRVDEVEXT pDevExt);
121static int supdrvLdrAddUsage(PSUPDRVSESSION pSession, PSUPDRVLDRIMAGE pImage);
122static void supdrvLdrFree(PSUPDRVDEVEXT pDevExt, PSUPDRVLDRIMAGE pImage);
123DECLINLINE(int) supdrvLdrLock(PSUPDRVDEVEXT pDevExt);
124DECLINLINE(int) supdrvLdrUnlock(PSUPDRVDEVEXT pDevExt);
125static int supdrvIOCtl_CallServiceModule(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPCALLSERVICE pReq);
126static int supdrvIOCtl_LoggerSettings(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLOGGERSETTINGS pReq);
127static int supdrvGipCreate(PSUPDRVDEVEXT pDevExt);
128static void supdrvGipDestroy(PSUPDRVDEVEXT pDevExt);
129static DECLCALLBACK(void) supdrvGipSyncTimer(PRTTIMER pTimer, void *pvUser, uint64_t iTick);
130static DECLCALLBACK(void) supdrvGipAsyncTimer(PRTTIMER pTimer, void *pvUser, uint64_t iTick);
131static DECLCALLBACK(void) supdrvGipMpEvent(RTMPEVENT enmEvent, RTCPUID idCpu, void *pvUser);
132static void supdrvGipInit(PSUPDRVDEVEXT pDevExt, PSUPGLOBALINFOPAGE pGip, RTHCPHYS HCPhys,
133 uint64_t u64NanoTS, unsigned uUpdateHz, unsigned cCpus);
134static DECLCALLBACK(void) supdrvGipInitOnCpu(RTCPUID idCpu, void *pvUser1, void *pvUser2);
135static void supdrvGipTerm(PSUPGLOBALINFOPAGE pGip);
136static void supdrvGipUpdate(PSUPGLOBALINFOPAGE pGip, uint64_t u64NanoTS, uint64_t u64TSC, RTCPUID idCpu, uint64_t iTick);
137static void supdrvGipUpdatePerCpu(PSUPGLOBALINFOPAGE pGip, uint64_t u64NanoTS, uint64_t u64TSC,
138 RTCPUID idCpu, uint8_t idApic, uint64_t iTick);
139static void supdrvGipInitCpu(PSUPGLOBALINFOPAGE pGip, PSUPGIPCPU pCpu, uint64_t u64NanoTS);
140
141
142/*******************************************************************************
143* Global Variables *
144*******************************************************************************/
145DECLEXPORT(PSUPGLOBALINFOPAGE) g_pSUPGlobalInfoPage = NULL;
146
147/**
148 * Array of the R0 SUP API.
149 */
150static SUPFUNC g_aFunctions[] =
151{
152 /* name function */
153 /* Entries with absolute addresses determined at runtime, fixup
154 code makes ugly ASSUMPTIONS about the order here: */
155 { "SUPR0AbsIs64bit", (void *)0 },
156 { "SUPR0Abs64bitKernelCS", (void *)0 },
157 { "SUPR0Abs64bitKernelSS", (void *)0 },
158 { "SUPR0Abs64bitKernelDS", (void *)0 },
159 { "SUPR0AbsKernelCS", (void *)0 },
160 { "SUPR0AbsKernelSS", (void *)0 },
161 { "SUPR0AbsKernelDS", (void *)0 },
162 { "SUPR0AbsKernelES", (void *)0 },
163 { "SUPR0AbsKernelFS", (void *)0 },
164 { "SUPR0AbsKernelGS", (void *)0 },
165 { "SUPR0VtgFireProbe", (void *)SUPR0VtgFireProbe },
166 /* Normal function pointers: */
167 { "SUPR0ComponentRegisterFactory", (void *)SUPR0ComponentRegisterFactory },
168 { "SUPR0ComponentDeregisterFactory", (void *)SUPR0ComponentDeregisterFactory },
169 { "SUPR0ComponentQueryFactory", (void *)SUPR0ComponentQueryFactory },
170 { "SUPR0ObjRegister", (void *)SUPR0ObjRegister },
171 { "SUPR0ObjAddRef", (void *)SUPR0ObjAddRef },
172 { "SUPR0ObjAddRefEx", (void *)SUPR0ObjAddRefEx },
173 { "SUPR0ObjRelease", (void *)SUPR0ObjRelease },
174 { "SUPR0ObjVerifyAccess", (void *)SUPR0ObjVerifyAccess },
175 { "SUPR0LockMem", (void *)SUPR0LockMem },
176 { "SUPR0UnlockMem", (void *)SUPR0UnlockMem },
177 { "SUPR0ContAlloc", (void *)SUPR0ContAlloc },
178 { "SUPR0ContFree", (void *)SUPR0ContFree },
179 { "SUPR0LowAlloc", (void *)SUPR0LowAlloc },
180 { "SUPR0LowFree", (void *)SUPR0LowFree },
181 { "SUPR0MemAlloc", (void *)SUPR0MemAlloc },
182 { "SUPR0MemGetPhys", (void *)SUPR0MemGetPhys },
183 { "SUPR0MemFree", (void *)SUPR0MemFree },
184 { "SUPR0PageAllocEx", (void *)SUPR0PageAllocEx },
185 { "SUPR0PageFree", (void *)SUPR0PageFree },
186 { "SUPR0Printf", (void *)SUPR0Printf }, /** @todo needs wrapping? */
187 { "SUPSemEventCreate", (void *)SUPSemEventCreate },
188 { "SUPSemEventClose", (void *)SUPSemEventClose },
189 { "SUPSemEventSignal", (void *)SUPSemEventSignal },
190 { "SUPSemEventWait", (void *)SUPSemEventWait },
191 { "SUPSemEventWaitNoResume", (void *)SUPSemEventWaitNoResume },
192 { "SUPSemEventWaitNsAbsIntr", (void *)SUPSemEventWaitNsAbsIntr },
193 { "SUPSemEventWaitNsRelIntr", (void *)SUPSemEventWaitNsRelIntr },
194 { "SUPSemEventGetResolution", (void *)SUPSemEventGetResolution },
195 { "SUPSemEventMultiCreate", (void *)SUPSemEventMultiCreate },
196 { "SUPSemEventMultiClose", (void *)SUPSemEventMultiClose },
197 { "SUPSemEventMultiSignal", (void *)SUPSemEventMultiSignal },
198 { "SUPSemEventMultiReset", (void *)SUPSemEventMultiReset },
199 { "SUPSemEventMultiWait", (void *)SUPSemEventMultiWait },
200 { "SUPSemEventMultiWaitNoResume", (void *)SUPSemEventMultiWaitNoResume },
201 { "SUPSemEventMultiWaitNsAbsIntr", (void *)SUPSemEventMultiWaitNsAbsIntr },
202 { "SUPSemEventMultiWaitNsRelIntr", (void *)SUPSemEventMultiWaitNsRelIntr },
203 { "SUPSemEventMultiGetResolution", (void *)SUPSemEventMultiGetResolution },
204 { "SUPR0GetPagingMode", (void *)SUPR0GetPagingMode },
205 { "SUPR0EnableVTx", (void *)SUPR0EnableVTx },
206 { "SUPR0VtgRegisterModule", (void *)SUPR0VtgRegisterModule },
207 { "SUPGetGIP", (void *)SUPGetGIP },
208 { "g_pSUPGlobalInfoPage", (void *)&g_pSUPGlobalInfoPage },
209 { "RTMemAllocTag", (void *)RTMemAllocTag },
210 { "RTMemAllocZTag", (void *)RTMemAllocZTag },
211 { "RTMemAllocVarTag", (void *)RTMemAllocVarTag },
212 { "RTMemAllocZVarTag", (void *)RTMemAllocZVarTag },
213 { "RTMemFree", (void *)RTMemFree },
214 { "RTMemDupTag", (void *)RTMemDupTag },
215 { "RTMemDupExTag", (void *)RTMemDupExTag },
216 { "RTMemReallocTag", (void *)RTMemReallocTag },
217 { "RTR0MemObjAllocLowTag", (void *)RTR0MemObjAllocLowTag },
218 { "RTR0MemObjAllocPageTag", (void *)RTR0MemObjAllocPageTag },
219 { "RTR0MemObjAllocPhysTag", (void *)RTR0MemObjAllocPhysTag },
220 { "RTR0MemObjAllocPhysExTag", (void *)RTR0MemObjAllocPhysExTag },
221 { "RTR0MemObjAllocPhysNCTag", (void *)RTR0MemObjAllocPhysNCTag },
222 { "RTR0MemObjAllocContTag", (void *)RTR0MemObjAllocContTag },
223 { "RTR0MemObjEnterPhysTag", (void *)RTR0MemObjEnterPhysTag },
224 { "RTR0MemObjLockUserTag", (void *)RTR0MemObjLockUserTag },
225 { "RTR0MemObjMapKernelTag", (void *)RTR0MemObjMapKernelTag },
226 { "RTR0MemObjMapKernelExTag", (void *)RTR0MemObjMapKernelExTag },
227 { "RTR0MemObjMapUserTag", (void *)RTR0MemObjMapUserTag },
228 { "RTR0MemObjProtect", (void *)RTR0MemObjProtect },
229 { "RTR0MemObjAddress", (void *)RTR0MemObjAddress },
230 { "RTR0MemObjAddressR3", (void *)RTR0MemObjAddressR3 },
231 { "RTR0MemObjSize", (void *)RTR0MemObjSize },
232 { "RTR0MemObjIsMapping", (void *)RTR0MemObjIsMapping },
233 { "RTR0MemObjGetPagePhysAddr", (void *)RTR0MemObjGetPagePhysAddr },
234 { "RTR0MemObjFree", (void *)RTR0MemObjFree },
235 { "RTR0MemUserCopyFrom", (void *)RTR0MemUserCopyFrom },
236 { "RTR0MemUserCopyTo", (void *)RTR0MemUserCopyTo },
237 { "RTR0MemUserIsValidAddr", (void *)RTR0MemUserIsValidAddr },
238 { "RTR0MemKernelIsValidAddr", (void *)RTR0MemKernelIsValidAddr },
239 { "RTR0MemAreKrnlAndUsrDifferent", (void *)RTR0MemAreKrnlAndUsrDifferent },
240 { "RTSemMutexCreate", (void *)RTSemMutexCreate },
241 { "RTSemMutexRequest", (void *)RTSemMutexRequest },
242 { "RTSemMutexRequestDebug", (void *)RTSemMutexRequestDebug },
243 { "RTSemMutexRequestNoResume", (void *)RTSemMutexRequestNoResume },
244 { "RTSemMutexRequestNoResumeDebug", (void *)RTSemMutexRequestNoResumeDebug },
245 { "RTSemMutexRelease", (void *)RTSemMutexRelease },
246 { "RTSemMutexDestroy", (void *)RTSemMutexDestroy },
247 { "RTProcSelf", (void *)RTProcSelf },
248 { "RTR0ProcHandleSelf", (void *)RTR0ProcHandleSelf },
249 { "RTSemFastMutexCreate", (void *)RTSemFastMutexCreate },
250 { "RTSemFastMutexDestroy", (void *)RTSemFastMutexDestroy },
251 { "RTSemFastMutexRequest", (void *)RTSemFastMutexRequest },
252 { "RTSemFastMutexRelease", (void *)RTSemFastMutexRelease },
253 { "RTSemEventCreate", (void *)RTSemEventCreate },
254 { "RTSemEventSignal", (void *)RTSemEventSignal },
255 { "RTSemEventWait", (void *)RTSemEventWait },
256 { "RTSemEventWaitNoResume", (void *)RTSemEventWaitNoResume },
257 { "RTSemEventWaitEx", (void *)RTSemEventWaitEx },
258 { "RTSemEventWaitExDebug", (void *)RTSemEventWaitExDebug },
259 { "RTSemEventGetResolution", (void *)RTSemEventGetResolution },
260 { "RTSemEventDestroy", (void *)RTSemEventDestroy },
261 { "RTSemEventMultiCreate", (void *)RTSemEventMultiCreate },
262 { "RTSemEventMultiSignal", (void *)RTSemEventMultiSignal },
263 { "RTSemEventMultiReset", (void *)RTSemEventMultiReset },
264 { "RTSemEventMultiWait", (void *)RTSemEventMultiWait },
265 { "RTSemEventMultiWaitNoResume", (void *)RTSemEventMultiWaitNoResume },
266 { "RTSemEventMultiWaitEx", (void *)RTSemEventMultiWaitEx },
267 { "RTSemEventMultiWaitExDebug", (void *)RTSemEventMultiWaitExDebug },
268 { "RTSemEventMultiGetResolution", (void *)RTSemEventMultiGetResolution },
269 { "RTSemEventMultiDestroy", (void *)RTSemEventMultiDestroy },
270 { "RTSpinlockCreate", (void *)RTSpinlockCreate },
271 { "RTSpinlockDestroy", (void *)RTSpinlockDestroy },
272 { "RTSpinlockAcquire", (void *)RTSpinlockAcquire },
273 { "RTSpinlockRelease", (void *)RTSpinlockRelease },
274 { "RTSpinlockAcquireNoInts", (void *)RTSpinlockAcquireNoInts },
275 { "RTSpinlockReleaseNoInts", (void *)RTSpinlockReleaseNoInts },
276 { "RTTimeNanoTS", (void *)RTTimeNanoTS },
277 { "RTTimeMilliTS", (void *)RTTimeMilliTS },
278 { "RTTimeSystemNanoTS", (void *)RTTimeSystemNanoTS },
279 { "RTTimeSystemMilliTS", (void *)RTTimeSystemMilliTS },
280 { "RTThreadNativeSelf", (void *)RTThreadNativeSelf },
281 { "RTThreadSleep", (void *)RTThreadSleep },
282 { "RTThreadYield", (void *)RTThreadYield },
283 { "RTThreadSelf", (void *)RTThreadSelf },
284 { "RTThreadCreate", (void *)RTThreadCreate },
285 { "RTThreadGetNative", (void *)RTThreadGetNative },
286 { "RTThreadWait", (void *)RTThreadWait },
287 { "RTThreadWaitNoResume", (void *)RTThreadWaitNoResume },
288 { "RTThreadGetName", (void *)RTThreadGetName },
289 { "RTThreadSelfName", (void *)RTThreadSelfName },
290 { "RTThreadGetType", (void *)RTThreadGetType },
291 { "RTThreadUserSignal", (void *)RTThreadUserSignal },
292 { "RTThreadUserReset", (void *)RTThreadUserReset },
293 { "RTThreadUserWait", (void *)RTThreadUserWait },
294 { "RTThreadUserWaitNoResume", (void *)RTThreadUserWaitNoResume },
295 { "RTThreadPreemptIsEnabled", (void *)RTThreadPreemptIsEnabled },
296 { "RTThreadPreemptIsPending", (void *)RTThreadPreemptIsPending },
297 { "RTThreadPreemptIsPendingTrusty", (void *)RTThreadPreemptIsPendingTrusty },
298 { "RTThreadPreemptIsPossible", (void *)RTThreadPreemptIsPossible },
299 { "RTThreadPreemptDisable", (void *)RTThreadPreemptDisable },
300 { "RTThreadPreemptRestore", (void *)RTThreadPreemptRestore },
301 { "RTThreadIsInInterrupt", (void *)RTThreadIsInInterrupt },
302 { "RTTimerCreate", (void *)RTTimerCreate },
303 { "RTTimerCreateEx", (void *)RTTimerCreateEx },
304 { "RTTimerDestroy", (void *)RTTimerDestroy },
305 { "RTTimerStart", (void *)RTTimerStart },
306 { "RTTimerStop", (void *)RTTimerStop },
307 { "RTTimerChangeInterval", (void *)RTTimerChangeInterval },
308 { "RTTimerGetSystemGranularity", (void *)RTTimerGetSystemGranularity },
309 { "RTTimerRequestSystemGranularity", (void *)RTTimerRequestSystemGranularity },
310 { "RTTimerReleaseSystemGranularity", (void *)RTTimerReleaseSystemGranularity },
311 { "RTTimerCanDoHighResolution", (void *)RTTimerCanDoHighResolution },
312
313 { "RTLogDefaultInstance", (void *)RTLogDefaultInstance },
314 { "RTMpCpuId", (void *)RTMpCpuId },
315 { "RTMpCpuIdFromSetIndex", (void *)RTMpCpuIdFromSetIndex },
316 { "RTMpCpuIdToSetIndex", (void *)RTMpCpuIdToSetIndex },
317 { "RTMpGetArraySize", (void *)RTMpGetArraySize },
318 { "RTMpIsCpuPossible", (void *)RTMpIsCpuPossible },
319 { "RTMpGetCount", (void *)RTMpGetCount },
320 { "RTMpGetMaxCpuId", (void *)RTMpGetMaxCpuId },
321 { "RTMpGetOnlineCount", (void *)RTMpGetOnlineCount },
322 { "RTMpGetOnlineSet", (void *)RTMpGetOnlineSet },
323 { "RTMpGetSet", (void *)RTMpGetSet },
324 { "RTMpIsCpuOnline", (void *)RTMpIsCpuOnline },
325 { "RTMpIsCpuWorkPending", (void *)RTMpIsCpuWorkPending },
326 { "RTMpNotificationRegister", (void *)RTMpNotificationRegister },
327 { "RTMpNotificationDeregister", (void *)RTMpNotificationDeregister },
328 { "RTMpOnAll", (void *)RTMpOnAll },
329 { "RTMpOnOthers", (void *)RTMpOnOthers },
330 { "RTMpOnSpecific", (void *)RTMpOnSpecific },
331 { "RTMpPokeCpu", (void *)RTMpPokeCpu },
332 { "RTPowerNotificationRegister", (void *)RTPowerNotificationRegister },
333 { "RTPowerNotificationDeregister", (void *)RTPowerNotificationDeregister },
334 { "RTLogRelDefaultInstance", (void *)RTLogRelDefaultInstance },
335 { "RTLogSetDefaultInstanceThread", (void *)RTLogSetDefaultInstanceThread },
336 { "RTLogLoggerExV", (void *)RTLogLoggerExV },
337 { "RTLogPrintfV", (void *)RTLogPrintfV },
338 { "RTR0AssertPanicSystem", (void *)RTR0AssertPanicSystem },
339 { "RTAssertMsg1", (void *)RTAssertMsg1 },
340 { "RTAssertMsg2V", (void *)RTAssertMsg2V },
341 { "RTAssertMsg2AddV", (void *)RTAssertMsg2AddV },
342 { "RTAssertSetQuiet", (void *)RTAssertSetQuiet },
343 { "RTAssertMayPanic", (void *)RTAssertMayPanic },
344 { "RTAssertSetMayPanic", (void *)RTAssertSetMayPanic },
345 { "RTAssertAreQuiet", (void *)RTAssertAreQuiet },
346 { "RTStrFormat", (void *)RTStrFormat },
347 { "RTStrFormatNumber", (void *)RTStrFormatNumber },
348 { "RTStrFormatTypeDeregister", (void *)RTStrFormatTypeDeregister },
349 { "RTStrFormatTypeRegister", (void *)RTStrFormatTypeRegister },
350 { "RTStrFormatTypeSetUser", (void *)RTStrFormatTypeSetUser },
351 { "RTStrFormatV", (void *)RTStrFormatV },
352 { "RTStrPrintf", (void *)RTStrPrintf },
353 { "RTStrPrintfEx", (void *)RTStrPrintfEx },
354 { "RTStrPrintfExV", (void *)RTStrPrintfExV },
355 { "RTStrPrintfV", (void *)RTStrPrintfV },
356 { "RTHandleTableAllocWithCtx", (void *)RTHandleTableAllocWithCtx },
357 { "RTHandleTableCreate", (void *)RTHandleTableCreate },
358 { "RTHandleTableCreateEx", (void *)RTHandleTableCreateEx },
359 { "RTHandleTableDestroy", (void *)RTHandleTableDestroy },
360 { "RTHandleTableFreeWithCtx", (void *)RTHandleTableFreeWithCtx },
361 { "RTHandleTableLookupWithCtx", (void *)RTHandleTableLookupWithCtx },
362 { "RTNetIPv4AddDataChecksum", (void *)RTNetIPv4AddDataChecksum },
363 { "RTNetIPv4AddTCPChecksum", (void *)RTNetIPv4AddTCPChecksum },
364 { "RTNetIPv4AddUDPChecksum", (void *)RTNetIPv4AddUDPChecksum },
365 { "RTNetIPv4FinalizeChecksum", (void *)RTNetIPv4FinalizeChecksum },
366 { "RTNetIPv4HdrChecksum", (void *)RTNetIPv4HdrChecksum },
367 { "RTNetIPv4IsDHCPValid", (void *)RTNetIPv4IsDHCPValid },
368 { "RTNetIPv4IsHdrValid", (void *)RTNetIPv4IsHdrValid },
369 { "RTNetIPv4IsTCPSizeValid", (void *)RTNetIPv4IsTCPSizeValid },
370 { "RTNetIPv4IsTCPValid", (void *)RTNetIPv4IsTCPValid },
371 { "RTNetIPv4IsUDPSizeValid", (void *)RTNetIPv4IsUDPSizeValid },
372 { "RTNetIPv4IsUDPValid", (void *)RTNetIPv4IsUDPValid },
373 { "RTNetIPv4PseudoChecksum", (void *)RTNetIPv4PseudoChecksum },
374 { "RTNetIPv4PseudoChecksumBits", (void *)RTNetIPv4PseudoChecksumBits },
375 { "RTNetIPv4TCPChecksum", (void *)RTNetIPv4TCPChecksum },
376 { "RTNetIPv4UDPChecksum", (void *)RTNetIPv4UDPChecksum },
377 { "RTNetIPv6PseudoChecksum", (void *)RTNetIPv6PseudoChecksum },
378 { "RTNetIPv6PseudoChecksumBits", (void *)RTNetIPv6PseudoChecksumBits },
379 { "RTNetIPv6PseudoChecksumEx", (void *)RTNetIPv6PseudoChecksumEx },
380 { "RTNetTCPChecksum", (void *)RTNetTCPChecksum },
381 { "RTNetUDPChecksum", (void *)RTNetUDPChecksum },
382 { "RTCrc32", (void *)RTCrc32 },
383 { "RTCrc32Finish", (void *)RTCrc32Finish },
384 { "RTCrc32Process", (void *)RTCrc32Process },
385 { "RTCrc32Start", (void *)RTCrc32Start },
386};
387
388#if defined(RT_OS_DARWIN) || defined(RT_OS_SOLARIS) || defined(RT_OS_FREEBSD)
389/**
390 * Drag in the rest of IRPT since we share it with the
391 * rest of the kernel modules on darwin.
392 */
393PFNRT g_apfnVBoxDrvIPRTDeps[] =
394{
395 /* VBoxNetFlt */
396 (PFNRT)RTErrConvertFromErrno,
397 (PFNRT)RTUuidCompare,
398 (PFNRT)RTUuidCompareStr,
399 (PFNRT)RTUuidFromStr,
400 (PFNRT)RTStrDupTag,
401 (PFNRT)RTStrFree,
402 (PFNRT)RTStrCopy,
403 (PFNRT)RTStrNCmp,
404 /* VBoxNetAdp */
405 (PFNRT)RTRandBytes,
406 /* VBoxUSB */
407 (PFNRT)RTPathStripFilename,
408 NULL
409};
410#endif /* RT_OS_DARWIN || RT_OS_SOLARIS || RT_OS_SOLARIS */
411
412
413/**
414 * Initializes the device extentsion structure.
415 *
416 * @returns IPRT status code.
417 * @param pDevExt The device extension to initialize.
418 * @param cbSession The size of the session structure. The size of
419 * SUPDRVSESSION may be smaller when SUPDRV_AGNOSTIC is
420 * defined because we're skipping the OS specific members
421 * then.
422 */
423int VBOXCALL supdrvInitDevExt(PSUPDRVDEVEXT pDevExt, size_t cbSession)
424{
425 int rc;
426
427#ifdef SUPDRV_WITH_RELEASE_LOGGER
428 /*
429 * Create the release log.
430 */
431 static const char * const s_apszGroups[] = VBOX_LOGGROUP_NAMES;
432 PRTLOGGER pRelLogger;
433 rc = RTLogCreate(&pRelLogger, 0 /* fFlags */, "all",
434 "VBOX_RELEASE_LOG", RT_ELEMENTS(s_apszGroups), s_apszGroups, RTLOGDEST_STDOUT | RTLOGDEST_DEBUGGER, NULL);
435 if (RT_SUCCESS(rc))
436 RTLogRelSetDefaultInstance(pRelLogger);
437 /** @todo Add native hook for getting logger config parameters and setting
438 * them. On linux we should use the module parameter stuff... */
439#endif
440
441 /*
442 * Initialize it.
443 */
444 memset(pDevExt, 0, sizeof(*pDevExt));
445 rc = RTSpinlockCreate(&pDevExt->Spinlock);
446 if (RT_SUCCESS(rc))
447 {
448#ifdef SUPDRV_USE_MUTEX_FOR_LDR
449 rc = RTSemMutexCreate(&pDevExt->mtxLdr);
450#else
451 rc = RTSemFastMutexCreate(&pDevExt->mtxLdr);
452#endif
453 if (RT_SUCCESS(rc))
454 {
455 rc = RTSemFastMutexCreate(&pDevExt->mtxComponentFactory);
456 if (RT_SUCCESS(rc))
457 {
458#ifdef SUPDRV_USE_MUTEX_FOR_LDR
459 rc = RTSemMutexCreate(&pDevExt->mtxGip);
460#else
461 rc = RTSemFastMutexCreate(&pDevExt->mtxGip);
462#endif
463 if (RT_SUCCESS(rc))
464 {
465 rc = supdrvGipCreate(pDevExt);
466 if (RT_SUCCESS(rc))
467 {
468#ifdef VBOX_WITH_DTRACE_R0DRV
469 rc = supdrvVtgInit(pDevExt, &g_aFunctions[10]);
470 if (RT_SUCCESS(rc))
471#endif
472 {
473 pDevExt->pLdrInitImage = NULL;
474 pDevExt->hLdrInitThread = NIL_RTNATIVETHREAD;
475 pDevExt->u32Cookie = BIRD; /** @todo make this random? */
476 pDevExt->cbSession = (uint32_t)cbSession;
477
478 /*
479 * Fixup the absolute symbols.
480 *
481 * Because of the table indexing assumptions we'll have a little #ifdef orgy
482 * here rather than distributing this to OS specific files. At least for now.
483 */
484#ifdef RT_OS_DARWIN
485# if ARCH_BITS == 32
486 if (SUPR0GetPagingMode() >= SUPPAGINGMODE_AMD64)
487 {
488 g_aFunctions[0].pfn = (void *)1; /* SUPR0AbsIs64bit */
489 g_aFunctions[1].pfn = (void *)0x80; /* SUPR0Abs64bitKernelCS - KERNEL64_CS, seg.h */
490 g_aFunctions[2].pfn = (void *)0x88; /* SUPR0Abs64bitKernelSS - KERNEL64_SS, seg.h */
491 g_aFunctions[3].pfn = (void *)0x88; /* SUPR0Abs64bitKernelDS - KERNEL64_SS, seg.h */
492 }
493 else
494 g_aFunctions[0].pfn = g_aFunctions[1].pfn = g_aFunctions[2].pfn = g_aFunctions[4].pfn = (void *)0;
495 g_aFunctions[4].pfn = (void *)0x08; /* SUPR0AbsKernelCS - KERNEL_CS, seg.h */
496 g_aFunctions[5].pfn = (void *)0x10; /* SUPR0AbsKernelSS - KERNEL_DS, seg.h */
497 g_aFunctions[6].pfn = (void *)0x10; /* SUPR0AbsKernelDS - KERNEL_DS, seg.h */
498 g_aFunctions[7].pfn = (void *)0x10; /* SUPR0AbsKernelES - KERNEL_DS, seg.h */
499 g_aFunctions[8].pfn = (void *)0x10; /* SUPR0AbsKernelFS - KERNEL_DS, seg.h */
500 g_aFunctions[9].pfn = (void *)0x48; /* SUPR0AbsKernelGS - CPU_DATA_GS, seg.h */
501# else /* 64-bit darwin: */
502 g_aFunctions[0].pfn = (void *)1; /* SUPR0AbsIs64bit */
503 g_aFunctions[1].pfn = (void *)(uintptr_t)ASMGetCS(); /* SUPR0Abs64bitKernelCS */
504 g_aFunctions[2].pfn = (void *)(uintptr_t)ASMGetSS(); /* SUPR0Abs64bitKernelSS */
505 g_aFunctions[3].pfn = (void *)0; /* SUPR0Abs64bitKernelDS */
506 g_aFunctions[4].pfn = (void *)(uintptr_t)ASMGetCS(); /* SUPR0AbsKernelCS */
507 g_aFunctions[5].pfn = (void *)(uintptr_t)ASMGetSS(); /* SUPR0AbsKernelSS */
508 g_aFunctions[6].pfn = (void *)0; /* SUPR0AbsKernelDS */
509 g_aFunctions[7].pfn = (void *)0; /* SUPR0AbsKernelES */
510 g_aFunctions[8].pfn = (void *)0; /* SUPR0AbsKernelFS */
511 g_aFunctions[9].pfn = (void *)0; /* SUPR0AbsKernelGS */
512
513# endif
514#else /* !RT_OS_DARWIN */
515# if ARCH_BITS == 64
516 g_aFunctions[0].pfn = (void *)1; /* SUPR0AbsIs64bit */
517 g_aFunctions[1].pfn = (void *)(uintptr_t)ASMGetCS(); /* SUPR0Abs64bitKernelCS */
518 g_aFunctions[2].pfn = (void *)(uintptr_t)ASMGetSS(); /* SUPR0Abs64bitKernelSS */
519 g_aFunctions[3].pfn = (void *)(uintptr_t)ASMGetDS(); /* SUPR0Abs64bitKernelDS */
520# else
521 g_aFunctions[0].pfn = g_aFunctions[1].pfn = g_aFunctions[2].pfn = g_aFunctions[4].pfn = (void *)0;
522# endif
523 g_aFunctions[4].pfn = (void *)(uintptr_t)ASMGetCS(); /* SUPR0AbsKernelCS */
524 g_aFunctions[5].pfn = (void *)(uintptr_t)ASMGetSS(); /* SUPR0AbsKernelSS */
525 g_aFunctions[6].pfn = (void *)(uintptr_t)ASMGetDS(); /* SUPR0AbsKernelDS */
526 g_aFunctions[7].pfn = (void *)(uintptr_t)ASMGetES(); /* SUPR0AbsKernelES */
527 g_aFunctions[8].pfn = (void *)(uintptr_t)ASMGetFS(); /* SUPR0AbsKernelFS */
528 g_aFunctions[9].pfn = (void *)(uintptr_t)ASMGetGS(); /* SUPR0AbsKernelGS */
529#endif /* !RT_OS_DARWIN */
530 return VINF_SUCCESS;
531 }
532
533#ifdef VBOX_WITH_DTRACE_R0DRV
534 supdrvGipDestroy(pDevExt);
535#endif
536 }
537
538#ifdef SUPDRV_USE_MUTEX_FOR_GIP
539 RTSemMutexDestroy(pDevExt->mtxGip);
540 pDevExt->mtxGip = NIL_RTSEMMUTEX;
541#else
542 RTSemFastMutexDestroy(pDevExt->mtxGip);
543 pDevExt->mtxGip = NIL_RTSEMFASTMUTEX;
544#endif
545 }
546 RTSemFastMutexDestroy(pDevExt->mtxComponentFactory);
547 pDevExt->mtxComponentFactory = NIL_RTSEMFASTMUTEX;
548 }
549#ifdef SUPDRV_USE_MUTEX_FOR_LDR
550 RTSemMutexDestroy(pDevExt->mtxLdr);
551 pDevExt->mtxLdr = NIL_RTSEMMUTEX;
552#else
553 RTSemFastMutexDestroy(pDevExt->mtxLdr);
554 pDevExt->mtxLdr = NIL_RTSEMFASTMUTEX;
555#endif
556 }
557 RTSpinlockDestroy(pDevExt->Spinlock);
558 pDevExt->Spinlock = NIL_RTSPINLOCK;
559 }
560#ifdef SUPDRV_WITH_RELEASE_LOGGER
561 RTLogDestroy(RTLogRelSetDefaultInstance(NULL));
562 RTLogDestroy(RTLogSetDefaultInstance(NULL));
563#endif
564
565 return rc;
566}
567
568
569/**
570 * Delete the device extension (e.g. cleanup members).
571 *
572 * @param pDevExt The device extension to delete.
573 */
574void VBOXCALL supdrvDeleteDevExt(PSUPDRVDEVEXT pDevExt)
575{
576 PSUPDRVOBJ pObj;
577 PSUPDRVUSAGE pUsage;
578
579 /*
580 * Kill mutexes and spinlocks.
581 */
582#ifdef SUPDRV_USE_MUTEX_FOR_GIP
583 RTSemMutexDestroy(pDevExt->mtxGip);
584 pDevExt->mtxGip = NIL_RTSEMMUTEX;
585#else
586 RTSemFastMutexDestroy(pDevExt->mtxGip);
587 pDevExt->mtxGip = NIL_RTSEMFASTMUTEX;
588#endif
589#ifdef SUPDRV_USE_MUTEX_FOR_LDR
590 RTSemMutexDestroy(pDevExt->mtxLdr);
591 pDevExt->mtxLdr = NIL_RTSEMMUTEX;
592#else
593 RTSemFastMutexDestroy(pDevExt->mtxLdr);
594 pDevExt->mtxLdr = NIL_RTSEMFASTMUTEX;
595#endif
596 RTSpinlockDestroy(pDevExt->Spinlock);
597 pDevExt->Spinlock = NIL_RTSPINLOCK;
598 RTSemFastMutexDestroy(pDevExt->mtxComponentFactory);
599 pDevExt->mtxComponentFactory = NIL_RTSEMFASTMUTEX;
600
601 /*
602 * Free lists.
603 */
604 /* objects. */
605 pObj = pDevExt->pObjs;
606 Assert(!pObj); /* (can trigger on forced unloads) */
607 pDevExt->pObjs = NULL;
608 while (pObj)
609 {
610 void *pvFree = pObj;
611 pObj = pObj->pNext;
612 RTMemFree(pvFree);
613 }
614
615 /* usage records. */
616 pUsage = pDevExt->pUsageFree;
617 pDevExt->pUsageFree = NULL;
618 while (pUsage)
619 {
620 void *pvFree = pUsage;
621 pUsage = pUsage->pNext;
622 RTMemFree(pvFree);
623 }
624
625 /* kill the GIP. */
626 supdrvGipDestroy(pDevExt);
627
628#ifdef VBOX_WITH_DTRACE_R0DRV
629 supdrvVtgTerm(pDevExt);
630#endif
631
632#ifdef SUPDRV_WITH_RELEASE_LOGGER
633 /* destroy the loggers. */
634 RTLogDestroy(RTLogRelSetDefaultInstance(NULL));
635 RTLogDestroy(RTLogSetDefaultInstance(NULL));
636#endif
637}
638
639
640/**
641 * Create session.
642 *
643 * @returns IPRT status code.
644 * @param pDevExt Device extension.
645 * @param fUser Flag indicating whether this is a user or kernel session.
646 * @param ppSession Where to store the pointer to the session data.
647 */
648int VBOXCALL supdrvCreateSession(PSUPDRVDEVEXT pDevExt, bool fUser, PSUPDRVSESSION *ppSession)
649{
650 /*
651 * Allocate memory for the session data.
652 */
653 int rc;
654 PSUPDRVSESSION pSession = *ppSession = (PSUPDRVSESSION)RTMemAllocZ(pDevExt->cbSession);
655 if (pSession)
656 {
657 /* Initialize session data. */
658 rc = RTSpinlockCreate(&pSession->Spinlock);
659 if (!rc)
660 {
661 rc = RTHandleTableCreateEx(&pSession->hHandleTable,
662 RTHANDLETABLE_FLAGS_LOCKED | RTHANDLETABLE_FLAGS_CONTEXT,
663 1 /*uBase*/, 32768 /*cMax*/, supdrvSessionObjHandleRetain, pSession);
664 if (RT_SUCCESS(rc))
665 {
666 Assert(pSession->Spinlock != NIL_RTSPINLOCK);
667 pSession->pDevExt = pDevExt;
668 pSession->u32Cookie = BIRD_INV;
669 /*pSession->pLdrUsage = NULL;
670 pSession->pVM = NULL;
671 pSession->pUsage = NULL;
672 pSession->pGip = NULL;
673 pSession->fGipReferenced = false;
674 pSession->Bundle.cUsed = 0; */
675 pSession->Uid = NIL_RTUID;
676 pSession->Gid = NIL_RTGID;
677 if (fUser)
678 {
679 pSession->Process = RTProcSelf();
680 pSession->R0Process = RTR0ProcHandleSelf();
681 }
682 else
683 {
684 pSession->Process = NIL_RTPROCESS;
685 pSession->R0Process = NIL_RTR0PROCESS;
686 }
687
688 VBOXDRV_SESSION_CREATE(pSession, fUser);
689 LogFlow(("Created session %p initial cookie=%#x\n", pSession, pSession->u32Cookie));
690 return VINF_SUCCESS;
691 }
692
693 RTSpinlockDestroy(pSession->Spinlock);
694 }
695 RTMemFree(pSession);
696 *ppSession = NULL;
697 Log(("Failed to create spinlock, rc=%d!\n", rc));
698 }
699 else
700 rc = VERR_NO_MEMORY;
701
702 return rc;
703}
704
705
706/**
707 * Shared code for cleaning up a session.
708 *
709 * @param pDevExt Device extension.
710 * @param pSession Session data.
711 * This data will be freed by this routine.
712 */
713void VBOXCALL supdrvCloseSession(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession)
714{
715 VBOXDRV_SESSION_CLOSE(pSession);
716
717 /*
718 * Cleanup the session first.
719 */
720 supdrvCleanupSession(pDevExt, pSession);
721
722 /*
723 * Free the rest of the session stuff.
724 */
725 RTSpinlockDestroy(pSession->Spinlock);
726 pSession->Spinlock = NIL_RTSPINLOCK;
727 pSession->pDevExt = NULL;
728 RTMemFree(pSession);
729 LogFlow(("supdrvCloseSession: returns\n"));
730}
731
732
733/**
734 * Shared code for cleaning up a session (but not quite freeing it).
735 *
736 * This is primarily intended for MAC OS X where we have to clean up the memory
737 * stuff before the file handle is closed.
738 *
739 * @param pDevExt Device extension.
740 * @param pSession Session data.
741 * This data will be freed by this routine.
742 */
743void VBOXCALL supdrvCleanupSession(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession)
744{
745 int rc;
746 PSUPDRVBUNDLE pBundle;
747 LogFlow(("supdrvCleanupSession: pSession=%p\n", pSession));
748
749 /*
750 * Remove logger instances related to this session.
751 */
752 RTLogSetDefaultInstanceThread(NULL, (uintptr_t)pSession);
753
754 /*
755 * Destroy the handle table.
756 */
757 rc = RTHandleTableDestroy(pSession->hHandleTable, supdrvSessionObjHandleDelete, pSession);
758 AssertRC(rc);
759 pSession->hHandleTable = NIL_RTHANDLETABLE;
760
761 /*
762 * Release object references made in this session.
763 * In theory there should be noone racing us in this session.
764 */
765 Log2(("release objects - start\n"));
766 if (pSession->pUsage)
767 {
768 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
769 PSUPDRVUSAGE pUsage;
770 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
771
772 while ((pUsage = pSession->pUsage) != NULL)
773 {
774 PSUPDRVOBJ pObj = pUsage->pObj;
775 pSession->pUsage = pUsage->pNext;
776
777 AssertMsg(pUsage->cUsage >= 1 && pObj->cUsage >= pUsage->cUsage, ("glob %d; sess %d\n", pObj->cUsage, pUsage->cUsage));
778 if (pUsage->cUsage < pObj->cUsage)
779 {
780 pObj->cUsage -= pUsage->cUsage;
781 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
782 }
783 else
784 {
785 /* Destroy the object and free the record. */
786 if (pDevExt->pObjs == pObj)
787 pDevExt->pObjs = pObj->pNext;
788 else
789 {
790 PSUPDRVOBJ pObjPrev;
791 for (pObjPrev = pDevExt->pObjs; pObjPrev; pObjPrev = pObjPrev->pNext)
792 if (pObjPrev->pNext == pObj)
793 {
794 pObjPrev->pNext = pObj->pNext;
795 break;
796 }
797 Assert(pObjPrev);
798 }
799 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
800
801 Log(("supdrvCleanupSession: destroying %p/%d (%p/%p) cpid=%RTproc pid=%RTproc dtor=%p\n",
802 pObj, pObj->enmType, pObj->pvUser1, pObj->pvUser2, pObj->CreatorProcess, RTProcSelf(), pObj->pfnDestructor));
803 if (pObj->pfnDestructor)
804 pObj->pfnDestructor(pObj, pObj->pvUser1, pObj->pvUser2);
805 RTMemFree(pObj);
806 }
807
808 /* free it and continue. */
809 RTMemFree(pUsage);
810
811 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
812 }
813
814 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
815 AssertMsg(!pSession->pUsage, ("Some buster reregistered an object during desturction!\n"));
816 }
817 Log2(("release objects - done\n"));
818
819 /*
820 * Release memory allocated in the session.
821 *
822 * We do not serialize this as we assume that the application will
823 * not allocated memory while closing the file handle object.
824 */
825 Log2(("freeing memory:\n"));
826 pBundle = &pSession->Bundle;
827 while (pBundle)
828 {
829 PSUPDRVBUNDLE pToFree;
830 unsigned i;
831
832 /*
833 * Check and unlock all entries in the bundle.
834 */
835 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
836 {
837 if (pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ)
838 {
839 Log2(("eType=%d pvR0=%p pvR3=%p cb=%ld\n", pBundle->aMem[i].eType, RTR0MemObjAddress(pBundle->aMem[i].MemObj),
840 (void *)RTR0MemObjAddressR3(pBundle->aMem[i].MapObjR3), (long)RTR0MemObjSize(pBundle->aMem[i].MemObj)));
841 if (pBundle->aMem[i].MapObjR3 != NIL_RTR0MEMOBJ)
842 {
843 rc = RTR0MemObjFree(pBundle->aMem[i].MapObjR3, false);
844 AssertRC(rc); /** @todo figure out how to handle this. */
845 pBundle->aMem[i].MapObjR3 = NIL_RTR0MEMOBJ;
846 }
847 rc = RTR0MemObjFree(pBundle->aMem[i].MemObj, true /* fFreeMappings */);
848 AssertRC(rc); /** @todo figure out how to handle this. */
849 pBundle->aMem[i].MemObj = NIL_RTR0MEMOBJ;
850 pBundle->aMem[i].eType = MEMREF_TYPE_UNUSED;
851 }
852 }
853
854 /*
855 * Advance and free previous bundle.
856 */
857 pToFree = pBundle;
858 pBundle = pBundle->pNext;
859
860 pToFree->pNext = NULL;
861 pToFree->cUsed = 0;
862 if (pToFree != &pSession->Bundle)
863 RTMemFree(pToFree);
864 }
865 Log2(("freeing memory - done\n"));
866
867 /*
868 * Deregister component factories.
869 */
870 RTSemFastMutexRequest(pDevExt->mtxComponentFactory);
871 Log2(("deregistering component factories:\n"));
872 if (pDevExt->pComponentFactoryHead)
873 {
874 PSUPDRVFACTORYREG pPrev = NULL;
875 PSUPDRVFACTORYREG pCur = pDevExt->pComponentFactoryHead;
876 while (pCur)
877 {
878 if (pCur->pSession == pSession)
879 {
880 /* unlink it */
881 PSUPDRVFACTORYREG pNext = pCur->pNext;
882 if (pPrev)
883 pPrev->pNext = pNext;
884 else
885 pDevExt->pComponentFactoryHead = pNext;
886
887 /* free it */
888 pCur->pNext = NULL;
889 pCur->pSession = NULL;
890 pCur->pFactory = NULL;
891 RTMemFree(pCur);
892
893 /* next */
894 pCur = pNext;
895 }
896 else
897 {
898 /* next */
899 pPrev = pCur;
900 pCur = pCur->pNext;
901 }
902 }
903 }
904 RTSemFastMutexRelease(pDevExt->mtxComponentFactory);
905 Log2(("deregistering component factories - done\n"));
906
907 /*
908 * Loaded images needs to be dereferenced and possibly freed up.
909 */
910 supdrvLdrLock(pDevExt);
911 Log2(("freeing images:\n"));
912 if (pSession->pLdrUsage)
913 {
914 PSUPDRVLDRUSAGE pUsage = pSession->pLdrUsage;
915 pSession->pLdrUsage = NULL;
916 while (pUsage)
917 {
918 void *pvFree = pUsage;
919 PSUPDRVLDRIMAGE pImage = pUsage->pImage;
920 if (pImage->cUsage > pUsage->cUsage)
921 pImage->cUsage -= pUsage->cUsage;
922 else
923 supdrvLdrFree(pDevExt, pImage);
924 pUsage->pImage = NULL;
925 pUsage = pUsage->pNext;
926 RTMemFree(pvFree);
927 }
928 }
929 supdrvLdrUnlock(pDevExt);
930 Log2(("freeing images - done\n"));
931
932 /*
933 * Unmap the GIP.
934 */
935 Log2(("umapping GIP:\n"));
936 if (pSession->GipMapObjR3 != NIL_RTR0MEMOBJ)
937 {
938 SUPR0GipUnmap(pSession);
939 pSession->fGipReferenced = 0;
940 }
941 Log2(("umapping GIP - done\n"));
942}
943
944
945/**
946 * RTHandleTableDestroy callback used by supdrvCleanupSession.
947 *
948 * @returns IPRT status code, see SUPR0ObjAddRef.
949 * @param hHandleTable The handle table handle. Ignored.
950 * @param pvObj The object pointer.
951 * @param pvCtx Context, the handle type. Ignored.
952 * @param pvUser Session pointer.
953 */
954static DECLCALLBACK(int) supdrvSessionObjHandleRetain(RTHANDLETABLE hHandleTable, void *pvObj, void *pvCtx, void *pvUser)
955{
956 NOREF(pvCtx);
957 NOREF(hHandleTable);
958 return SUPR0ObjAddRefEx(pvObj, (PSUPDRVSESSION)pvUser, true /*fNoBlocking*/);
959}
960
961
962/**
963 * RTHandleTableDestroy callback used by supdrvCleanupSession.
964 *
965 * @param hHandleTable The handle table handle. Ignored.
966 * @param h The handle value. Ignored.
967 * @param pvObj The object pointer.
968 * @param pvCtx Context, the handle type. Ignored.
969 * @param pvUser Session pointer.
970 */
971static DECLCALLBACK(void) supdrvSessionObjHandleDelete(RTHANDLETABLE hHandleTable, uint32_t h, void *pvObj, void *pvCtx, void *pvUser)
972{
973 NOREF(pvCtx);
974 NOREF(h);
975 NOREF(hHandleTable);
976 SUPR0ObjRelease(pvObj, (PSUPDRVSESSION)pvUser);
977}
978
979
980/**
981 * Fast path I/O Control worker.
982 *
983 * @returns VBox status code that should be passed down to ring-3 unchanged.
984 * @param uIOCtl Function number.
985 * @param idCpu VMCPU id.
986 * @param pDevExt Device extention.
987 * @param pSession Session data.
988 */
989int VBOXCALL supdrvIOCtlFast(uintptr_t uIOCtl, VMCPUID idCpu, PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession)
990{
991 /*
992 * We check the two prereqs after doing this only to allow the compiler to optimize things better.
993 */
994 if (RT_LIKELY( RT_VALID_PTR(pSession)
995 && pSession->pVM
996 && pDevExt->pfnVMMR0EntryFast))
997 {
998 switch (uIOCtl)
999 {
1000 case SUP_IOCTL_FAST_DO_RAW_RUN:
1001 pDevExt->pfnVMMR0EntryFast(pSession->pVM, idCpu, SUP_VMMR0_DO_RAW_RUN);
1002 break;
1003 case SUP_IOCTL_FAST_DO_HWACC_RUN:
1004 pDevExt->pfnVMMR0EntryFast(pSession->pVM, idCpu, SUP_VMMR0_DO_HWACC_RUN);
1005 break;
1006 case SUP_IOCTL_FAST_DO_NOP:
1007 pDevExt->pfnVMMR0EntryFast(pSession->pVM, idCpu, SUP_VMMR0_DO_NOP);
1008 break;
1009 default:
1010 return VERR_INTERNAL_ERROR;
1011 }
1012 return VINF_SUCCESS;
1013 }
1014 return VERR_INTERNAL_ERROR;
1015}
1016
1017
1018/**
1019 * Helper for supdrvIOCtl. Check if pszStr contains any character of pszChars.
1020 * We would use strpbrk here if this function would be contained in the RedHat kABI white
1021 * list, see http://www.kerneldrivers.org/RHEL5.
1022 *
1023 * @returns 1 if pszStr does contain any character of pszChars, 0 otherwise.
1024 * @param pszStr String to check
1025 * @param pszChars Character set
1026 */
1027static int supdrvCheckInvalidChar(const char *pszStr, const char *pszChars)
1028{
1029 int chCur;
1030 while ((chCur = *pszStr++) != '\0')
1031 {
1032 int ch;
1033 const char *psz = pszChars;
1034 while ((ch = *psz++) != '\0')
1035 if (ch == chCur)
1036 return 1;
1037
1038 }
1039 return 0;
1040}
1041
1042
1043/**
1044 * I/O Control worker.
1045 *
1046 * @returns IPRT status code.
1047 * @retval VERR_INVALID_PARAMETER if the request is invalid.
1048 *
1049 * @param uIOCtl Function number.
1050 * @param pDevExt Device extention.
1051 * @param pSession Session data.
1052 * @param pReqHdr The request header.
1053 */
1054int VBOXCALL supdrvIOCtl(uintptr_t uIOCtl, PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPREQHDR pReqHdr)
1055{
1056 VBOXDRV_IOCTL_ENTRY(pSession, uIOCtl, pReqHdr);
1057
1058 /*
1059 * Validate the request.
1060 */
1061 /* this first check could probably be omitted as its also done by the OS specific code... */
1062 if (RT_UNLIKELY( (pReqHdr->fFlags & SUPREQHDR_FLAGS_MAGIC_MASK) != SUPREQHDR_FLAGS_MAGIC
1063 || pReqHdr->cbIn < sizeof(*pReqHdr)
1064 || pReqHdr->cbOut < sizeof(*pReqHdr)))
1065 {
1066 OSDBGPRINT(("vboxdrv: Bad ioctl request header; cbIn=%#lx cbOut=%#lx fFlags=%#lx\n",
1067 (long)pReqHdr->cbIn, (long)pReqHdr->cbOut, (long)pReqHdr->fFlags));
1068 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VINF_SUCCESS);
1069 return VERR_INVALID_PARAMETER;
1070 }
1071 if (RT_UNLIKELY(!RT_VALID_PTR(pSession)))
1072 {
1073 OSDBGPRINT(("vboxdrv: Invalid pSession valud %p (ioctl=%p)\n", pSession, (void *)uIOCtl));
1074 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VINF_SUCCESS);
1075 return VERR_INVALID_PARAMETER;
1076 }
1077 if (RT_UNLIKELY(uIOCtl == SUP_IOCTL_COOKIE))
1078 {
1079 if (pReqHdr->u32Cookie != SUPCOOKIE_INITIAL_COOKIE)
1080 {
1081 OSDBGPRINT(("SUP_IOCTL_COOKIE: bad cookie %#lx\n", (long)pReqHdr->u32Cookie));
1082 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VINF_SUCCESS);
1083 return VERR_INVALID_PARAMETER;
1084 }
1085 }
1086 else if (RT_UNLIKELY( pReqHdr->u32Cookie != pDevExt->u32Cookie
1087 || pReqHdr->u32SessionCookie != pSession->u32Cookie))
1088 {
1089 OSDBGPRINT(("vboxdrv: bad cookie %#lx / %#lx.\n", (long)pReqHdr->u32Cookie, (long)pReqHdr->u32SessionCookie));
1090 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VINF_SUCCESS);
1091 return VERR_INVALID_PARAMETER;
1092 }
1093
1094/*
1095 * Validation macros
1096 */
1097#define REQ_CHECK_SIZES_EX(Name, cbInExpect, cbOutExpect) \
1098 do { \
1099 if (RT_UNLIKELY(pReqHdr->cbIn != (cbInExpect) || pReqHdr->cbOut != (cbOutExpect))) \
1100 { \
1101 OSDBGPRINT(( #Name ": Invalid input/output sizes. cbIn=%ld expected %ld. cbOut=%ld expected %ld.\n", \
1102 (long)pReq->Hdr.cbIn, (long)(cbInExpect), (long)pReq->Hdr.cbOut, (long)(cbOutExpect))); \
1103 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VERR_INVALID_PARAMETER); \
1104 return pReq->Hdr.rc = VERR_INVALID_PARAMETER; \
1105 } \
1106 } while (0)
1107
1108#define REQ_CHECK_SIZES(Name) REQ_CHECK_SIZES_EX(Name, Name ## _SIZE_IN, Name ## _SIZE_OUT)
1109
1110#define REQ_CHECK_SIZE_IN(Name, cbInExpect) \
1111 do { \
1112 if (RT_UNLIKELY(pReqHdr->cbIn != (cbInExpect))) \
1113 { \
1114 OSDBGPRINT(( #Name ": Invalid input/output sizes. cbIn=%ld expected %ld.\n", \
1115 (long)pReq->Hdr.cbIn, (long)(cbInExpect))); \
1116 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VERR_INVALID_PARAMETER); \
1117 return pReq->Hdr.rc = VERR_INVALID_PARAMETER; \
1118 } \
1119 } while (0)
1120
1121#define REQ_CHECK_SIZE_OUT(Name, cbOutExpect) \
1122 do { \
1123 if (RT_UNLIKELY(pReqHdr->cbOut != (cbOutExpect))) \
1124 { \
1125 OSDBGPRINT(( #Name ": Invalid input/output sizes. cbOut=%ld expected %ld.\n", \
1126 (long)pReq->Hdr.cbOut, (long)(cbOutExpect))); \
1127 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VERR_INVALID_PARAMETER); \
1128 return pReq->Hdr.rc = VERR_INVALID_PARAMETER; \
1129 } \
1130 } while (0)
1131
1132#define REQ_CHECK_EXPR(Name, expr) \
1133 do { \
1134 if (RT_UNLIKELY(!(expr))) \
1135 { \
1136 OSDBGPRINT(( #Name ": %s\n", #expr)); \
1137 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VERR_INVALID_PARAMETER); \
1138 return pReq->Hdr.rc = VERR_INVALID_PARAMETER; \
1139 } \
1140 } while (0)
1141
1142#define REQ_CHECK_EXPR_FMT(expr, fmt) \
1143 do { \
1144 if (RT_UNLIKELY(!(expr))) \
1145 { \
1146 OSDBGPRINT( fmt ); \
1147 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_INVALID_PARAMETER, VERR_INVALID_PARAMETER); \
1148 return pReq->Hdr.rc = VERR_INVALID_PARAMETER; \
1149 } \
1150 } while (0)
1151
1152 /*
1153 * The switch.
1154 */
1155 switch (SUP_CTL_CODE_NO_SIZE(uIOCtl))
1156 {
1157 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_COOKIE):
1158 {
1159 PSUPCOOKIE pReq = (PSUPCOOKIE)pReqHdr;
1160 REQ_CHECK_SIZES(SUP_IOCTL_COOKIE);
1161 if (strncmp(pReq->u.In.szMagic, SUPCOOKIE_MAGIC, sizeof(pReq->u.In.szMagic)))
1162 {
1163 OSDBGPRINT(("SUP_IOCTL_COOKIE: invalid magic %.16s\n", pReq->u.In.szMagic));
1164 pReq->Hdr.rc = VERR_INVALID_MAGIC;
1165 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, VERR_INVALID_MAGIC);
1166 return 0;
1167 }
1168
1169#if 0
1170 /*
1171 * Call out to the OS specific code and let it do permission checks on the
1172 * client process.
1173 */
1174 if (!supdrvOSValidateClientProcess(pDevExt, pSession))
1175 {
1176 pReq->u.Out.u32Cookie = 0xffffffff;
1177 pReq->u.Out.u32SessionCookie = 0xffffffff;
1178 pReq->u.Out.u32SessionVersion = 0xffffffff;
1179 pReq->u.Out.u32DriverVersion = SUPDRV_IOC_VERSION;
1180 pReq->u.Out.pSession = NULL;
1181 pReq->u.Out.cFunctions = 0;
1182 pReq->Hdr.rc = VERR_PERMISSION_DENIED;
1183 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, VERR_PERMISSION_DENIED);
1184 return 0;
1185 }
1186#endif
1187
1188 /*
1189 * Match the version.
1190 * The current logic is very simple, match the major interface version.
1191 */
1192 if ( pReq->u.In.u32MinVersion > SUPDRV_IOC_VERSION
1193 || (pReq->u.In.u32MinVersion & 0xffff0000) != (SUPDRV_IOC_VERSION & 0xffff0000))
1194 {
1195 OSDBGPRINT(("SUP_IOCTL_COOKIE: Version mismatch. Requested: %#x Min: %#x Current: %#x\n",
1196 pReq->u.In.u32ReqVersion, pReq->u.In.u32MinVersion, SUPDRV_IOC_VERSION));
1197 pReq->u.Out.u32Cookie = 0xffffffff;
1198 pReq->u.Out.u32SessionCookie = 0xffffffff;
1199 pReq->u.Out.u32SessionVersion = 0xffffffff;
1200 pReq->u.Out.u32DriverVersion = SUPDRV_IOC_VERSION;
1201 pReq->u.Out.pSession = NULL;
1202 pReq->u.Out.cFunctions = 0;
1203 pReq->Hdr.rc = VERR_VERSION_MISMATCH;
1204 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1205 return 0;
1206 }
1207
1208 /*
1209 * Fill in return data and be gone.
1210 * N.B. The first one to change SUPDRV_IOC_VERSION shall makes sure that
1211 * u32SessionVersion <= u32ReqVersion!
1212 */
1213 /** @todo Somehow validate the client and negotiate a secure cookie... */
1214 pReq->u.Out.u32Cookie = pDevExt->u32Cookie;
1215 pReq->u.Out.u32SessionCookie = pSession->u32Cookie;
1216 pReq->u.Out.u32SessionVersion = SUPDRV_IOC_VERSION;
1217 pReq->u.Out.u32DriverVersion = SUPDRV_IOC_VERSION;
1218 pReq->u.Out.pSession = pSession;
1219 pReq->u.Out.cFunctions = sizeof(g_aFunctions) / sizeof(g_aFunctions[0]);
1220 pReq->Hdr.rc = VINF_SUCCESS;
1221 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1222 return 0;
1223 }
1224
1225 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_QUERY_FUNCS(0)):
1226 {
1227 /* validate */
1228 PSUPQUERYFUNCS pReq = (PSUPQUERYFUNCS)pReqHdr;
1229 REQ_CHECK_SIZES_EX(SUP_IOCTL_QUERY_FUNCS, SUP_IOCTL_QUERY_FUNCS_SIZE_IN, SUP_IOCTL_QUERY_FUNCS_SIZE_OUT(RT_ELEMENTS(g_aFunctions)));
1230
1231 /* execute */
1232 pReq->u.Out.cFunctions = RT_ELEMENTS(g_aFunctions);
1233 memcpy(&pReq->u.Out.aFunctions[0], g_aFunctions, sizeof(g_aFunctions));
1234 pReq->Hdr.rc = VINF_SUCCESS;
1235 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1236 return 0;
1237 }
1238
1239 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_LOCK):
1240 {
1241 /* validate */
1242 PSUPPAGELOCK pReq = (PSUPPAGELOCK)pReqHdr;
1243 REQ_CHECK_SIZE_IN(SUP_IOCTL_PAGE_LOCK, SUP_IOCTL_PAGE_LOCK_SIZE_IN);
1244 REQ_CHECK_SIZE_OUT(SUP_IOCTL_PAGE_LOCK, SUP_IOCTL_PAGE_LOCK_SIZE_OUT(pReq->u.In.cPages));
1245 REQ_CHECK_EXPR(SUP_IOCTL_PAGE_LOCK, pReq->u.In.cPages > 0);
1246 REQ_CHECK_EXPR(SUP_IOCTL_PAGE_LOCK, pReq->u.In.pvR3 >= PAGE_SIZE);
1247
1248 /* execute */
1249 pReq->Hdr.rc = SUPR0LockMem(pSession, pReq->u.In.pvR3, pReq->u.In.cPages, &pReq->u.Out.aPages[0]);
1250 if (RT_FAILURE(pReq->Hdr.rc))
1251 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1252 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1253 return 0;
1254 }
1255
1256 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_UNLOCK):
1257 {
1258 /* validate */
1259 PSUPPAGEUNLOCK pReq = (PSUPPAGEUNLOCK)pReqHdr;
1260 REQ_CHECK_SIZES(SUP_IOCTL_PAGE_UNLOCK);
1261
1262 /* execute */
1263 pReq->Hdr.rc = SUPR0UnlockMem(pSession, pReq->u.In.pvR3);
1264 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1265 return 0;
1266 }
1267
1268 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_CONT_ALLOC):
1269 {
1270 /* validate */
1271 PSUPCONTALLOC pReq = (PSUPCONTALLOC)pReqHdr;
1272 REQ_CHECK_SIZES(SUP_IOCTL_CONT_ALLOC);
1273
1274 /* execute */
1275 pReq->Hdr.rc = SUPR0ContAlloc(pSession, pReq->u.In.cPages, &pReq->u.Out.pvR0, &pReq->u.Out.pvR3, &pReq->u.Out.HCPhys);
1276 if (RT_FAILURE(pReq->Hdr.rc))
1277 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1278 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1279 return 0;
1280 }
1281
1282 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_CONT_FREE):
1283 {
1284 /* validate */
1285 PSUPCONTFREE pReq = (PSUPCONTFREE)pReqHdr;
1286 REQ_CHECK_SIZES(SUP_IOCTL_CONT_FREE);
1287
1288 /* execute */
1289 pReq->Hdr.rc = SUPR0ContFree(pSession, (RTHCUINTPTR)pReq->u.In.pvR3);
1290 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1291 return 0;
1292 }
1293
1294 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LDR_OPEN):
1295 {
1296 /* validate */
1297 PSUPLDROPEN pReq = (PSUPLDROPEN)pReqHdr;
1298 REQ_CHECK_SIZES(SUP_IOCTL_LDR_OPEN);
1299 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.cbImageWithTabs > 0);
1300 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.cbImageWithTabs < 16*_1M);
1301 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.cbImageBits > 0);
1302 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.cbImageBits > 0);
1303 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.cbImageBits < pReq->u.In.cbImageWithTabs);
1304 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, pReq->u.In.szName[0]);
1305 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, RTStrEnd(pReq->u.In.szName, sizeof(pReq->u.In.szName)));
1306 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, !supdrvCheckInvalidChar(pReq->u.In.szName, ";:()[]{}/\\|&*%#@!~`\"'"));
1307 REQ_CHECK_EXPR(SUP_IOCTL_LDR_OPEN, RTStrEnd(pReq->u.In.szFilename, sizeof(pReq->u.In.szFilename)));
1308
1309 /* execute */
1310 pReq->Hdr.rc = supdrvIOCtl_LdrOpen(pDevExt, pSession, pReq);
1311 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1312 return 0;
1313 }
1314
1315 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LDR_LOAD):
1316 {
1317 /* validate */
1318 PSUPLDRLOAD pReq = (PSUPLDRLOAD)pReqHdr;
1319 REQ_CHECK_EXPR(Name, pReq->Hdr.cbIn >= sizeof(*pReq));
1320 REQ_CHECK_SIZES_EX(SUP_IOCTL_LDR_LOAD, SUP_IOCTL_LDR_LOAD_SIZE_IN(pReq->u.In.cbImageWithTabs), SUP_IOCTL_LDR_LOAD_SIZE_OUT);
1321 REQ_CHECK_EXPR(SUP_IOCTL_LDR_LOAD, pReq->u.In.cSymbols <= 16384);
1322 REQ_CHECK_EXPR_FMT( !pReq->u.In.cSymbols
1323 || ( pReq->u.In.offSymbols < pReq->u.In.cbImageWithTabs
1324 && pReq->u.In.offSymbols + pReq->u.In.cSymbols * sizeof(SUPLDRSYM) <= pReq->u.In.cbImageWithTabs),
1325 ("SUP_IOCTL_LDR_LOAD: offSymbols=%#lx cSymbols=%#lx cbImageWithTabs=%#lx\n", (long)pReq->u.In.offSymbols,
1326 (long)pReq->u.In.cSymbols, (long)pReq->u.In.cbImageWithTabs));
1327 REQ_CHECK_EXPR_FMT( !pReq->u.In.cbStrTab
1328 || ( pReq->u.In.offStrTab < pReq->u.In.cbImageWithTabs
1329 && pReq->u.In.offStrTab + pReq->u.In.cbStrTab <= pReq->u.In.cbImageWithTabs
1330 && pReq->u.In.cbStrTab <= pReq->u.In.cbImageWithTabs),
1331 ("SUP_IOCTL_LDR_LOAD: offStrTab=%#lx cbStrTab=%#lx cbImageWithTabs=%#lx\n", (long)pReq->u.In.offStrTab,
1332 (long)pReq->u.In.cbStrTab, (long)pReq->u.In.cbImageWithTabs));
1333
1334 if (pReq->u.In.cSymbols)
1335 {
1336 uint32_t i;
1337 PSUPLDRSYM paSyms = (PSUPLDRSYM)&pReq->u.In.abImage[pReq->u.In.offSymbols];
1338 for (i = 0; i < pReq->u.In.cSymbols; i++)
1339 {
1340 REQ_CHECK_EXPR_FMT(paSyms[i].offSymbol < pReq->u.In.cbImageWithTabs,
1341 ("SUP_IOCTL_LDR_LOAD: sym #%ld: symb off %#lx (max=%#lx)\n", (long)i, (long)paSyms[i].offSymbol, (long)pReq->u.In.cbImageWithTabs));
1342 REQ_CHECK_EXPR_FMT(paSyms[i].offName < pReq->u.In.cbStrTab,
1343 ("SUP_IOCTL_LDR_LOAD: sym #%ld: name off %#lx (max=%#lx)\n", (long)i, (long)paSyms[i].offName, (long)pReq->u.In.cbImageWithTabs));
1344 REQ_CHECK_EXPR_FMT(RTStrEnd((char const *)&pReq->u.In.abImage[pReq->u.In.offStrTab + paSyms[i].offName],
1345 pReq->u.In.cbStrTab - paSyms[i].offName),
1346 ("SUP_IOCTL_LDR_LOAD: sym #%ld: unterminated name! (%#lx / %#lx)\n", (long)i, (long)paSyms[i].offName, (long)pReq->u.In.cbImageWithTabs));
1347 }
1348 }
1349
1350 /* execute */
1351 pReq->Hdr.rc = supdrvIOCtl_LdrLoad(pDevExt, pSession, pReq);
1352 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1353 return 0;
1354 }
1355
1356 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LDR_FREE):
1357 {
1358 /* validate */
1359 PSUPLDRFREE pReq = (PSUPLDRFREE)pReqHdr;
1360 REQ_CHECK_SIZES(SUP_IOCTL_LDR_FREE);
1361
1362 /* execute */
1363 pReq->Hdr.rc = supdrvIOCtl_LdrFree(pDevExt, pSession, pReq);
1364 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1365 return 0;
1366 }
1367
1368 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LDR_GET_SYMBOL):
1369 {
1370 /* validate */
1371 PSUPLDRGETSYMBOL pReq = (PSUPLDRGETSYMBOL)pReqHdr;
1372 REQ_CHECK_SIZES(SUP_IOCTL_LDR_GET_SYMBOL);
1373 REQ_CHECK_EXPR(SUP_IOCTL_LDR_GET_SYMBOL, RTStrEnd(pReq->u.In.szSymbol, sizeof(pReq->u.In.szSymbol)));
1374
1375 /* execute */
1376 pReq->Hdr.rc = supdrvIOCtl_LdrGetSymbol(pDevExt, pSession, pReq);
1377 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1378 return 0;
1379 }
1380
1381 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_CALL_VMMR0(0)):
1382 {
1383 /* validate */
1384 PSUPCALLVMMR0 pReq = (PSUPCALLVMMR0)pReqHdr;
1385 Log4(("SUP_IOCTL_CALL_VMMR0: op=%u in=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1386 pReq->u.In.uOperation, pReq->Hdr.cbIn, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1387
1388 if (pReq->Hdr.cbIn == SUP_IOCTL_CALL_VMMR0_SIZE(0))
1389 {
1390 REQ_CHECK_SIZES_EX(SUP_IOCTL_CALL_VMMR0, SUP_IOCTL_CALL_VMMR0_SIZE_IN(0), SUP_IOCTL_CALL_VMMR0_SIZE_OUT(0));
1391
1392 /* execute */
1393 if (RT_LIKELY(pDevExt->pfnVMMR0EntryEx))
1394 pReq->Hdr.rc = pDevExt->pfnVMMR0EntryEx(pReq->u.In.pVMR0, pReq->u.In.idCpu, pReq->u.In.uOperation, NULL, pReq->u.In.u64Arg, pSession);
1395 else
1396 pReq->Hdr.rc = VERR_WRONG_ORDER;
1397 }
1398 else
1399 {
1400 PSUPVMMR0REQHDR pVMMReq = (PSUPVMMR0REQHDR)&pReq->abReqPkt[0];
1401 REQ_CHECK_EXPR_FMT(pReq->Hdr.cbIn >= SUP_IOCTL_CALL_VMMR0_SIZE(sizeof(SUPVMMR0REQHDR)),
1402 ("SUP_IOCTL_CALL_VMMR0: cbIn=%#x < %#lx\n", pReq->Hdr.cbIn, SUP_IOCTL_CALL_VMMR0_SIZE(sizeof(SUPVMMR0REQHDR))));
1403 REQ_CHECK_EXPR(SUP_IOCTL_CALL_VMMR0, pVMMReq->u32Magic == SUPVMMR0REQHDR_MAGIC);
1404 REQ_CHECK_SIZES_EX(SUP_IOCTL_CALL_VMMR0, SUP_IOCTL_CALL_VMMR0_SIZE_IN(pVMMReq->cbReq), SUP_IOCTL_CALL_VMMR0_SIZE_OUT(pVMMReq->cbReq));
1405
1406 /* execute */
1407 if (RT_LIKELY(pDevExt->pfnVMMR0EntryEx))
1408 pReq->Hdr.rc = pDevExt->pfnVMMR0EntryEx(pReq->u.In.pVMR0, pReq->u.In.idCpu, pReq->u.In.uOperation, pVMMReq, pReq->u.In.u64Arg, pSession);
1409 else
1410 pReq->Hdr.rc = VERR_WRONG_ORDER;
1411 }
1412
1413 if ( RT_FAILURE(pReq->Hdr.rc)
1414 && pReq->Hdr.rc != VERR_INTERRUPTED
1415 && pReq->Hdr.rc != VERR_TIMEOUT)
1416 Log(("SUP_IOCTL_CALL_VMMR0: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1417 pReq->Hdr.rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1418 else
1419 Log4(("SUP_IOCTL_CALL_VMMR0: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1420 pReq->Hdr.rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1421 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1422 return 0;
1423 }
1424
1425 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_CALL_VMMR0_BIG):
1426 {
1427 /* validate */
1428 PSUPCALLVMMR0 pReq = (PSUPCALLVMMR0)pReqHdr;
1429 PSUPVMMR0REQHDR pVMMReq;
1430 Log4(("SUP_IOCTL_CALL_VMMR0_BIG: op=%u in=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1431 pReq->u.In.uOperation, pReq->Hdr.cbIn, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1432
1433 pVMMReq = (PSUPVMMR0REQHDR)&pReq->abReqPkt[0];
1434 REQ_CHECK_EXPR_FMT(pReq->Hdr.cbIn >= SUP_IOCTL_CALL_VMMR0_BIG_SIZE(sizeof(SUPVMMR0REQHDR)),
1435 ("SUP_IOCTL_CALL_VMMR0_BIG: cbIn=%#x < %#lx\n", pReq->Hdr.cbIn, SUP_IOCTL_CALL_VMMR0_BIG_SIZE(sizeof(SUPVMMR0REQHDR))));
1436 REQ_CHECK_EXPR(SUP_IOCTL_CALL_VMMR0_BIG, pVMMReq->u32Magic == SUPVMMR0REQHDR_MAGIC);
1437 REQ_CHECK_SIZES_EX(SUP_IOCTL_CALL_VMMR0_BIG, SUP_IOCTL_CALL_VMMR0_BIG_SIZE_IN(pVMMReq->cbReq), SUP_IOCTL_CALL_VMMR0_BIG_SIZE_OUT(pVMMReq->cbReq));
1438
1439 /* execute */
1440 if (RT_LIKELY(pDevExt->pfnVMMR0EntryEx))
1441 pReq->Hdr.rc = pDevExt->pfnVMMR0EntryEx(pReq->u.In.pVMR0, pReq->u.In.idCpu, pReq->u.In.uOperation, pVMMReq, pReq->u.In.u64Arg, pSession);
1442 else
1443 pReq->Hdr.rc = VERR_WRONG_ORDER;
1444
1445 if ( RT_FAILURE(pReq->Hdr.rc)
1446 && pReq->Hdr.rc != VERR_INTERRUPTED
1447 && pReq->Hdr.rc != VERR_TIMEOUT)
1448 Log(("SUP_IOCTL_CALL_VMMR0_BIG: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1449 pReq->Hdr.rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1450 else
1451 Log4(("SUP_IOCTL_CALL_VMMR0_BIG: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1452 pReq->Hdr.rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1453 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1454 return 0;
1455 }
1456
1457 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_GET_PAGING_MODE):
1458 {
1459 /* validate */
1460 PSUPGETPAGINGMODE pReq = (PSUPGETPAGINGMODE)pReqHdr;
1461 REQ_CHECK_SIZES(SUP_IOCTL_GET_PAGING_MODE);
1462
1463 /* execute */
1464 pReq->Hdr.rc = VINF_SUCCESS;
1465 pReq->u.Out.enmMode = SUPR0GetPagingMode();
1466 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1467 return 0;
1468 }
1469
1470 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LOW_ALLOC):
1471 {
1472 /* validate */
1473 PSUPLOWALLOC pReq = (PSUPLOWALLOC)pReqHdr;
1474 REQ_CHECK_EXPR(SUP_IOCTL_LOW_ALLOC, pReq->Hdr.cbIn <= SUP_IOCTL_LOW_ALLOC_SIZE_IN);
1475 REQ_CHECK_SIZES_EX(SUP_IOCTL_LOW_ALLOC, SUP_IOCTL_LOW_ALLOC_SIZE_IN, SUP_IOCTL_LOW_ALLOC_SIZE_OUT(pReq->u.In.cPages));
1476
1477 /* execute */
1478 pReq->Hdr.rc = SUPR0LowAlloc(pSession, pReq->u.In.cPages, &pReq->u.Out.pvR0, &pReq->u.Out.pvR3, &pReq->u.Out.aPages[0]);
1479 if (RT_FAILURE(pReq->Hdr.rc))
1480 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1481 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1482 return 0;
1483 }
1484
1485 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LOW_FREE):
1486 {
1487 /* validate */
1488 PSUPLOWFREE pReq = (PSUPLOWFREE)pReqHdr;
1489 REQ_CHECK_SIZES(SUP_IOCTL_LOW_FREE);
1490
1491 /* execute */
1492 pReq->Hdr.rc = SUPR0LowFree(pSession, (RTHCUINTPTR)pReq->u.In.pvR3);
1493 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1494 return 0;
1495 }
1496
1497 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_GIP_MAP):
1498 {
1499 /* validate */
1500 PSUPGIPMAP pReq = (PSUPGIPMAP)pReqHdr;
1501 REQ_CHECK_SIZES(SUP_IOCTL_GIP_MAP);
1502
1503 /* execute */
1504 pReq->Hdr.rc = SUPR0GipMap(pSession, &pReq->u.Out.pGipR3, &pReq->u.Out.HCPhysGip);
1505 if (RT_SUCCESS(pReq->Hdr.rc))
1506 pReq->u.Out.pGipR0 = pDevExt->pGip;
1507 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1508 return 0;
1509 }
1510
1511 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_GIP_UNMAP):
1512 {
1513 /* validate */
1514 PSUPGIPUNMAP pReq = (PSUPGIPUNMAP)pReqHdr;
1515 REQ_CHECK_SIZES(SUP_IOCTL_GIP_UNMAP);
1516
1517 /* execute */
1518 pReq->Hdr.rc = SUPR0GipUnmap(pSession);
1519 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1520 return 0;
1521 }
1522
1523 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_SET_VM_FOR_FAST):
1524 {
1525 /* validate */
1526 PSUPSETVMFORFAST pReq = (PSUPSETVMFORFAST)pReqHdr;
1527 REQ_CHECK_SIZES(SUP_IOCTL_SET_VM_FOR_FAST);
1528 REQ_CHECK_EXPR_FMT( !pReq->u.In.pVMR0
1529 || ( VALID_PTR(pReq->u.In.pVMR0)
1530 && !((uintptr_t)pReq->u.In.pVMR0 & (PAGE_SIZE - 1))),
1531 ("SUP_IOCTL_SET_VM_FOR_FAST: pVMR0=%p!\n", pReq->u.In.pVMR0));
1532 /* execute */
1533 pSession->pVM = pReq->u.In.pVMR0;
1534 pReq->Hdr.rc = VINF_SUCCESS;
1535 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1536 return 0;
1537 }
1538
1539 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_ALLOC_EX):
1540 {
1541 /* validate */
1542 PSUPPAGEALLOCEX pReq = (PSUPPAGEALLOCEX)pReqHdr;
1543 REQ_CHECK_EXPR(SUP_IOCTL_PAGE_ALLOC_EX, pReq->Hdr.cbIn <= SUP_IOCTL_PAGE_ALLOC_EX_SIZE_IN);
1544 REQ_CHECK_SIZES_EX(SUP_IOCTL_PAGE_ALLOC_EX, SUP_IOCTL_PAGE_ALLOC_EX_SIZE_IN, SUP_IOCTL_PAGE_ALLOC_EX_SIZE_OUT(pReq->u.In.cPages));
1545 REQ_CHECK_EXPR_FMT(pReq->u.In.fKernelMapping || pReq->u.In.fUserMapping,
1546 ("SUP_IOCTL_PAGE_ALLOC_EX: No mapping requested!\n"));
1547 REQ_CHECK_EXPR_FMT(pReq->u.In.fUserMapping,
1548 ("SUP_IOCTL_PAGE_ALLOC_EX: Must have user mapping!\n"));
1549 REQ_CHECK_EXPR_FMT(!pReq->u.In.fReserved0 && !pReq->u.In.fReserved1,
1550 ("SUP_IOCTL_PAGE_ALLOC_EX: fReserved0=%d fReserved1=%d\n", pReq->u.In.fReserved0, pReq->u.In.fReserved1));
1551
1552 /* execute */
1553 pReq->Hdr.rc = SUPR0PageAllocEx(pSession, pReq->u.In.cPages, 0 /* fFlags */,
1554 pReq->u.In.fUserMapping ? &pReq->u.Out.pvR3 : NULL,
1555 pReq->u.In.fKernelMapping ? &pReq->u.Out.pvR0 : NULL,
1556 &pReq->u.Out.aPages[0]);
1557 if (RT_FAILURE(pReq->Hdr.rc))
1558 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1559 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1560 return 0;
1561 }
1562
1563 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_MAP_KERNEL):
1564 {
1565 /* validate */
1566 PSUPPAGEMAPKERNEL pReq = (PSUPPAGEMAPKERNEL)pReqHdr;
1567 REQ_CHECK_SIZES(SUP_IOCTL_PAGE_MAP_KERNEL);
1568 REQ_CHECK_EXPR_FMT(!pReq->u.In.fFlags, ("SUP_IOCTL_PAGE_MAP_KERNEL: fFlags=%#x! MBZ\n", pReq->u.In.fFlags));
1569 REQ_CHECK_EXPR_FMT(!(pReq->u.In.offSub & PAGE_OFFSET_MASK), ("SUP_IOCTL_PAGE_MAP_KERNEL: offSub=%#x\n", pReq->u.In.offSub));
1570 REQ_CHECK_EXPR_FMT(pReq->u.In.cbSub && !(pReq->u.In.cbSub & PAGE_OFFSET_MASK),
1571 ("SUP_IOCTL_PAGE_MAP_KERNEL: cbSub=%#x\n", pReq->u.In.cbSub));
1572
1573 /* execute */
1574 pReq->Hdr.rc = SUPR0PageMapKernel(pSession, pReq->u.In.pvR3, pReq->u.In.offSub, pReq->u.In.cbSub,
1575 pReq->u.In.fFlags, &pReq->u.Out.pvR0);
1576 if (RT_FAILURE(pReq->Hdr.rc))
1577 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1578 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1579 return 0;
1580 }
1581
1582 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_PROTECT):
1583 {
1584 /* validate */
1585 PSUPPAGEPROTECT pReq = (PSUPPAGEPROTECT)pReqHdr;
1586 REQ_CHECK_SIZES(SUP_IOCTL_PAGE_PROTECT);
1587 REQ_CHECK_EXPR_FMT(!(pReq->u.In.fProt & ~(RTMEM_PROT_READ | RTMEM_PROT_WRITE | RTMEM_PROT_EXEC | RTMEM_PROT_NONE)),
1588 ("SUP_IOCTL_PAGE_PROTECT: fProt=%#x!\n", pReq->u.In.fProt));
1589 REQ_CHECK_EXPR_FMT(!(pReq->u.In.offSub & PAGE_OFFSET_MASK), ("SUP_IOCTL_PAGE_PROTECT: offSub=%#x\n", pReq->u.In.offSub));
1590 REQ_CHECK_EXPR_FMT(pReq->u.In.cbSub && !(pReq->u.In.cbSub & PAGE_OFFSET_MASK),
1591 ("SUP_IOCTL_PAGE_PROTECT: cbSub=%#x\n", pReq->u.In.cbSub));
1592
1593 /* execute */
1594 pReq->Hdr.rc = SUPR0PageProtect(pSession, pReq->u.In.pvR3, pReq->u.In.pvR0, pReq->u.In.offSub, pReq->u.In.cbSub, pReq->u.In.fProt);
1595 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1596 return 0;
1597 }
1598
1599 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_PAGE_FREE):
1600 {
1601 /* validate */
1602 PSUPPAGEFREE pReq = (PSUPPAGEFREE)pReqHdr;
1603 REQ_CHECK_SIZES(SUP_IOCTL_PAGE_FREE);
1604
1605 /* execute */
1606 pReq->Hdr.rc = SUPR0PageFree(pSession, pReq->u.In.pvR3);
1607 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1608 return 0;
1609 }
1610
1611 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_CALL_SERVICE(0)):
1612 {
1613 /* validate */
1614 PSUPCALLSERVICE pReq = (PSUPCALLSERVICE)pReqHdr;
1615 Log4(("SUP_IOCTL_CALL_SERVICE: op=%u in=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
1616 pReq->u.In.uOperation, pReq->Hdr.cbIn, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
1617
1618 if (pReq->Hdr.cbIn == SUP_IOCTL_CALL_SERVICE_SIZE(0))
1619 REQ_CHECK_SIZES_EX(SUP_IOCTL_CALL_SERVICE, SUP_IOCTL_CALL_SERVICE_SIZE_IN(0), SUP_IOCTL_CALL_SERVICE_SIZE_OUT(0));
1620 else
1621 {
1622 PSUPR0SERVICEREQHDR pSrvReq = (PSUPR0SERVICEREQHDR)&pReq->abReqPkt[0];
1623 REQ_CHECK_EXPR_FMT(pReq->Hdr.cbIn >= SUP_IOCTL_CALL_SERVICE_SIZE(sizeof(SUPR0SERVICEREQHDR)),
1624 ("SUP_IOCTL_CALL_SERVICE: cbIn=%#x < %#lx\n", pReq->Hdr.cbIn, SUP_IOCTL_CALL_SERVICE_SIZE(sizeof(SUPR0SERVICEREQHDR))));
1625 REQ_CHECK_EXPR(SUP_IOCTL_CALL_SERVICE, pSrvReq->u32Magic == SUPR0SERVICEREQHDR_MAGIC);
1626 REQ_CHECK_SIZES_EX(SUP_IOCTL_CALL_SERVICE, SUP_IOCTL_CALL_SERVICE_SIZE_IN(pSrvReq->cbReq), SUP_IOCTL_CALL_SERVICE_SIZE_OUT(pSrvReq->cbReq));
1627 }
1628 REQ_CHECK_EXPR(SUP_IOCTL_CALL_SERVICE, RTStrEnd(pReq->u.In.szName, sizeof(pReq->u.In.szName)));
1629
1630 /* execute */
1631 pReq->Hdr.rc = supdrvIOCtl_CallServiceModule(pDevExt, pSession, pReq);
1632 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1633 return 0;
1634 }
1635
1636 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_LOGGER_SETTINGS(0)):
1637 {
1638 /* validate */
1639 PSUPLOGGERSETTINGS pReq = (PSUPLOGGERSETTINGS)pReqHdr;
1640 size_t cbStrTab;
1641 REQ_CHECK_SIZE_OUT(SUP_IOCTL_LOGGER_SETTINGS, SUP_IOCTL_LOGGER_SETTINGS_SIZE_OUT);
1642 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->Hdr.cbIn >= SUP_IOCTL_LOGGER_SETTINGS_SIZE_IN(1));
1643 cbStrTab = pReq->Hdr.cbIn - SUP_IOCTL_LOGGER_SETTINGS_SIZE_IN(0);
1644 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->u.In.offGroups < cbStrTab);
1645 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->u.In.offFlags < cbStrTab);
1646 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->u.In.offDestination < cbStrTab);
1647 REQ_CHECK_EXPR_FMT(pReq->u.In.szStrings[cbStrTab - 1] == '\0',
1648 ("SUP_IOCTL_LOGGER_SETTINGS: cbIn=%#x cbStrTab=%#zx LastChar=%d\n",
1649 pReq->Hdr.cbIn, cbStrTab, pReq->u.In.szStrings[cbStrTab - 1]));
1650 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->u.In.fWhich <= SUPLOGGERSETTINGS_WHICH_RELEASE);
1651 REQ_CHECK_EXPR(SUP_IOCTL_LOGGER_SETTINGS, pReq->u.In.fWhat <= SUPLOGGERSETTINGS_WHAT_DESTROY);
1652
1653 /* execute */
1654 pReq->Hdr.rc = supdrvIOCtl_LoggerSettings(pDevExt, pSession, pReq);
1655 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1656 return 0;
1657 }
1658
1659 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_SEM_OP2):
1660 {
1661 /* validate */
1662 PSUPSEMOP2 pReq = (PSUPSEMOP2)pReqHdr;
1663 REQ_CHECK_SIZES_EX(SUP_IOCTL_SEM_OP2, SUP_IOCTL_SEM_OP2_SIZE_IN, SUP_IOCTL_SEM_OP2_SIZE_OUT);
1664 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP2, pReq->u.In.uReserved == 0);
1665
1666 /* execute */
1667 switch (pReq->u.In.uType)
1668 {
1669 case SUP_SEM_TYPE_EVENT:
1670 {
1671 SUPSEMEVENT hEvent = (SUPSEMEVENT)(uintptr_t)pReq->u.In.hSem;
1672 switch (pReq->u.In.uOp)
1673 {
1674 case SUPSEMOP2_WAIT_MS_REL:
1675 pReq->Hdr.rc = SUPSemEventWaitNoResume(pSession, hEvent, pReq->u.In.uArg.cRelMsTimeout);
1676 break;
1677 case SUPSEMOP2_WAIT_NS_ABS:
1678 pReq->Hdr.rc = SUPSemEventWaitNsAbsIntr(pSession, hEvent, pReq->u.In.uArg.uAbsNsTimeout);
1679 break;
1680 case SUPSEMOP2_WAIT_NS_REL:
1681 pReq->Hdr.rc = SUPSemEventWaitNsRelIntr(pSession, hEvent, pReq->u.In.uArg.cRelNsTimeout);
1682 break;
1683 case SUPSEMOP2_SIGNAL:
1684 pReq->Hdr.rc = SUPSemEventSignal(pSession, hEvent);
1685 break;
1686 case SUPSEMOP2_CLOSE:
1687 pReq->Hdr.rc = SUPSemEventClose(pSession, hEvent);
1688 break;
1689 case SUPSEMOP2_RESET:
1690 default:
1691 pReq->Hdr.rc = VERR_INVALID_FUNCTION;
1692 break;
1693 }
1694 break;
1695 }
1696
1697 case SUP_SEM_TYPE_EVENT_MULTI:
1698 {
1699 SUPSEMEVENTMULTI hEventMulti = (SUPSEMEVENTMULTI)(uintptr_t)pReq->u.In.hSem;
1700 switch (pReq->u.In.uOp)
1701 {
1702 case SUPSEMOP2_WAIT_MS_REL:
1703 pReq->Hdr.rc = SUPSemEventMultiWaitNoResume(pSession, hEventMulti, pReq->u.In.uArg.cRelMsTimeout);
1704 break;
1705 case SUPSEMOP2_WAIT_NS_ABS:
1706 pReq->Hdr.rc = SUPSemEventMultiWaitNsAbsIntr(pSession, hEventMulti, pReq->u.In.uArg.uAbsNsTimeout);
1707 break;
1708 case SUPSEMOP2_WAIT_NS_REL:
1709 pReq->Hdr.rc = SUPSemEventMultiWaitNsRelIntr(pSession, hEventMulti, pReq->u.In.uArg.cRelNsTimeout);
1710 break;
1711 case SUPSEMOP2_SIGNAL:
1712 pReq->Hdr.rc = SUPSemEventMultiSignal(pSession, hEventMulti);
1713 break;
1714 case SUPSEMOP2_CLOSE:
1715 pReq->Hdr.rc = SUPSemEventMultiClose(pSession, hEventMulti);
1716 break;
1717 case SUPSEMOP2_RESET:
1718 pReq->Hdr.rc = SUPSemEventMultiReset(pSession, hEventMulti);
1719 break;
1720 default:
1721 pReq->Hdr.rc = VERR_INVALID_FUNCTION;
1722 break;
1723 }
1724 break;
1725 }
1726
1727 default:
1728 pReq->Hdr.rc = VERR_INVALID_PARAMETER;
1729 break;
1730 }
1731 return 0;
1732 }
1733
1734 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_SEM_OP3):
1735 {
1736 /* validate */
1737 PSUPSEMOP3 pReq = (PSUPSEMOP3)pReqHdr;
1738 REQ_CHECK_SIZES_EX(SUP_IOCTL_SEM_OP3, SUP_IOCTL_SEM_OP3_SIZE_IN, SUP_IOCTL_SEM_OP3_SIZE_OUT);
1739 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP3, pReq->u.In.u32Reserved == 0 && pReq->u.In.u64Reserved == 0);
1740
1741 /* execute */
1742 switch (pReq->u.In.uType)
1743 {
1744 case SUP_SEM_TYPE_EVENT:
1745 {
1746 SUPSEMEVENT hEvent = (SUPSEMEVENT)(uintptr_t)pReq->u.In.hSem;
1747 switch (pReq->u.In.uOp)
1748 {
1749 case SUPSEMOP3_CREATE:
1750 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP3, hEvent == NIL_SUPSEMEVENT);
1751 pReq->Hdr.rc = SUPSemEventCreate(pSession, &hEvent);
1752 pReq->u.Out.hSem = (uint32_t)(uintptr_t)hEvent;
1753 break;
1754 case SUPSEMOP3_GET_RESOLUTION:
1755 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP3, hEvent == NIL_SUPSEMEVENT);
1756 pReq->Hdr.rc = VINF_SUCCESS;
1757 pReq->Hdr.cbOut = sizeof(*pReq);
1758 pReq->u.Out.cNsResolution = SUPSemEventGetResolution(pSession);
1759 break;
1760 default:
1761 pReq->Hdr.rc = VERR_INVALID_FUNCTION;
1762 break;
1763 }
1764 break;
1765 }
1766
1767 case SUP_SEM_TYPE_EVENT_MULTI:
1768 {
1769 SUPSEMEVENTMULTI hEventMulti = (SUPSEMEVENTMULTI)(uintptr_t)pReq->u.In.hSem;
1770 switch (pReq->u.In.uOp)
1771 {
1772 case SUPSEMOP3_CREATE:
1773 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP3, hEventMulti == NIL_SUPSEMEVENTMULTI);
1774 pReq->Hdr.rc = SUPSemEventMultiCreate(pSession, &hEventMulti);
1775 pReq->u.Out.hSem = (uint32_t)(uintptr_t)hEventMulti;
1776 break;
1777 case SUPSEMOP3_GET_RESOLUTION:
1778 REQ_CHECK_EXPR(SUP_IOCTL_SEM_OP3, hEventMulti == NIL_SUPSEMEVENTMULTI);
1779 pReq->Hdr.rc = VINF_SUCCESS;
1780 pReq->u.Out.cNsResolution = SUPSemEventMultiGetResolution(pSession);
1781 break;
1782 default:
1783 pReq->Hdr.rc = VERR_INVALID_FUNCTION;
1784 break;
1785 }
1786 break;
1787 }
1788
1789 default:
1790 pReq->Hdr.rc = VERR_INVALID_PARAMETER;
1791 break;
1792 }
1793 return 0;
1794 }
1795
1796 case SUP_CTL_CODE_NO_SIZE(SUP_IOCTL_VT_CAPS):
1797 {
1798 /* validate */
1799 PSUPVTCAPS pReq = (PSUPVTCAPS)pReqHdr;
1800 REQ_CHECK_SIZES(SUP_IOCTL_VT_CAPS);
1801 REQ_CHECK_EXPR(SUP_IOCTL_VT_CAPS, pReq->Hdr.cbIn <= SUP_IOCTL_VT_CAPS_SIZE_IN);
1802
1803 /* execute */
1804 pReq->Hdr.rc = SUPR0QueryVTCaps(pSession, &pReq->u.Out.Caps);
1805 if (RT_FAILURE(pReq->Hdr.rc))
1806 pReq->Hdr.cbOut = sizeof(pReq->Hdr);
1807 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VINF_SUCCESS, pReq->Hdr.rc);
1808 return 0;
1809 }
1810
1811 default:
1812 Log(("Unknown IOCTL %#lx\n", (long)uIOCtl));
1813 break;
1814 }
1815 VBOXDRV_IOCTL_RETURN(pSession, uIOCtl, pReqHdr, VERR_GENERAL_FAILURE, VERR_GENERAL_FAILURE);
1816 return VERR_GENERAL_FAILURE;
1817}
1818
1819
1820/**
1821 * Inter-Driver Communication (IDC) worker.
1822 *
1823 * @returns VBox status code.
1824 * @retval VINF_SUCCESS on success.
1825 * @retval VERR_INVALID_PARAMETER if the request is invalid.
1826 * @retval VERR_NOT_SUPPORTED if the request isn't supported.
1827 *
1828 * @param uReq The request (function) code.
1829 * @param pDevExt Device extention.
1830 * @param pSession Session data.
1831 * @param pReqHdr The request header.
1832 */
1833int VBOXCALL supdrvIDC(uintptr_t uReq, PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPDRVIDCREQHDR pReqHdr)
1834{
1835 /*
1836 * The OS specific code has already validated the pSession
1837 * pointer, and the request size being greater or equal to
1838 * size of the header.
1839 *
1840 * So, just check that pSession is a kernel context session.
1841 */
1842 if (RT_UNLIKELY( pSession
1843 && pSession->R0Process != NIL_RTR0PROCESS))
1844 return VERR_INVALID_PARAMETER;
1845
1846/*
1847 * Validation macro.
1848 */
1849#define REQ_CHECK_IDC_SIZE(Name, cbExpect) \
1850 do { \
1851 if (RT_UNLIKELY(pReqHdr->cb != (cbExpect))) \
1852 { \
1853 OSDBGPRINT(( #Name ": Invalid input/output sizes. cb=%ld expected %ld.\n", \
1854 (long)pReqHdr->cb, (long)(cbExpect))); \
1855 return pReqHdr->rc = VERR_INVALID_PARAMETER; \
1856 } \
1857 } while (0)
1858
1859 switch (uReq)
1860 {
1861 case SUPDRV_IDC_REQ_CONNECT:
1862 {
1863 PSUPDRVIDCREQCONNECT pReq = (PSUPDRVIDCREQCONNECT)pReqHdr;
1864 REQ_CHECK_IDC_SIZE(SUPDRV_IDC_REQ_CONNECT, sizeof(*pReq));
1865
1866 /*
1867 * Validate the cookie and other input.
1868 */
1869 if (pReq->Hdr.pSession != NULL)
1870 {
1871 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: Hdr.pSession=%p expected NULL!\n", pReq->Hdr.pSession));
1872 return pReqHdr->rc = VERR_INVALID_PARAMETER;
1873 }
1874 if (pReq->u.In.u32MagicCookie != SUPDRVIDCREQ_CONNECT_MAGIC_COOKIE)
1875 {
1876 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: u32MagicCookie=%#x expected %#x!\n",
1877 (unsigned)pReq->u.In.u32MagicCookie, (unsigned)SUPDRVIDCREQ_CONNECT_MAGIC_COOKIE));
1878 return pReqHdr->rc = VERR_INVALID_PARAMETER;
1879 }
1880 if ( pReq->u.In.uMinVersion > pReq->u.In.uReqVersion
1881 || (pReq->u.In.uMinVersion & UINT32_C(0xffff0000)) != (pReq->u.In.uReqVersion & UINT32_C(0xffff0000)))
1882 {
1883 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: uMinVersion=%#x uMaxVersion=%#x doesn't match!\n",
1884 pReq->u.In.uMinVersion, pReq->u.In.uReqVersion));
1885 return pReqHdr->rc = VERR_INVALID_PARAMETER;
1886 }
1887 if (pSession != NULL)
1888 {
1889 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: pSession=%p expected NULL!\n", pSession));
1890 return pReqHdr->rc = VERR_INVALID_PARAMETER;
1891 }
1892
1893 /*
1894 * Match the version.
1895 * The current logic is very simple, match the major interface version.
1896 */
1897 if ( pReq->u.In.uMinVersion > SUPDRV_IDC_VERSION
1898 || (pReq->u.In.uMinVersion & 0xffff0000) != (SUPDRV_IDC_VERSION & 0xffff0000))
1899 {
1900 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: Version mismatch. Requested: %#x Min: %#x Current: %#x\n",
1901 pReq->u.In.uReqVersion, pReq->u.In.uMinVersion, (unsigned)SUPDRV_IDC_VERSION));
1902 pReq->u.Out.pSession = NULL;
1903 pReq->u.Out.uSessionVersion = 0xffffffff;
1904 pReq->u.Out.uDriverVersion = SUPDRV_IDC_VERSION;
1905 pReq->u.Out.uDriverRevision = VBOX_SVN_REV;
1906 pReq->Hdr.rc = VERR_VERSION_MISMATCH;
1907 return VINF_SUCCESS;
1908 }
1909
1910 pReq->u.Out.pSession = NULL;
1911 pReq->u.Out.uSessionVersion = SUPDRV_IDC_VERSION;
1912 pReq->u.Out.uDriverVersion = SUPDRV_IDC_VERSION;
1913 pReq->u.Out.uDriverRevision = VBOX_SVN_REV;
1914
1915 pReq->Hdr.rc = supdrvCreateSession(pDevExt, false /* fUser */, &pSession);
1916 if (RT_FAILURE(pReq->Hdr.rc))
1917 {
1918 OSDBGPRINT(("SUPDRV_IDC_REQ_CONNECT: failed to create session, rc=%d\n", pReq->Hdr.rc));
1919 return VINF_SUCCESS;
1920 }
1921
1922 pReq->u.Out.pSession = pSession;
1923 pReq->Hdr.pSession = pSession;
1924
1925 return VINF_SUCCESS;
1926 }
1927
1928 case SUPDRV_IDC_REQ_DISCONNECT:
1929 {
1930 REQ_CHECK_IDC_SIZE(SUPDRV_IDC_REQ_DISCONNECT, sizeof(*pReqHdr));
1931
1932 supdrvCloseSession(pDevExt, pSession);
1933 return pReqHdr->rc = VINF_SUCCESS;
1934 }
1935
1936 case SUPDRV_IDC_REQ_GET_SYMBOL:
1937 {
1938 PSUPDRVIDCREQGETSYM pReq = (PSUPDRVIDCREQGETSYM)pReqHdr;
1939 REQ_CHECK_IDC_SIZE(SUPDRV_IDC_REQ_GET_SYMBOL, sizeof(*pReq));
1940
1941 pReq->Hdr.rc = supdrvIDC_LdrGetSymbol(pDevExt, pSession, pReq);
1942 return VINF_SUCCESS;
1943 }
1944
1945 case SUPDRV_IDC_REQ_COMPONENT_REGISTER_FACTORY:
1946 {
1947 PSUPDRVIDCREQCOMPREGFACTORY pReq = (PSUPDRVIDCREQCOMPREGFACTORY)pReqHdr;
1948 REQ_CHECK_IDC_SIZE(SUPDRV_IDC_REQ_COMPONENT_REGISTER_FACTORY, sizeof(*pReq));
1949
1950 pReq->Hdr.rc = SUPR0ComponentRegisterFactory(pSession, pReq->u.In.pFactory);
1951 return VINF_SUCCESS;
1952 }
1953
1954 case SUPDRV_IDC_REQ_COMPONENT_DEREGISTER_FACTORY:
1955 {
1956 PSUPDRVIDCREQCOMPDEREGFACTORY pReq = (PSUPDRVIDCREQCOMPDEREGFACTORY)pReqHdr;
1957 REQ_CHECK_IDC_SIZE(SUPDRV_IDC_REQ_COMPONENT_DEREGISTER_FACTORY, sizeof(*pReq));
1958
1959 pReq->Hdr.rc = SUPR0ComponentDeregisterFactory(pSession, pReq->u.In.pFactory);
1960 return VINF_SUCCESS;
1961 }
1962
1963 default:
1964 Log(("Unknown IDC %#lx\n", (long)uReq));
1965 break;
1966 }
1967
1968#undef REQ_CHECK_IDC_SIZE
1969 return VERR_NOT_SUPPORTED;
1970}
1971
1972
1973/**
1974 * Register a object for reference counting.
1975 * The object is registered with one reference in the specified session.
1976 *
1977 * @returns Unique identifier on success (pointer).
1978 * All future reference must use this identifier.
1979 * @returns NULL on failure.
1980 * @param pfnDestructor The destructore function which will be called when the reference count reaches 0.
1981 * @param pvUser1 The first user argument.
1982 * @param pvUser2 The second user argument.
1983 */
1984SUPR0DECL(void *) SUPR0ObjRegister(PSUPDRVSESSION pSession, SUPDRVOBJTYPE enmType, PFNSUPDRVDESTRUCTOR pfnDestructor, void *pvUser1, void *pvUser2)
1985{
1986 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
1987 PSUPDRVDEVEXT pDevExt = pSession->pDevExt;
1988 PSUPDRVOBJ pObj;
1989 PSUPDRVUSAGE pUsage;
1990
1991 /*
1992 * Validate the input.
1993 */
1994 AssertReturn(SUP_IS_SESSION_VALID(pSession), NULL);
1995 AssertReturn(enmType > SUPDRVOBJTYPE_INVALID && enmType < SUPDRVOBJTYPE_END, NULL);
1996 AssertPtrReturn(pfnDestructor, NULL);
1997
1998 /*
1999 * Allocate and initialize the object.
2000 */
2001 pObj = (PSUPDRVOBJ)RTMemAlloc(sizeof(*pObj));
2002 if (!pObj)
2003 return NULL;
2004 pObj->u32Magic = SUPDRVOBJ_MAGIC;
2005 pObj->enmType = enmType;
2006 pObj->pNext = NULL;
2007 pObj->cUsage = 1;
2008 pObj->pfnDestructor = pfnDestructor;
2009 pObj->pvUser1 = pvUser1;
2010 pObj->pvUser2 = pvUser2;
2011 pObj->CreatorUid = pSession->Uid;
2012 pObj->CreatorGid = pSession->Gid;
2013 pObj->CreatorProcess= pSession->Process;
2014 supdrvOSObjInitCreator(pObj, pSession);
2015
2016 /*
2017 * Allocate the usage record.
2018 * (We keep freed usage records around to simplify SUPR0ObjAddRefEx().)
2019 */
2020 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
2021
2022 pUsage = pDevExt->pUsageFree;
2023 if (pUsage)
2024 pDevExt->pUsageFree = pUsage->pNext;
2025 else
2026 {
2027 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2028 pUsage = (PSUPDRVUSAGE)RTMemAlloc(sizeof(*pUsage));
2029 if (!pUsage)
2030 {
2031 RTMemFree(pObj);
2032 return NULL;
2033 }
2034 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
2035 }
2036
2037 /*
2038 * Insert the object and create the session usage record.
2039 */
2040 /* The object. */
2041 pObj->pNext = pDevExt->pObjs;
2042 pDevExt->pObjs = pObj;
2043
2044 /* The session record. */
2045 pUsage->cUsage = 1;
2046 pUsage->pObj = pObj;
2047 pUsage->pNext = pSession->pUsage;
2048 /* Log2(("SUPR0ObjRegister: pUsage=%p:{.pObj=%p, .pNext=%p}\n", pUsage, pUsage->pObj, pUsage->pNext)); */
2049 pSession->pUsage = pUsage;
2050
2051 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2052
2053 Log(("SUPR0ObjRegister: returns %p (pvUser1=%p, pvUser=%p)\n", pObj, pvUser1, pvUser2));
2054 return pObj;
2055}
2056
2057
2058/**
2059 * Increment the reference counter for the object associating the reference
2060 * with the specified session.
2061 *
2062 * @returns IPRT status code.
2063 * @param pvObj The identifier returned by SUPR0ObjRegister().
2064 * @param pSession The session which is referencing the object.
2065 *
2066 * @remarks The caller should not own any spinlocks and must carefully protect
2067 * itself against potential race with the destructor so freed memory
2068 * isn't accessed here.
2069 */
2070SUPR0DECL(int) SUPR0ObjAddRef(void *pvObj, PSUPDRVSESSION pSession)
2071{
2072 return SUPR0ObjAddRefEx(pvObj, pSession, false /* fNoBlocking */);
2073}
2074
2075
2076/**
2077 * Increment the reference counter for the object associating the reference
2078 * with the specified session.
2079 *
2080 * @returns IPRT status code.
2081 * @retval VERR_TRY_AGAIN if fNoBlocking was set and a new usage record
2082 * couldn't be allocated. (If you see this you're not doing the right
2083 * thing and it won't ever work reliably.)
2084 *
2085 * @param pvObj The identifier returned by SUPR0ObjRegister().
2086 * @param pSession The session which is referencing the object.
2087 * @param fNoBlocking Set if it's not OK to block. Never try to make the
2088 * first reference to an object in a session with this
2089 * argument set.
2090 *
2091 * @remarks The caller should not own any spinlocks and must carefully protect
2092 * itself against potential race with the destructor so freed memory
2093 * isn't accessed here.
2094 */
2095SUPR0DECL(int) SUPR0ObjAddRefEx(void *pvObj, PSUPDRVSESSION pSession, bool fNoBlocking)
2096{
2097 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
2098 PSUPDRVDEVEXT pDevExt = pSession->pDevExt;
2099 PSUPDRVOBJ pObj = (PSUPDRVOBJ)pvObj;
2100 int rc = VINF_SUCCESS;
2101 PSUPDRVUSAGE pUsagePre;
2102 PSUPDRVUSAGE pUsage;
2103
2104 /*
2105 * Validate the input.
2106 * Be ready for the destruction race (someone might be stuck in the
2107 * destructor waiting a lock we own).
2108 */
2109 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2110 AssertPtrReturn(pObj, VERR_INVALID_POINTER);
2111 AssertMsgReturn(pObj->u32Magic == SUPDRVOBJ_MAGIC || pObj->u32Magic == SUPDRVOBJ_MAGIC_DEAD,
2112 ("Invalid pvObj=%p magic=%#x (expected %#x or %#x)\n", pvObj, pObj->u32Magic, SUPDRVOBJ_MAGIC, SUPDRVOBJ_MAGIC_DEAD),
2113 VERR_INVALID_PARAMETER);
2114
2115 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
2116
2117 if (RT_UNLIKELY(pObj->u32Magic != SUPDRVOBJ_MAGIC))
2118 {
2119 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2120
2121 AssertMsgFailed(("pvObj=%p magic=%#x\n", pvObj, pObj->u32Magic));
2122 return VERR_WRONG_ORDER;
2123 }
2124
2125 /*
2126 * Preallocate the usage record if we can.
2127 */
2128 pUsagePre = pDevExt->pUsageFree;
2129 if (pUsagePre)
2130 pDevExt->pUsageFree = pUsagePre->pNext;
2131 else if (!fNoBlocking)
2132 {
2133 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2134 pUsagePre = (PSUPDRVUSAGE)RTMemAlloc(sizeof(*pUsagePre));
2135 if (!pUsagePre)
2136 return VERR_NO_MEMORY;
2137
2138 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
2139 if (RT_UNLIKELY(pObj->u32Magic != SUPDRVOBJ_MAGIC))
2140 {
2141 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2142
2143 AssertMsgFailed(("pvObj=%p magic=%#x\n", pvObj, pObj->u32Magic));
2144 return VERR_WRONG_ORDER;
2145 }
2146 }
2147
2148 /*
2149 * Reference the object.
2150 */
2151 pObj->cUsage++;
2152
2153 /*
2154 * Look for the session record.
2155 */
2156 for (pUsage = pSession->pUsage; pUsage; pUsage = pUsage->pNext)
2157 {
2158 /*Log(("SUPR0AddRef: pUsage=%p:{.pObj=%p, .pNext=%p}\n", pUsage, pUsage->pObj, pUsage->pNext));*/
2159 if (pUsage->pObj == pObj)
2160 break;
2161 }
2162 if (pUsage)
2163 pUsage->cUsage++;
2164 else if (pUsagePre)
2165 {
2166 /* create a new session record. */
2167 pUsagePre->cUsage = 1;
2168 pUsagePre->pObj = pObj;
2169 pUsagePre->pNext = pSession->pUsage;
2170 pSession->pUsage = pUsagePre;
2171 /*Log(("SUPR0AddRef: pUsagePre=%p:{.pObj=%p, .pNext=%p}\n", pUsagePre, pUsagePre->pObj, pUsagePre->pNext));*/
2172
2173 pUsagePre = NULL;
2174 }
2175 else
2176 {
2177 pObj->cUsage--;
2178 rc = VERR_TRY_AGAIN;
2179 }
2180
2181 /*
2182 * Put any unused usage record into the free list..
2183 */
2184 if (pUsagePre)
2185 {
2186 pUsagePre->pNext = pDevExt->pUsageFree;
2187 pDevExt->pUsageFree = pUsagePre;
2188 }
2189
2190 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2191
2192 return rc;
2193}
2194
2195
2196/**
2197 * Decrement / destroy a reference counter record for an object.
2198 *
2199 * The object is uniquely identified by pfnDestructor+pvUser1+pvUser2.
2200 *
2201 * @returns IPRT status code.
2202 * @retval VINF_SUCCESS if not destroyed.
2203 * @retval VINF_OBJECT_DESTROYED if it's destroyed by this release call.
2204 * @retval VERR_INVALID_PARAMETER if the object isn't valid. Will assert in
2205 * string builds.
2206 *
2207 * @param pvObj The identifier returned by SUPR0ObjRegister().
2208 * @param pSession The session which is referencing the object.
2209 */
2210SUPR0DECL(int) SUPR0ObjRelease(void *pvObj, PSUPDRVSESSION pSession)
2211{
2212 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
2213 PSUPDRVDEVEXT pDevExt = pSession->pDevExt;
2214 PSUPDRVOBJ pObj = (PSUPDRVOBJ)pvObj;
2215 int rc = VERR_INVALID_PARAMETER;
2216 PSUPDRVUSAGE pUsage;
2217 PSUPDRVUSAGE pUsagePrev;
2218
2219 /*
2220 * Validate the input.
2221 */
2222 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2223 AssertMsgReturn(VALID_PTR(pObj) && pObj->u32Magic == SUPDRVOBJ_MAGIC,
2224 ("Invalid pvObj=%p magic=%#x (exepcted %#x)\n", pvObj, pObj ? pObj->u32Magic : 0, SUPDRVOBJ_MAGIC),
2225 VERR_INVALID_PARAMETER);
2226
2227 /*
2228 * Acquire the spinlock and look for the usage record.
2229 */
2230 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
2231
2232 for (pUsagePrev = NULL, pUsage = pSession->pUsage;
2233 pUsage;
2234 pUsagePrev = pUsage, pUsage = pUsage->pNext)
2235 {
2236 /*Log2(("SUPR0ObjRelease: pUsage=%p:{.pObj=%p, .pNext=%p}\n", pUsage, pUsage->pObj, pUsage->pNext));*/
2237 if (pUsage->pObj == pObj)
2238 {
2239 rc = VINF_SUCCESS;
2240 AssertMsg(pUsage->cUsage >= 1 && pObj->cUsage >= pUsage->cUsage, ("glob %d; sess %d\n", pObj->cUsage, pUsage->cUsage));
2241 if (pUsage->cUsage > 1)
2242 {
2243 pObj->cUsage--;
2244 pUsage->cUsage--;
2245 }
2246 else
2247 {
2248 /*
2249 * Free the session record.
2250 */
2251 if (pUsagePrev)
2252 pUsagePrev->pNext = pUsage->pNext;
2253 else
2254 pSession->pUsage = pUsage->pNext;
2255 pUsage->pNext = pDevExt->pUsageFree;
2256 pDevExt->pUsageFree = pUsage;
2257
2258 /* What about the object? */
2259 if (pObj->cUsage > 1)
2260 pObj->cUsage--;
2261 else
2262 {
2263 /*
2264 * Object is to be destroyed, unlink it.
2265 */
2266 pObj->u32Magic = SUPDRVOBJ_MAGIC_DEAD;
2267 rc = VINF_OBJECT_DESTROYED;
2268 if (pDevExt->pObjs == pObj)
2269 pDevExt->pObjs = pObj->pNext;
2270 else
2271 {
2272 PSUPDRVOBJ pObjPrev;
2273 for (pObjPrev = pDevExt->pObjs; pObjPrev; pObjPrev = pObjPrev->pNext)
2274 if (pObjPrev->pNext == pObj)
2275 {
2276 pObjPrev->pNext = pObj->pNext;
2277 break;
2278 }
2279 Assert(pObjPrev);
2280 }
2281 }
2282 }
2283 break;
2284 }
2285 }
2286
2287 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
2288
2289 /*
2290 * Call the destructor and free the object if required.
2291 */
2292 if (rc == VINF_OBJECT_DESTROYED)
2293 {
2294 Log(("SUPR0ObjRelease: destroying %p/%d (%p/%p) cpid=%RTproc pid=%RTproc dtor=%p\n",
2295 pObj, pObj->enmType, pObj->pvUser1, pObj->pvUser2, pObj->CreatorProcess, RTProcSelf(), pObj->pfnDestructor));
2296 if (pObj->pfnDestructor)
2297 pObj->pfnDestructor(pObj, pObj->pvUser1, pObj->pvUser2);
2298 RTMemFree(pObj);
2299 }
2300
2301 AssertMsg(pUsage, ("pvObj=%p\n", pvObj));
2302 return rc;
2303}
2304
2305
2306/**
2307 * Verifies that the current process can access the specified object.
2308 *
2309 * @returns The following IPRT status code:
2310 * @retval VINF_SUCCESS if access was granted.
2311 * @retval VERR_PERMISSION_DENIED if denied access.
2312 * @retval VERR_INVALID_PARAMETER if invalid parameter.
2313 *
2314 * @param pvObj The identifier returned by SUPR0ObjRegister().
2315 * @param pSession The session which wishes to access the object.
2316 * @param pszObjName Object string name. This is optional and depends on the object type.
2317 *
2318 * @remark The caller is responsible for making sure the object isn't removed while
2319 * we're inside this function. If uncertain about this, just call AddRef before calling us.
2320 */
2321SUPR0DECL(int) SUPR0ObjVerifyAccess(void *pvObj, PSUPDRVSESSION pSession, const char *pszObjName)
2322{
2323 PSUPDRVOBJ pObj = (PSUPDRVOBJ)pvObj;
2324 int rc;
2325
2326 /*
2327 * Validate the input.
2328 */
2329 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2330 AssertMsgReturn(VALID_PTR(pObj) && pObj->u32Magic == SUPDRVOBJ_MAGIC,
2331 ("Invalid pvObj=%p magic=%#x (exepcted %#x)\n", pvObj, pObj ? pObj->u32Magic : 0, SUPDRVOBJ_MAGIC),
2332 VERR_INVALID_PARAMETER);
2333
2334 /*
2335 * Check access. (returns true if a decision has been made.)
2336 */
2337 rc = VERR_INTERNAL_ERROR;
2338 if (supdrvOSObjCanAccess(pObj, pSession, pszObjName, &rc))
2339 return rc;
2340
2341 /*
2342 * Default policy is to allow the user to access his own
2343 * stuff but nothing else.
2344 */
2345 if (pObj->CreatorUid == pSession->Uid)
2346 return VINF_SUCCESS;
2347 return VERR_PERMISSION_DENIED;
2348}
2349
2350
2351/**
2352 * Lock pages.
2353 *
2354 * @returns IPRT status code.
2355 * @param pSession Session to which the locked memory should be associated.
2356 * @param pvR3 Start of the memory range to lock.
2357 * This must be page aligned.
2358 * @param cPages Number of pages to lock.
2359 * @param paPages Where to put the physical addresses of locked memory.
2360 */
2361SUPR0DECL(int) SUPR0LockMem(PSUPDRVSESSION pSession, RTR3PTR pvR3, uint32_t cPages, PRTHCPHYS paPages)
2362{
2363 int rc;
2364 SUPDRVMEMREF Mem = { NIL_RTR0MEMOBJ, NIL_RTR0MEMOBJ, MEMREF_TYPE_UNUSED };
2365 const size_t cb = (size_t)cPages << PAGE_SHIFT;
2366 LogFlow(("SUPR0LockMem: pSession=%p pvR3=%p cPages=%d paPages=%p\n", pSession, (void *)pvR3, cPages, paPages));
2367
2368 /*
2369 * Verify input.
2370 */
2371 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2372 AssertPtrReturn(paPages, VERR_INVALID_PARAMETER);
2373 if ( RT_ALIGN_R3PT(pvR3, PAGE_SIZE, RTR3PTR) != pvR3
2374 || !pvR3)
2375 {
2376 Log(("pvR3 (%p) must be page aligned and not NULL!\n", (void *)pvR3));
2377 return VERR_INVALID_PARAMETER;
2378 }
2379
2380 /*
2381 * Let IPRT do the job.
2382 */
2383 Mem.eType = MEMREF_TYPE_LOCKED;
2384 rc = RTR0MemObjLockUser(&Mem.MemObj, pvR3, cb, RTMEM_PROT_READ | RTMEM_PROT_WRITE, RTR0ProcHandleSelf());
2385 if (RT_SUCCESS(rc))
2386 {
2387 uint32_t iPage = cPages;
2388 AssertMsg(RTR0MemObjAddressR3(Mem.MemObj) == pvR3, ("%p == %p\n", RTR0MemObjAddressR3(Mem.MemObj), pvR3));
2389 AssertMsg(RTR0MemObjSize(Mem.MemObj) == cb, ("%x == %x\n", RTR0MemObjSize(Mem.MemObj), cb));
2390
2391 while (iPage-- > 0)
2392 {
2393 paPages[iPage] = RTR0MemObjGetPagePhysAddr(Mem.MemObj, iPage);
2394 if (RT_UNLIKELY(paPages[iPage] == NIL_RTCCPHYS))
2395 {
2396 AssertMsgFailed(("iPage=%d\n", iPage));
2397 rc = VERR_INTERNAL_ERROR;
2398 break;
2399 }
2400 }
2401 if (RT_SUCCESS(rc))
2402 rc = supdrvMemAdd(&Mem, pSession);
2403 if (RT_FAILURE(rc))
2404 {
2405 int rc2 = RTR0MemObjFree(Mem.MemObj, false);
2406 AssertRC(rc2);
2407 }
2408 }
2409
2410 return rc;
2411}
2412
2413
2414/**
2415 * Unlocks the memory pointed to by pv.
2416 *
2417 * @returns IPRT status code.
2418 * @param pSession Session to which the memory was locked.
2419 * @param pvR3 Memory to unlock.
2420 */
2421SUPR0DECL(int) SUPR0UnlockMem(PSUPDRVSESSION pSession, RTR3PTR pvR3)
2422{
2423 LogFlow(("SUPR0UnlockMem: pSession=%p pvR3=%p\n", pSession, (void *)pvR3));
2424 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2425 return supdrvMemRelease(pSession, (RTHCUINTPTR)pvR3, MEMREF_TYPE_LOCKED);
2426}
2427
2428
2429/**
2430 * Allocates a chunk of page aligned memory with contiguous and fixed physical
2431 * backing.
2432 *
2433 * @returns IPRT status code.
2434 * @param pSession Session data.
2435 * @param cPages Number of pages to allocate.
2436 * @param ppvR0 Where to put the address of Ring-0 mapping the allocated memory.
2437 * @param ppvR3 Where to put the address of Ring-3 mapping the allocated memory.
2438 * @param pHCPhys Where to put the physical address of allocated memory.
2439 */
2440SUPR0DECL(int) SUPR0ContAlloc(PSUPDRVSESSION pSession, uint32_t cPages, PRTR0PTR ppvR0, PRTR3PTR ppvR3, PRTHCPHYS pHCPhys)
2441{
2442 int rc;
2443 SUPDRVMEMREF Mem = { NIL_RTR0MEMOBJ, NIL_RTR0MEMOBJ, MEMREF_TYPE_UNUSED };
2444 LogFlow(("SUPR0ContAlloc: pSession=%p cPages=%d ppvR0=%p ppvR3=%p pHCPhys=%p\n", pSession, cPages, ppvR0, ppvR3, pHCPhys));
2445
2446 /*
2447 * Validate input.
2448 */
2449 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2450 if (!ppvR3 || !ppvR0 || !pHCPhys)
2451 {
2452 Log(("Null pointer. All of these should be set: pSession=%p ppvR0=%p ppvR3=%p pHCPhys=%p\n",
2453 pSession, ppvR0, ppvR3, pHCPhys));
2454 return VERR_INVALID_PARAMETER;
2455
2456 }
2457 if (cPages < 1 || cPages >= 256)
2458 {
2459 Log(("Illegal request cPages=%d, must be greater than 0 and smaller than 256.\n", cPages));
2460 return VERR_PAGE_COUNT_OUT_OF_RANGE;
2461 }
2462
2463 /*
2464 * Let IPRT do the job.
2465 */
2466 rc = RTR0MemObjAllocCont(&Mem.MemObj, cPages << PAGE_SHIFT, true /* executable R0 mapping */);
2467 if (RT_SUCCESS(rc))
2468 {
2469 int rc2;
2470 rc = RTR0MemObjMapUser(&Mem.MapObjR3, Mem.MemObj, (RTR3PTR)-1, 0,
2471 RTMEM_PROT_EXEC | RTMEM_PROT_WRITE | RTMEM_PROT_READ, RTR0ProcHandleSelf());
2472 if (RT_SUCCESS(rc))
2473 {
2474 Mem.eType = MEMREF_TYPE_CONT;
2475 rc = supdrvMemAdd(&Mem, pSession);
2476 if (!rc)
2477 {
2478 *ppvR0 = RTR0MemObjAddress(Mem.MemObj);
2479 *ppvR3 = RTR0MemObjAddressR3(Mem.MapObjR3);
2480 *pHCPhys = RTR0MemObjGetPagePhysAddr(Mem.MemObj, 0);
2481 return 0;
2482 }
2483
2484 rc2 = RTR0MemObjFree(Mem.MapObjR3, false);
2485 AssertRC(rc2);
2486 }
2487 rc2 = RTR0MemObjFree(Mem.MemObj, false);
2488 AssertRC(rc2);
2489 }
2490
2491 return rc;
2492}
2493
2494
2495/**
2496 * Frees memory allocated using SUPR0ContAlloc().
2497 *
2498 * @returns IPRT status code.
2499 * @param pSession The session to which the memory was allocated.
2500 * @param uPtr Pointer to the memory (ring-3 or ring-0).
2501 */
2502SUPR0DECL(int) SUPR0ContFree(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr)
2503{
2504 LogFlow(("SUPR0ContFree: pSession=%p uPtr=%p\n", pSession, (void *)uPtr));
2505 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2506 return supdrvMemRelease(pSession, uPtr, MEMREF_TYPE_CONT);
2507}
2508
2509
2510/**
2511 * Allocates a chunk of page aligned memory with fixed physical backing below 4GB.
2512 *
2513 * The memory isn't zeroed.
2514 *
2515 * @returns IPRT status code.
2516 * @param pSession Session data.
2517 * @param cPages Number of pages to allocate.
2518 * @param ppvR0 Where to put the address of Ring-0 mapping of the allocated memory.
2519 * @param ppvR3 Where to put the address of Ring-3 mapping of the allocated memory.
2520 * @param paPages Where to put the physical addresses of allocated memory.
2521 */
2522SUPR0DECL(int) SUPR0LowAlloc(PSUPDRVSESSION pSession, uint32_t cPages, PRTR0PTR ppvR0, PRTR3PTR ppvR3, PRTHCPHYS paPages)
2523{
2524 unsigned iPage;
2525 int rc;
2526 SUPDRVMEMREF Mem = { NIL_RTR0MEMOBJ, NIL_RTR0MEMOBJ, MEMREF_TYPE_UNUSED };
2527 LogFlow(("SUPR0LowAlloc: pSession=%p cPages=%d ppvR3=%p ppvR0=%p paPages=%p\n", pSession, cPages, ppvR3, ppvR0, paPages));
2528
2529 /*
2530 * Validate input.
2531 */
2532 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2533 if (!ppvR3 || !ppvR0 || !paPages)
2534 {
2535 Log(("Null pointer. All of these should be set: pSession=%p ppvR3=%p ppvR0=%p paPages=%p\n",
2536 pSession, ppvR3, ppvR0, paPages));
2537 return VERR_INVALID_PARAMETER;
2538
2539 }
2540 if (cPages < 1 || cPages >= 256)
2541 {
2542 Log(("Illegal request cPages=%d, must be greater than 0 and smaller than 256.\n", cPages));
2543 return VERR_PAGE_COUNT_OUT_OF_RANGE;
2544 }
2545
2546 /*
2547 * Let IPRT do the work.
2548 */
2549 rc = RTR0MemObjAllocLow(&Mem.MemObj, cPages << PAGE_SHIFT, true /* executable ring-0 mapping */);
2550 if (RT_SUCCESS(rc))
2551 {
2552 int rc2;
2553 rc = RTR0MemObjMapUser(&Mem.MapObjR3, Mem.MemObj, (RTR3PTR)-1, 0,
2554 RTMEM_PROT_EXEC | RTMEM_PROT_WRITE | RTMEM_PROT_READ, RTR0ProcHandleSelf());
2555 if (RT_SUCCESS(rc))
2556 {
2557 Mem.eType = MEMREF_TYPE_LOW;
2558 rc = supdrvMemAdd(&Mem, pSession);
2559 if (!rc)
2560 {
2561 for (iPage = 0; iPage < cPages; iPage++)
2562 {
2563 paPages[iPage] = RTR0MemObjGetPagePhysAddr(Mem.MemObj, iPage);
2564 AssertMsg(!(paPages[iPage] & (PAGE_SIZE - 1)), ("iPage=%d Phys=%RHp\n", paPages[iPage]));
2565 }
2566 *ppvR0 = RTR0MemObjAddress(Mem.MemObj);
2567 *ppvR3 = RTR0MemObjAddressR3(Mem.MapObjR3);
2568 return 0;
2569 }
2570
2571 rc2 = RTR0MemObjFree(Mem.MapObjR3, false);
2572 AssertRC(rc2);
2573 }
2574
2575 rc2 = RTR0MemObjFree(Mem.MemObj, false);
2576 AssertRC(rc2);
2577 }
2578
2579 return rc;
2580}
2581
2582
2583/**
2584 * Frees memory allocated using SUPR0LowAlloc().
2585 *
2586 * @returns IPRT status code.
2587 * @param pSession The session to which the memory was allocated.
2588 * @param uPtr Pointer to the memory (ring-3 or ring-0).
2589 */
2590SUPR0DECL(int) SUPR0LowFree(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr)
2591{
2592 LogFlow(("SUPR0LowFree: pSession=%p uPtr=%p\n", pSession, (void *)uPtr));
2593 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2594 return supdrvMemRelease(pSession, uPtr, MEMREF_TYPE_LOW);
2595}
2596
2597
2598
2599/**
2600 * Allocates a chunk of memory with both R0 and R3 mappings.
2601 * The memory is fixed and it's possible to query the physical addresses using SUPR0MemGetPhys().
2602 *
2603 * @returns IPRT status code.
2604 * @param pSession The session to associated the allocation with.
2605 * @param cb Number of bytes to allocate.
2606 * @param ppvR0 Where to store the address of the Ring-0 mapping.
2607 * @param ppvR3 Where to store the address of the Ring-3 mapping.
2608 */
2609SUPR0DECL(int) SUPR0MemAlloc(PSUPDRVSESSION pSession, uint32_t cb, PRTR0PTR ppvR0, PRTR3PTR ppvR3)
2610{
2611 int rc;
2612 SUPDRVMEMREF Mem = { NIL_RTR0MEMOBJ, NIL_RTR0MEMOBJ, MEMREF_TYPE_UNUSED };
2613 LogFlow(("SUPR0MemAlloc: pSession=%p cb=%d ppvR0=%p ppvR3=%p\n", pSession, cb, ppvR0, ppvR3));
2614
2615 /*
2616 * Validate input.
2617 */
2618 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2619 AssertPtrReturn(ppvR0, VERR_INVALID_POINTER);
2620 AssertPtrReturn(ppvR3, VERR_INVALID_POINTER);
2621 if (cb < 1 || cb >= _4M)
2622 {
2623 Log(("Illegal request cb=%u; must be greater than 0 and smaller than 4MB.\n", cb));
2624 return VERR_INVALID_PARAMETER;
2625 }
2626
2627 /*
2628 * Let IPRT do the work.
2629 */
2630 rc = RTR0MemObjAllocPage(&Mem.MemObj, cb, true /* executable ring-0 mapping */);
2631 if (RT_SUCCESS(rc))
2632 {
2633 int rc2;
2634 rc = RTR0MemObjMapUser(&Mem.MapObjR3, Mem.MemObj, (RTR3PTR)-1, 0,
2635 RTMEM_PROT_EXEC | RTMEM_PROT_WRITE | RTMEM_PROT_READ, RTR0ProcHandleSelf());
2636 if (RT_SUCCESS(rc))
2637 {
2638 Mem.eType = MEMREF_TYPE_MEM;
2639 rc = supdrvMemAdd(&Mem, pSession);
2640 if (!rc)
2641 {
2642 *ppvR0 = RTR0MemObjAddress(Mem.MemObj);
2643 *ppvR3 = RTR0MemObjAddressR3(Mem.MapObjR3);
2644 return VINF_SUCCESS;
2645 }
2646
2647 rc2 = RTR0MemObjFree(Mem.MapObjR3, false);
2648 AssertRC(rc2);
2649 }
2650
2651 rc2 = RTR0MemObjFree(Mem.MemObj, false);
2652 AssertRC(rc2);
2653 }
2654
2655 return rc;
2656}
2657
2658
2659/**
2660 * Get the physical addresses of memory allocated using SUPR0MemAlloc().
2661 *
2662 * @returns IPRT status code.
2663 * @param pSession The session to which the memory was allocated.
2664 * @param uPtr The Ring-0 or Ring-3 address returned by SUPR0MemAlloc().
2665 * @param paPages Where to store the physical addresses.
2666 */
2667SUPR0DECL(int) SUPR0MemGetPhys(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr, PSUPPAGE paPages) /** @todo switch this bugger to RTHCPHYS */
2668{
2669 PSUPDRVBUNDLE pBundle;
2670 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
2671 LogFlow(("SUPR0MemGetPhys: pSession=%p uPtr=%p paPages=%p\n", pSession, (void *)uPtr, paPages));
2672
2673 /*
2674 * Validate input.
2675 */
2676 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2677 AssertPtrReturn(paPages, VERR_INVALID_POINTER);
2678 AssertReturn(uPtr, VERR_INVALID_PARAMETER);
2679
2680 /*
2681 * Search for the address.
2682 */
2683 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
2684 for (pBundle = &pSession->Bundle; pBundle; pBundle = pBundle->pNext)
2685 {
2686 if (pBundle->cUsed > 0)
2687 {
2688 unsigned i;
2689 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
2690 {
2691 if ( pBundle->aMem[i].eType == MEMREF_TYPE_MEM
2692 && pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ
2693 && ( (RTHCUINTPTR)RTR0MemObjAddress(pBundle->aMem[i].MemObj) == uPtr
2694 || ( pBundle->aMem[i].MapObjR3 != NIL_RTR0MEMOBJ
2695 && RTR0MemObjAddressR3(pBundle->aMem[i].MapObjR3) == uPtr)
2696 )
2697 )
2698 {
2699 const size_t cPages = RTR0MemObjSize(pBundle->aMem[i].MemObj) >> PAGE_SHIFT;
2700 size_t iPage;
2701 for (iPage = 0; iPage < cPages; iPage++)
2702 {
2703 paPages[iPage].Phys = RTR0MemObjGetPagePhysAddr(pBundle->aMem[i].MemObj, iPage);
2704 paPages[iPage].uReserved = 0;
2705 }
2706 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
2707 return VINF_SUCCESS;
2708 }
2709 }
2710 }
2711 }
2712 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
2713 Log(("Failed to find %p!!!\n", (void *)uPtr));
2714 return VERR_INVALID_PARAMETER;
2715}
2716
2717
2718/**
2719 * Free memory allocated by SUPR0MemAlloc().
2720 *
2721 * @returns IPRT status code.
2722 * @param pSession The session owning the allocation.
2723 * @param uPtr The Ring-0 or Ring-3 address returned by SUPR0MemAlloc().
2724 */
2725SUPR0DECL(int) SUPR0MemFree(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr)
2726{
2727 LogFlow(("SUPR0MemFree: pSession=%p uPtr=%p\n", pSession, (void *)uPtr));
2728 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2729 return supdrvMemRelease(pSession, uPtr, MEMREF_TYPE_MEM);
2730}
2731
2732
2733/**
2734 * Allocates a chunk of memory with a kernel or/and a user mode mapping.
2735 *
2736 * The memory is fixed and it's possible to query the physical addresses using
2737 * SUPR0MemGetPhys().
2738 *
2739 * @returns IPRT status code.
2740 * @param pSession The session to associated the allocation with.
2741 * @param cPages The number of pages to allocate.
2742 * @param fFlags Flags, reserved for the future. Must be zero.
2743 * @param ppvR3 Where to store the address of the Ring-3 mapping.
2744 * NULL if no ring-3 mapping.
2745 * @param ppvR3 Where to store the address of the Ring-0 mapping.
2746 * NULL if no ring-0 mapping.
2747 * @param paPages Where to store the addresses of the pages. Optional.
2748 */
2749SUPR0DECL(int) SUPR0PageAllocEx(PSUPDRVSESSION pSession, uint32_t cPages, uint32_t fFlags, PRTR3PTR ppvR3, PRTR0PTR ppvR0, PRTHCPHYS paPages)
2750{
2751 int rc;
2752 SUPDRVMEMREF Mem = { NIL_RTR0MEMOBJ, NIL_RTR0MEMOBJ, MEMREF_TYPE_UNUSED };
2753 LogFlow(("SUPR0PageAlloc: pSession=%p cb=%d ppvR3=%p\n", pSession, cPages, ppvR3));
2754
2755 /*
2756 * Validate input. The allowed allocation size must be at least equal to the maximum guest VRAM size.
2757 */
2758 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2759 AssertPtrNullReturn(ppvR3, VERR_INVALID_POINTER);
2760 AssertPtrNullReturn(ppvR0, VERR_INVALID_POINTER);
2761 AssertReturn(ppvR3 || ppvR0, VERR_INVALID_PARAMETER);
2762 AssertReturn(!fFlags, VERR_INVALID_PARAMETER);
2763 if (cPages < 1 || cPages > VBOX_MAX_ALLOC_PAGE_COUNT)
2764 {
2765 Log(("SUPR0PageAlloc: Illegal request cb=%u; must be greater than 0 and smaller than %uMB (VBOX_MAX_ALLOC_PAGE_COUNT pages).\n", cPages, VBOX_MAX_ALLOC_PAGE_COUNT * (_1M / _4K)));
2766 return VERR_PAGE_COUNT_OUT_OF_RANGE;
2767 }
2768
2769 /*
2770 * Let IPRT do the work.
2771 */
2772 if (ppvR0)
2773 rc = RTR0MemObjAllocPage(&Mem.MemObj, (size_t)cPages * PAGE_SIZE, true /* fExecutable */);
2774 else
2775 rc = RTR0MemObjAllocPhysNC(&Mem.MemObj, (size_t)cPages * PAGE_SIZE, NIL_RTHCPHYS);
2776 if (RT_SUCCESS(rc))
2777 {
2778 int rc2;
2779 if (ppvR3)
2780 rc = RTR0MemObjMapUser(&Mem.MapObjR3, Mem.MemObj, (RTR3PTR)-1, 0,
2781 RTMEM_PROT_EXEC | RTMEM_PROT_WRITE | RTMEM_PROT_READ, RTR0ProcHandleSelf());
2782 else
2783 Mem.MapObjR3 = NIL_RTR0MEMOBJ;
2784 if (RT_SUCCESS(rc))
2785 {
2786 Mem.eType = MEMREF_TYPE_PAGE;
2787 rc = supdrvMemAdd(&Mem, pSession);
2788 if (!rc)
2789 {
2790 if (ppvR3)
2791 *ppvR3 = RTR0MemObjAddressR3(Mem.MapObjR3);
2792 if (ppvR0)
2793 *ppvR0 = RTR0MemObjAddress(Mem.MemObj);
2794 if (paPages)
2795 {
2796 uint32_t iPage = cPages;
2797 while (iPage-- > 0)
2798 {
2799 paPages[iPage] = RTR0MemObjGetPagePhysAddr(Mem.MapObjR3, iPage);
2800 Assert(paPages[iPage] != NIL_RTHCPHYS);
2801 }
2802 }
2803 return VINF_SUCCESS;
2804 }
2805
2806 rc2 = RTR0MemObjFree(Mem.MapObjR3, false);
2807 AssertRC(rc2);
2808 }
2809
2810 rc2 = RTR0MemObjFree(Mem.MemObj, false);
2811 AssertRC(rc2);
2812 }
2813 return rc;
2814}
2815
2816
2817/**
2818 * Maps a chunk of memory previously allocated by SUPR0PageAllocEx into kernel
2819 * space.
2820 *
2821 * @returns IPRT status code.
2822 * @param pSession The session to associated the allocation with.
2823 * @param pvR3 The ring-3 address returned by SUPR0PageAllocEx.
2824 * @param offSub Where to start mapping. Must be page aligned.
2825 * @param cbSub How much to map. Must be page aligned.
2826 * @param fFlags Flags, MBZ.
2827 * @param ppvR0 Where to return the address of the ring-0 mapping on
2828 * success.
2829 */
2830SUPR0DECL(int) SUPR0PageMapKernel(PSUPDRVSESSION pSession, RTR3PTR pvR3, uint32_t offSub, uint32_t cbSub,
2831 uint32_t fFlags, PRTR0PTR ppvR0)
2832{
2833 int rc;
2834 PSUPDRVBUNDLE pBundle;
2835 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
2836 RTR0MEMOBJ hMemObj = NIL_RTR0MEMOBJ;
2837 LogFlow(("SUPR0PageMapKernel: pSession=%p pvR3=%p offSub=%#x cbSub=%#x\n", pSession, pvR3, offSub, cbSub));
2838
2839 /*
2840 * Validate input. The allowed allocation size must be at least equal to the maximum guest VRAM size.
2841 */
2842 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2843 AssertPtrNullReturn(ppvR0, VERR_INVALID_POINTER);
2844 AssertReturn(!fFlags, VERR_INVALID_PARAMETER);
2845 AssertReturn(!(offSub & PAGE_OFFSET_MASK), VERR_INVALID_PARAMETER);
2846 AssertReturn(!(cbSub & PAGE_OFFSET_MASK), VERR_INVALID_PARAMETER);
2847 AssertReturn(cbSub, VERR_INVALID_PARAMETER);
2848
2849 /*
2850 * Find the memory object.
2851 */
2852 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
2853 for (pBundle = &pSession->Bundle; pBundle; pBundle = pBundle->pNext)
2854 {
2855 if (pBundle->cUsed > 0)
2856 {
2857 unsigned i;
2858 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
2859 {
2860 if ( ( pBundle->aMem[i].eType == MEMREF_TYPE_PAGE
2861 && pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ
2862 && pBundle->aMem[i].MapObjR3 != NIL_RTR0MEMOBJ
2863 && RTR0MemObjAddressR3(pBundle->aMem[i].MapObjR3) == pvR3)
2864 || ( pBundle->aMem[i].eType == MEMREF_TYPE_LOCKED
2865 && pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ
2866 && pBundle->aMem[i].MapObjR3 == NIL_RTR0MEMOBJ
2867 && RTR0MemObjAddressR3(pBundle->aMem[i].MemObj) == pvR3))
2868 {
2869 hMemObj = pBundle->aMem[i].MemObj;
2870 break;
2871 }
2872 }
2873 }
2874 }
2875 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
2876
2877 rc = VERR_INVALID_PARAMETER;
2878 if (hMemObj != NIL_RTR0MEMOBJ)
2879 {
2880 /*
2881 * Do some further input validations before calling IPRT.
2882 * (Cleanup is done indirectly by telling RTR0MemObjFree to include mappings.)
2883 */
2884 size_t cbMemObj = RTR0MemObjSize(hMemObj);
2885 if ( offSub < cbMemObj
2886 && cbSub <= cbMemObj
2887 && offSub + cbSub <= cbMemObj)
2888 {
2889 RTR0MEMOBJ hMapObj;
2890 rc = RTR0MemObjMapKernelEx(&hMapObj, hMemObj, (void *)-1, 0,
2891 RTMEM_PROT_READ | RTMEM_PROT_WRITE, offSub, cbSub);
2892 if (RT_SUCCESS(rc))
2893 *ppvR0 = RTR0MemObjAddress(hMapObj);
2894 }
2895 else
2896 SUPR0Printf("SUPR0PageMapKernel: cbMemObj=%#x offSub=%#x cbSub=%#x\n", cbMemObj, offSub, cbSub);
2897
2898 }
2899 return rc;
2900}
2901
2902
2903/**
2904 * Changes the page level protection of one or more pages previously allocated
2905 * by SUPR0PageAllocEx.
2906 *
2907 * @returns IPRT status code.
2908 * @param pSession The session to associated the allocation with.
2909 * @param pvR3 The ring-3 address returned by SUPR0PageAllocEx.
2910 * NIL_RTR3PTR if the ring-3 mapping should be unaffected.
2911 * @param pvR0 The ring-0 address returned by SUPR0PageAllocEx.
2912 * NIL_RTR0PTR if the ring-0 mapping should be unaffected.
2913 * @param offSub Where to start changing. Must be page aligned.
2914 * @param cbSub How much to change. Must be page aligned.
2915 * @param fProt The new page level protection, see RTMEM_PROT_*.
2916 */
2917SUPR0DECL(int) SUPR0PageProtect(PSUPDRVSESSION pSession, RTR3PTR pvR3, RTR0PTR pvR0, uint32_t offSub, uint32_t cbSub, uint32_t fProt)
2918{
2919 int rc;
2920 PSUPDRVBUNDLE pBundle;
2921 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
2922 RTR0MEMOBJ hMemObjR0 = NIL_RTR0MEMOBJ;
2923 RTR0MEMOBJ hMemObjR3 = NIL_RTR0MEMOBJ;
2924 LogFlow(("SUPR0PageProtect: pSession=%p pvR3=%p pvR0=%p offSub=%#x cbSub=%#x fProt-%#x\n", pSession, pvR3, pvR0, offSub, cbSub, fProt));
2925
2926 /*
2927 * Validate input. The allowed allocation size must be at least equal to the maximum guest VRAM size.
2928 */
2929 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
2930 AssertReturn(!(fProt & ~(RTMEM_PROT_READ | RTMEM_PROT_WRITE | RTMEM_PROT_EXEC | RTMEM_PROT_NONE)), VERR_INVALID_PARAMETER);
2931 AssertReturn(!(offSub & PAGE_OFFSET_MASK), VERR_INVALID_PARAMETER);
2932 AssertReturn(!(cbSub & PAGE_OFFSET_MASK), VERR_INVALID_PARAMETER);
2933 AssertReturn(cbSub, VERR_INVALID_PARAMETER);
2934
2935 /*
2936 * Find the memory object.
2937 */
2938 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
2939 for (pBundle = &pSession->Bundle; pBundle; pBundle = pBundle->pNext)
2940 {
2941 if (pBundle->cUsed > 0)
2942 {
2943 unsigned i;
2944 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
2945 {
2946 if ( pBundle->aMem[i].eType == MEMREF_TYPE_PAGE
2947 && pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ
2948 && ( pBundle->aMem[i].MapObjR3 != NIL_RTR0MEMOBJ
2949 || pvR3 == NIL_RTR3PTR)
2950 && ( pvR0 == NIL_RTR0PTR
2951 || RTR0MemObjAddress(pBundle->aMem[i].MemObj) == pvR0)
2952 && ( pvR3 == NIL_RTR3PTR
2953 || RTR0MemObjAddressR3(pBundle->aMem[i].MapObjR3) == pvR3))
2954 {
2955 if (pvR0 != NIL_RTR0PTR)
2956 hMemObjR0 = pBundle->aMem[i].MemObj;
2957 if (pvR3 != NIL_RTR3PTR)
2958 hMemObjR3 = pBundle->aMem[i].MapObjR3;
2959 break;
2960 }
2961 }
2962 }
2963 }
2964 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
2965
2966 rc = VERR_INVALID_PARAMETER;
2967 if ( hMemObjR0 != NIL_RTR0MEMOBJ
2968 || hMemObjR3 != NIL_RTR0MEMOBJ)
2969 {
2970 /*
2971 * Do some further input validations before calling IPRT.
2972 */
2973 size_t cbMemObj = hMemObjR0 != NIL_RTR0PTR ? RTR0MemObjSize(hMemObjR0) : RTR0MemObjSize(hMemObjR3);
2974 if ( offSub < cbMemObj
2975 && cbSub <= cbMemObj
2976 && offSub + cbSub <= cbMemObj)
2977 {
2978 rc = VINF_SUCCESS;
2979 if (hMemObjR3 != NIL_RTR0PTR)
2980 rc = RTR0MemObjProtect(hMemObjR3, offSub, cbSub, fProt);
2981 if (hMemObjR0 != NIL_RTR0PTR && RT_SUCCESS(rc))
2982 rc = RTR0MemObjProtect(hMemObjR0, offSub, cbSub, fProt);
2983 }
2984 else
2985 SUPR0Printf("SUPR0PageMapKernel: cbMemObj=%#x offSub=%#x cbSub=%#x\n", cbMemObj, offSub, cbSub);
2986
2987 }
2988 return rc;
2989
2990}
2991
2992
2993/**
2994 * Free memory allocated by SUPR0PageAlloc() and SUPR0PageAllocEx().
2995 *
2996 * @returns IPRT status code.
2997 * @param pSession The session owning the allocation.
2998 * @param pvR3 The Ring-3 address returned by SUPR0PageAlloc() or
2999 * SUPR0PageAllocEx().
3000 */
3001SUPR0DECL(int) SUPR0PageFree(PSUPDRVSESSION pSession, RTR3PTR pvR3)
3002{
3003 LogFlow(("SUPR0PageFree: pSession=%p pvR3=%p\n", pSession, (void *)pvR3));
3004 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3005 return supdrvMemRelease(pSession, (RTHCUINTPTR)pvR3, MEMREF_TYPE_PAGE);
3006}
3007
3008
3009/**
3010 * Gets the paging mode of the current CPU.
3011 *
3012 * @returns Paging mode, SUPPAGEINGMODE_INVALID on error.
3013 */
3014SUPR0DECL(SUPPAGINGMODE) SUPR0GetPagingMode(void)
3015{
3016 SUPPAGINGMODE enmMode;
3017
3018 RTR0UINTREG cr0 = ASMGetCR0();
3019 if ((cr0 & (X86_CR0_PG | X86_CR0_PE)) != (X86_CR0_PG | X86_CR0_PE))
3020 enmMode = SUPPAGINGMODE_INVALID;
3021 else
3022 {
3023 RTR0UINTREG cr4 = ASMGetCR4();
3024 uint32_t fNXEPlusLMA = 0;
3025 if (cr4 & X86_CR4_PAE)
3026 {
3027 uint32_t fAmdFeatures = ASMCpuId_EDX(0x80000001);
3028 if (fAmdFeatures & (X86_CPUID_AMD_FEATURE_EDX_NX | X86_CPUID_AMD_FEATURE_EDX_LONG_MODE))
3029 {
3030 uint64_t efer = ASMRdMsr(MSR_K6_EFER);
3031 if ((fAmdFeatures & X86_CPUID_AMD_FEATURE_EDX_NX) && (efer & MSR_K6_EFER_NXE))
3032 fNXEPlusLMA |= RT_BIT(0);
3033 if ((fAmdFeatures & X86_CPUID_AMD_FEATURE_EDX_LONG_MODE) && (efer & MSR_K6_EFER_LMA))
3034 fNXEPlusLMA |= RT_BIT(1);
3035 }
3036 }
3037
3038 switch ((cr4 & (X86_CR4_PAE | X86_CR4_PGE)) | fNXEPlusLMA)
3039 {
3040 case 0:
3041 enmMode = SUPPAGINGMODE_32_BIT;
3042 break;
3043
3044 case X86_CR4_PGE:
3045 enmMode = SUPPAGINGMODE_32_BIT_GLOBAL;
3046 break;
3047
3048 case X86_CR4_PAE:
3049 enmMode = SUPPAGINGMODE_PAE;
3050 break;
3051
3052 case X86_CR4_PAE | RT_BIT(0):
3053 enmMode = SUPPAGINGMODE_PAE_NX;
3054 break;
3055
3056 case X86_CR4_PAE | X86_CR4_PGE:
3057 enmMode = SUPPAGINGMODE_PAE_GLOBAL;
3058 break;
3059
3060 case X86_CR4_PAE | X86_CR4_PGE | RT_BIT(0):
3061 enmMode = SUPPAGINGMODE_PAE_GLOBAL;
3062 break;
3063
3064 case RT_BIT(1) | X86_CR4_PAE:
3065 enmMode = SUPPAGINGMODE_AMD64;
3066 break;
3067
3068 case RT_BIT(1) | X86_CR4_PAE | RT_BIT(0):
3069 enmMode = SUPPAGINGMODE_AMD64_NX;
3070 break;
3071
3072 case RT_BIT(1) | X86_CR4_PAE | X86_CR4_PGE:
3073 enmMode = SUPPAGINGMODE_AMD64_GLOBAL;
3074 break;
3075
3076 case RT_BIT(1) | X86_CR4_PAE | X86_CR4_PGE | RT_BIT(0):
3077 enmMode = SUPPAGINGMODE_AMD64_GLOBAL_NX;
3078 break;
3079
3080 default:
3081 AssertMsgFailed(("Cannot happen! cr4=%#x fNXEPlusLMA=%d\n", cr4, fNXEPlusLMA));
3082 enmMode = SUPPAGINGMODE_INVALID;
3083 break;
3084 }
3085 }
3086 return enmMode;
3087}
3088
3089
3090/**
3091 * Enables or disabled hardware virtualization extensions using native OS APIs.
3092 *
3093 * @returns VBox status code.
3094 * @retval VINF_SUCCESS on success.
3095 * @retval VERR_NOT_SUPPORTED if not supported by the native OS.
3096 *
3097 * @param fEnable Whether to enable or disable.
3098 */
3099SUPR0DECL(int) SUPR0EnableVTx(bool fEnable)
3100{
3101#ifdef RT_OS_DARWIN
3102 return supdrvOSEnableVTx(fEnable);
3103#else
3104 return VERR_NOT_SUPPORTED;
3105#endif
3106}
3107
3108
3109/** @todo document me */
3110SUPR0DECL(int) SUPR0QueryVTCaps(PSUPDRVSESSION pSession, uint32_t *pfCaps)
3111{
3112 /*
3113 * Input validation.
3114 */
3115 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3116 AssertPtrReturn(pfCaps, VERR_INVALID_POINTER);
3117
3118 *pfCaps = 0;
3119
3120 if (ASMHasCpuId())
3121 {
3122 uint32_t u32FeaturesECX;
3123 uint32_t u32Dummy;
3124 uint32_t u32FeaturesEDX;
3125 uint32_t u32VendorEBX, u32VendorECX, u32VendorEDX, u32AMDFeatureEDX, u32AMDFeatureECX;
3126 uint64_t val;
3127
3128 ASMCpuId(0, &u32Dummy, &u32VendorEBX, &u32VendorECX, &u32VendorEDX);
3129 ASMCpuId(1, &u32Dummy, &u32Dummy, &u32FeaturesECX, &u32FeaturesEDX);
3130 /* Query AMD features. */
3131 ASMCpuId(0x80000001, &u32Dummy, &u32Dummy, &u32AMDFeatureECX, &u32AMDFeatureEDX);
3132
3133 if ( u32VendorEBX == X86_CPUID_VENDOR_INTEL_EBX
3134 && u32VendorECX == X86_CPUID_VENDOR_INTEL_ECX
3135 && u32VendorEDX == X86_CPUID_VENDOR_INTEL_EDX
3136 )
3137 {
3138 if ( (u32FeaturesECX & X86_CPUID_FEATURE_ECX_VMX)
3139 && (u32FeaturesEDX & X86_CPUID_FEATURE_EDX_MSR)
3140 && (u32FeaturesEDX & X86_CPUID_FEATURE_EDX_FXSR)
3141 )
3142 {
3143 val = ASMRdMsr(MSR_IA32_FEATURE_CONTROL);
3144 /*
3145 * Both the LOCK and VMXON bit must be set; otherwise VMXON will generate a #GP.
3146 * Once the lock bit is set, this MSR can no longer be modified.
3147 */
3148 if ( (val & (MSR_IA32_FEATURE_CONTROL_VMXON|MSR_IA32_FEATURE_CONTROL_LOCK))
3149 == (MSR_IA32_FEATURE_CONTROL_VMXON|MSR_IA32_FEATURE_CONTROL_LOCK) /* enabled and locked */
3150 || !(val & MSR_IA32_FEATURE_CONTROL_LOCK) /* not enabled, but not locked either */
3151 )
3152 {
3153 VMX_CAPABILITY vtCaps;
3154
3155 *pfCaps |= SUPVTCAPS_VT_X;
3156
3157 vtCaps.u = ASMRdMsr(MSR_IA32_VMX_PROCBASED_CTLS);
3158 if (vtCaps.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC_USE_SECONDARY_EXEC_CTRL)
3159 {
3160 vtCaps.u = ASMRdMsr(MSR_IA32_VMX_PROCBASED_CTLS2);
3161 if (vtCaps.n.allowed1 & VMX_VMCS_CTRL_PROC_EXEC2_EPT)
3162 *pfCaps |= SUPVTCAPS_NESTED_PAGING;
3163 }
3164 return VINF_SUCCESS;
3165 }
3166 return VERR_VMX_MSR_LOCKED_OR_DISABLED;
3167 }
3168 return VERR_VMX_NO_VMX;
3169 }
3170
3171 if ( u32VendorEBX == X86_CPUID_VENDOR_AMD_EBX
3172 && u32VendorECX == X86_CPUID_VENDOR_AMD_ECX
3173 && u32VendorEDX == X86_CPUID_VENDOR_AMD_EDX
3174 )
3175 {
3176 if ( (u32AMDFeatureECX & X86_CPUID_AMD_FEATURE_ECX_SVM)
3177 && (u32FeaturesEDX & X86_CPUID_FEATURE_EDX_MSR)
3178 && (u32FeaturesEDX & X86_CPUID_FEATURE_EDX_FXSR)
3179 )
3180 {
3181 /* Check if SVM is disabled */
3182 val = ASMRdMsr(MSR_K8_VM_CR);
3183 if (!(val & MSR_K8_VM_CR_SVM_DISABLE))
3184 {
3185 *pfCaps |= SUPVTCAPS_AMD_V;
3186
3187 /* Query AMD features. */
3188 ASMCpuId(0x8000000A, &u32Dummy, &u32Dummy, &u32Dummy, &u32FeaturesEDX);
3189
3190 if (u32FeaturesEDX & AMD_CPUID_SVM_FEATURE_EDX_NESTED_PAGING)
3191 *pfCaps |= SUPVTCAPS_NESTED_PAGING;
3192
3193 return VINF_SUCCESS;
3194 }
3195 return VERR_SVM_DISABLED;
3196 }
3197 return VERR_SVM_NO_SVM;
3198 }
3199 }
3200
3201 return VERR_UNSUPPORTED_CPU;
3202}
3203
3204
3205/**
3206 * (Re-)initializes the per-cpu structure prior to starting or resuming the GIP
3207 * updating.
3208 *
3209 * @param pGipCpu The per CPU structure for this CPU.
3210 * @param u64NanoTS The current time.
3211 */
3212static void supdrvGipReInitCpu(PSUPGIPCPU pGipCpu, uint64_t u64NanoTS)
3213{
3214 pGipCpu->u64TSC = ASMReadTSC() - pGipCpu->u32UpdateIntervalTSC;
3215 pGipCpu->u64NanoTS = u64NanoTS;
3216}
3217
3218
3219/**
3220 * Set the current TSC and NanoTS value for the CPU.
3221 *
3222 * @param idCpu The CPU ID. Unused - we have to use the APIC ID.
3223 * @param pvUser1 Pointer to the ring-0 GIP mapping.
3224 * @param pvUser2 Pointer to the variable holding the current time.
3225 */
3226static DECLCALLBACK(void) supdrvGipReInitCpuCallback(RTCPUID idCpu, void *pvUser1, void *pvUser2)
3227{
3228 PSUPGLOBALINFOPAGE pGip = (PSUPGLOBALINFOPAGE)pvUser1;
3229 unsigned iCpu = pGip->aiCpuFromApicId[ASMGetApicId()];
3230
3231 if (RT_LIKELY(iCpu < pGip->cCpus && pGip->aCPUs[iCpu].idCpu == idCpu))
3232 supdrvGipReInitCpu(&pGip->aCPUs[iCpu], *(uint64_t *)pvUser2);
3233
3234 NOREF(pvUser2);
3235 NOREF(idCpu);
3236}
3237
3238
3239/**
3240 * Maps the GIP into userspace and/or get the physical address of the GIP.
3241 *
3242 * @returns IPRT status code.
3243 * @param pSession Session to which the GIP mapping should belong.
3244 * @param ppGipR3 Where to store the address of the ring-3 mapping. (optional)
3245 * @param pHCPhysGip Where to store the physical address. (optional)
3246 *
3247 * @remark There is no reference counting on the mapping, so one call to this function
3248 * count globally as one reference. One call to SUPR0GipUnmap() is will unmap GIP
3249 * and remove the session as a GIP user.
3250 */
3251SUPR0DECL(int) SUPR0GipMap(PSUPDRVSESSION pSession, PRTR3PTR ppGipR3, PRTHCPHYS pHCPhysGip)
3252{
3253 int rc;
3254 PSUPDRVDEVEXT pDevExt = pSession->pDevExt;
3255 RTR3PTR pGipR3 = NIL_RTR3PTR;
3256 RTHCPHYS HCPhys = NIL_RTHCPHYS;
3257 LogFlow(("SUPR0GipMap: pSession=%p ppGipR3=%p pHCPhysGip=%p\n", pSession, ppGipR3, pHCPhysGip));
3258
3259 /*
3260 * Validate
3261 */
3262 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3263 AssertPtrNullReturn(ppGipR3, VERR_INVALID_POINTER);
3264 AssertPtrNullReturn(pHCPhysGip, VERR_INVALID_POINTER);
3265
3266#ifdef SUPDRV_USE_MUTEX_FOR_GIP
3267 RTSemMutexRequest(pDevExt->mtxGip, RT_INDEFINITE_WAIT);
3268#else
3269 RTSemFastMutexRequest(pDevExt->mtxGip);
3270#endif
3271 if (pDevExt->pGip)
3272 {
3273 /*
3274 * Map it?
3275 */
3276 rc = VINF_SUCCESS;
3277 if (ppGipR3)
3278 {
3279 if (pSession->GipMapObjR3 == NIL_RTR0MEMOBJ)
3280 rc = RTR0MemObjMapUser(&pSession->GipMapObjR3, pDevExt->GipMemObj, (RTR3PTR)-1, 0,
3281 RTMEM_PROT_READ, RTR0ProcHandleSelf());
3282 if (RT_SUCCESS(rc))
3283 pGipR3 = RTR0MemObjAddressR3(pSession->GipMapObjR3);
3284 }
3285
3286 /*
3287 * Get physical address.
3288 */
3289 if (pHCPhysGip && RT_SUCCESS(rc))
3290 HCPhys = pDevExt->HCPhysGip;
3291
3292 /*
3293 * Reference globally.
3294 */
3295 if (!pSession->fGipReferenced && RT_SUCCESS(rc))
3296 {
3297 pSession->fGipReferenced = 1;
3298 pDevExt->cGipUsers++;
3299 if (pDevExt->cGipUsers == 1)
3300 {
3301 PSUPGLOBALINFOPAGE pGipR0 = pDevExt->pGip;
3302 uint64_t u64NanoTS;
3303 uint32_t u32SystemResolution;
3304 unsigned i;
3305
3306 LogFlow(("SUPR0GipMap: Resumes GIP updating\n"));
3307
3308 /*
3309 * Try bump up the system timer resolution.
3310 * The more interrupts the better...
3311 */
3312 if ( RT_SUCCESS_NP(RTTimerRequestSystemGranularity( 976563 /* 1024 HZ */, &u32SystemResolution))
3313 || RT_SUCCESS_NP(RTTimerRequestSystemGranularity( 1000000 /* 1000 HZ */, &u32SystemResolution))
3314 || RT_SUCCESS_NP(RTTimerRequestSystemGranularity( 1953125 /* 512 HZ */, &u32SystemResolution))
3315 || RT_SUCCESS_NP(RTTimerRequestSystemGranularity( 2000000 /* 500 HZ */, &u32SystemResolution))
3316 )
3317 {
3318 Assert(RTTimerGetSystemGranularity() <= u32SystemResolution);
3319 pDevExt->u32SystemTimerGranularityGrant = u32SystemResolution;
3320 }
3321
3322 if (pGipR0->aCPUs[0].u32TransactionId != 2 /* not the first time */)
3323 {
3324 for (i = 0; i < RT_ELEMENTS(pGipR0->aCPUs); i++)
3325 ASMAtomicUoWriteU32(&pGipR0->aCPUs[i].u32TransactionId,
3326 (pGipR0->aCPUs[i].u32TransactionId + GIP_UPDATEHZ_RECALC_FREQ * 2)
3327 & ~(GIP_UPDATEHZ_RECALC_FREQ * 2 - 1));
3328 ASMAtomicWriteU64(&pGipR0->u64NanoTSLastUpdateHz, 0);
3329 }
3330
3331 u64NanoTS = RTTimeSystemNanoTS() - pGipR0->u32UpdateIntervalNS;
3332 if ( pGipR0->u32Mode == SUPGIPMODE_SYNC_TSC
3333 || RTMpGetOnlineCount() == 1)
3334 supdrvGipReInitCpu(&pGipR0->aCPUs[0], u64NanoTS);
3335 else
3336 RTMpOnAll(supdrvGipReInitCpuCallback, pGipR0, &u64NanoTS);
3337
3338#ifndef DO_NOT_START_GIP
3339 rc = RTTimerStart(pDevExt->pGipTimer, 0); AssertRC(rc);
3340#endif
3341 rc = VINF_SUCCESS;
3342 }
3343 }
3344 }
3345 else
3346 {
3347 rc = VERR_GENERAL_FAILURE;
3348 Log(("SUPR0GipMap: GIP is not available!\n"));
3349 }
3350#ifdef SUPDRV_USE_MUTEX_FOR_GIP
3351 RTSemMutexRelease(pDevExt->mtxGip);
3352#else
3353 RTSemFastMutexRelease(pDevExt->mtxGip);
3354#endif
3355
3356 /*
3357 * Write returns.
3358 */
3359 if (pHCPhysGip)
3360 *pHCPhysGip = HCPhys;
3361 if (ppGipR3)
3362 *ppGipR3 = pGipR3;
3363
3364#ifdef DEBUG_DARWIN_GIP
3365 OSDBGPRINT(("SUPR0GipMap: returns %d *pHCPhysGip=%lx pGipR3=%p\n", rc, (unsigned long)HCPhys, (void *)pGipR3));
3366#else
3367 LogFlow(( "SUPR0GipMap: returns %d *pHCPhysGip=%lx pGipR3=%p\n", rc, (unsigned long)HCPhys, (void *)pGipR3));
3368#endif
3369 return rc;
3370}
3371
3372
3373/**
3374 * Unmaps any user mapping of the GIP and terminates all GIP access
3375 * from this session.
3376 *
3377 * @returns IPRT status code.
3378 * @param pSession Session to which the GIP mapping should belong.
3379 */
3380SUPR0DECL(int) SUPR0GipUnmap(PSUPDRVSESSION pSession)
3381{
3382 int rc = VINF_SUCCESS;
3383 PSUPDRVDEVEXT pDevExt = pSession->pDevExt;
3384#ifdef DEBUG_DARWIN_GIP
3385 OSDBGPRINT(("SUPR0GipUnmap: pSession=%p pGip=%p GipMapObjR3=%p\n",
3386 pSession,
3387 pSession->GipMapObjR3 != NIL_RTR0MEMOBJ ? RTR0MemObjAddress(pSession->GipMapObjR3) : NULL,
3388 pSession->GipMapObjR3));
3389#else
3390 LogFlow(("SUPR0GipUnmap: pSession=%p\n", pSession));
3391#endif
3392 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3393
3394#ifdef SUPDRV_USE_MUTEX_FOR_GIP
3395 RTSemMutexRequest(pDevExt->mtxGip, RT_INDEFINITE_WAIT);
3396#else
3397 RTSemFastMutexRequest(pDevExt->mtxGip);
3398#endif
3399
3400 /*
3401 * Unmap anything?
3402 */
3403 if (pSession->GipMapObjR3 != NIL_RTR0MEMOBJ)
3404 {
3405 rc = RTR0MemObjFree(pSession->GipMapObjR3, false);
3406 AssertRC(rc);
3407 if (RT_SUCCESS(rc))
3408 pSession->GipMapObjR3 = NIL_RTR0MEMOBJ;
3409 }
3410
3411 /*
3412 * Dereference global GIP.
3413 */
3414 if (pSession->fGipReferenced && !rc)
3415 {
3416 pSession->fGipReferenced = 0;
3417 if ( pDevExt->cGipUsers > 0
3418 && !--pDevExt->cGipUsers)
3419 {
3420 LogFlow(("SUPR0GipUnmap: Suspends GIP updating\n"));
3421#ifndef DO_NOT_START_GIP
3422 rc = RTTimerStop(pDevExt->pGipTimer); AssertRC(rc); rc = VINF_SUCCESS;
3423#endif
3424
3425 if (pDevExt->u32SystemTimerGranularityGrant)
3426 {
3427 int rc2 = RTTimerReleaseSystemGranularity(pDevExt->u32SystemTimerGranularityGrant);
3428 AssertRC(rc2);
3429 pDevExt->u32SystemTimerGranularityGrant = 0;
3430 }
3431 }
3432 }
3433
3434#ifdef SUPDRV_USE_MUTEX_FOR_GIP
3435 RTSemMutexRelease(pDevExt->mtxGip);
3436#else
3437 RTSemFastMutexRelease(pDevExt->mtxGip);
3438#endif
3439
3440 return rc;
3441}
3442
3443
3444/**
3445 * Gets the GIP pointer.
3446 *
3447 * @returns Pointer to the GIP or NULL.
3448 */
3449SUPDECL(PSUPGLOBALINFOPAGE) SUPGetGIP(void)
3450{
3451 return g_pSUPGlobalInfoPage;
3452}
3453
3454
3455/**
3456 * Register a component factory with the support driver.
3457 *
3458 * This is currently restricted to kernel sessions only.
3459 *
3460 * @returns VBox status code.
3461 * @retval VINF_SUCCESS on success.
3462 * @retval VERR_NO_MEMORY if we're out of memory.
3463 * @retval VERR_ALREADY_EXISTS if the factory has already been registered.
3464 * @retval VERR_ACCESS_DENIED if it isn't a kernel session.
3465 * @retval VERR_INVALID_PARAMETER on invalid parameter.
3466 * @retval VERR_INVALID_POINTER on invalid pointer parameter.
3467 *
3468 * @param pSession The SUPDRV session (must be a ring-0 session).
3469 * @param pFactory Pointer to the component factory registration structure.
3470 *
3471 * @remarks This interface is also available via SUPR0IdcComponentRegisterFactory.
3472 */
3473SUPR0DECL(int) SUPR0ComponentRegisterFactory(PSUPDRVSESSION pSession, PCSUPDRVFACTORY pFactory)
3474{
3475 PSUPDRVFACTORYREG pNewReg;
3476 const char *psz;
3477 int rc;
3478
3479 /*
3480 * Validate parameters.
3481 */
3482 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3483 AssertReturn(pSession->R0Process == NIL_RTR0PROCESS, VERR_ACCESS_DENIED);
3484 AssertPtrReturn(pFactory, VERR_INVALID_POINTER);
3485 AssertPtrReturn(pFactory->pfnQueryFactoryInterface, VERR_INVALID_POINTER);
3486 psz = RTStrEnd(pFactory->szName, sizeof(pFactory->szName));
3487 AssertReturn(psz, VERR_INVALID_PARAMETER);
3488
3489 /*
3490 * Allocate and initialize a new registration structure.
3491 */
3492 pNewReg = (PSUPDRVFACTORYREG)RTMemAlloc(sizeof(SUPDRVFACTORYREG));
3493 if (pNewReg)
3494 {
3495 pNewReg->pNext = NULL;
3496 pNewReg->pFactory = pFactory;
3497 pNewReg->pSession = pSession;
3498 pNewReg->cchName = psz - &pFactory->szName[0];
3499
3500 /*
3501 * Add it to the tail of the list after checking for prior registration.
3502 */
3503 rc = RTSemFastMutexRequest(pSession->pDevExt->mtxComponentFactory);
3504 if (RT_SUCCESS(rc))
3505 {
3506 PSUPDRVFACTORYREG pPrev = NULL;
3507 PSUPDRVFACTORYREG pCur = pSession->pDevExt->pComponentFactoryHead;
3508 while (pCur && pCur->pFactory != pFactory)
3509 {
3510 pPrev = pCur;
3511 pCur = pCur->pNext;
3512 }
3513 if (!pCur)
3514 {
3515 if (pPrev)
3516 pPrev->pNext = pNewReg;
3517 else
3518 pSession->pDevExt->pComponentFactoryHead = pNewReg;
3519 rc = VINF_SUCCESS;
3520 }
3521 else
3522 rc = VERR_ALREADY_EXISTS;
3523
3524 RTSemFastMutexRelease(pSession->pDevExt->mtxComponentFactory);
3525 }
3526
3527 if (RT_FAILURE(rc))
3528 RTMemFree(pNewReg);
3529 }
3530 else
3531 rc = VERR_NO_MEMORY;
3532 return rc;
3533}
3534
3535
3536/**
3537 * Deregister a component factory.
3538 *
3539 * @returns VBox status code.
3540 * @retval VINF_SUCCESS on success.
3541 * @retval VERR_NOT_FOUND if the factory wasn't registered.
3542 * @retval VERR_ACCESS_DENIED if it isn't a kernel session.
3543 * @retval VERR_INVALID_PARAMETER on invalid parameter.
3544 * @retval VERR_INVALID_POINTER on invalid pointer parameter.
3545 *
3546 * @param pSession The SUPDRV session (must be a ring-0 session).
3547 * @param pFactory Pointer to the component factory registration structure
3548 * previously passed SUPR0ComponentRegisterFactory().
3549 *
3550 * @remarks This interface is also available via SUPR0IdcComponentDeregisterFactory.
3551 */
3552SUPR0DECL(int) SUPR0ComponentDeregisterFactory(PSUPDRVSESSION pSession, PCSUPDRVFACTORY pFactory)
3553{
3554 int rc;
3555
3556 /*
3557 * Validate parameters.
3558 */
3559 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3560 AssertReturn(pSession->R0Process == NIL_RTR0PROCESS, VERR_ACCESS_DENIED);
3561 AssertPtrReturn(pFactory, VERR_INVALID_POINTER);
3562
3563 /*
3564 * Take the lock and look for the registration record.
3565 */
3566 rc = RTSemFastMutexRequest(pSession->pDevExt->mtxComponentFactory);
3567 if (RT_SUCCESS(rc))
3568 {
3569 PSUPDRVFACTORYREG pPrev = NULL;
3570 PSUPDRVFACTORYREG pCur = pSession->pDevExt->pComponentFactoryHead;
3571 while (pCur && pCur->pFactory != pFactory)
3572 {
3573 pPrev = pCur;
3574 pCur = pCur->pNext;
3575 }
3576 if (pCur)
3577 {
3578 if (!pPrev)
3579 pSession->pDevExt->pComponentFactoryHead = pCur->pNext;
3580 else
3581 pPrev->pNext = pCur->pNext;
3582
3583 pCur->pNext = NULL;
3584 pCur->pFactory = NULL;
3585 pCur->pSession = NULL;
3586 rc = VINF_SUCCESS;
3587 }
3588 else
3589 rc = VERR_NOT_FOUND;
3590
3591 RTSemFastMutexRelease(pSession->pDevExt->mtxComponentFactory);
3592
3593 RTMemFree(pCur);
3594 }
3595 return rc;
3596}
3597
3598
3599/**
3600 * Queries a component factory.
3601 *
3602 * @returns VBox status code.
3603 * @retval VERR_INVALID_PARAMETER on invalid parameter.
3604 * @retval VERR_INVALID_POINTER on invalid pointer parameter.
3605 * @retval VERR_SUPDRV_COMPONENT_NOT_FOUND if the component factory wasn't found.
3606 * @retval VERR_SUPDRV_INTERFACE_NOT_SUPPORTED if the interface wasn't supported.
3607 *
3608 * @param pSession The SUPDRV session.
3609 * @param pszName The name of the component factory.
3610 * @param pszInterfaceUuid The UUID of the factory interface (stringified).
3611 * @param ppvFactoryIf Where to store the factory interface.
3612 */
3613SUPR0DECL(int) SUPR0ComponentQueryFactory(PSUPDRVSESSION pSession, const char *pszName, const char *pszInterfaceUuid, void **ppvFactoryIf)
3614{
3615 const char *pszEnd;
3616 size_t cchName;
3617 int rc;
3618
3619 /*
3620 * Validate parameters.
3621 */
3622 AssertReturn(SUP_IS_SESSION_VALID(pSession), VERR_INVALID_PARAMETER);
3623
3624 AssertPtrReturn(pszName, VERR_INVALID_POINTER);
3625 pszEnd = RTStrEnd(pszName, RT_SIZEOFMEMB(SUPDRVFACTORY, szName));
3626 AssertReturn(pszEnd, VERR_INVALID_PARAMETER);
3627 cchName = pszEnd - pszName;
3628
3629 AssertPtrReturn(pszInterfaceUuid, VERR_INVALID_POINTER);
3630 pszEnd = RTStrEnd(pszInterfaceUuid, RTUUID_STR_LENGTH);
3631 AssertReturn(pszEnd, VERR_INVALID_PARAMETER);
3632
3633 AssertPtrReturn(ppvFactoryIf, VERR_INVALID_POINTER);
3634 *ppvFactoryIf = NULL;
3635
3636 /*
3637 * Take the lock and try all factories by this name.
3638 */
3639 rc = RTSemFastMutexRequest(pSession->pDevExt->mtxComponentFactory);
3640 if (RT_SUCCESS(rc))
3641 {
3642 PSUPDRVFACTORYREG pCur = pSession->pDevExt->pComponentFactoryHead;
3643 rc = VERR_SUPDRV_COMPONENT_NOT_FOUND;
3644 while (pCur)
3645 {
3646 if ( pCur->cchName == cchName
3647 && !memcmp(pCur->pFactory->szName, pszName, cchName))
3648 {
3649 void *pvFactory = pCur->pFactory->pfnQueryFactoryInterface(pCur->pFactory, pSession, pszInterfaceUuid);
3650 if (pvFactory)
3651 {
3652 *ppvFactoryIf = pvFactory;
3653 rc = VINF_SUCCESS;
3654 break;
3655 }
3656 rc = VERR_SUPDRV_INTERFACE_NOT_SUPPORTED;
3657 }
3658
3659 /* next */
3660 pCur = pCur->pNext;
3661 }
3662
3663 RTSemFastMutexRelease(pSession->pDevExt->mtxComponentFactory);
3664 }
3665 return rc;
3666}
3667
3668
3669#if !defined(VBOX_WITH_DTRACE_R0DRV) || defined(RT_OS_SOLARIS)
3670/**
3671 * Stub function.
3672 */
3673SUPR0DECL(void) SUPR0VtgFireProbe(uint32_t idProbe, uintptr_t uArg0, uintptr_t uArg1, uintptr_t uArg2,
3674 uintptr_t uArg3, uintptr_t uArg4)
3675{
3676 NOREF(idProbe); NOREF(uArg0); NOREF(uArg1); NOREF(uArg2); NOREF(uArg3); NOREF(uArg4);
3677}
3678#endif
3679
3680#ifndef VBOX_WITH_DTRACE_R0DRV
3681/**
3682 * Stub function.
3683 */
3684SUPR0DECL(int) SUPR0VtgRegisterModule(void *hMod, struct VTGOBJHDR *pVtgHdr)
3685{
3686 NOREF(hMod); NOREF(pVtgHdr);
3687 return VINF_SUCCESS;
3688}
3689#endif
3690
3691
3692/**
3693 * Adds a memory object to the session.
3694 *
3695 * @returns IPRT status code.
3696 * @param pMem Memory tracking structure containing the
3697 * information to track.
3698 * @param pSession The session.
3699 */
3700static int supdrvMemAdd(PSUPDRVMEMREF pMem, PSUPDRVSESSION pSession)
3701{
3702 PSUPDRVBUNDLE pBundle;
3703 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
3704
3705 /*
3706 * Find free entry and record the allocation.
3707 */
3708 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
3709 for (pBundle = &pSession->Bundle; pBundle; pBundle = pBundle->pNext)
3710 {
3711 if (pBundle->cUsed < RT_ELEMENTS(pBundle->aMem))
3712 {
3713 unsigned i;
3714 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
3715 {
3716 if (pBundle->aMem[i].MemObj == NIL_RTR0MEMOBJ)
3717 {
3718 pBundle->cUsed++;
3719 pBundle->aMem[i] = *pMem;
3720 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
3721 return VINF_SUCCESS;
3722 }
3723 }
3724 AssertFailed(); /* !!this can't be happening!!! */
3725 }
3726 }
3727 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
3728
3729 /*
3730 * Need to allocate a new bundle.
3731 * Insert into the last entry in the bundle.
3732 */
3733 pBundle = (PSUPDRVBUNDLE)RTMemAllocZ(sizeof(*pBundle));
3734 if (!pBundle)
3735 return VERR_NO_MEMORY;
3736
3737 /* take last entry. */
3738 pBundle->cUsed++;
3739 pBundle->aMem[RT_ELEMENTS(pBundle->aMem) - 1] = *pMem;
3740
3741 /* insert into list. */
3742 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
3743 pBundle->pNext = pSession->Bundle.pNext;
3744 pSession->Bundle.pNext = pBundle;
3745 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
3746
3747 return VINF_SUCCESS;
3748}
3749
3750
3751/**
3752 * Releases a memory object referenced by pointer and type.
3753 *
3754 * @returns IPRT status code.
3755 * @param pSession Session data.
3756 * @param uPtr Pointer to memory. This is matched against both the R0 and R3 addresses.
3757 * @param eType Memory type.
3758 */
3759static int supdrvMemRelease(PSUPDRVSESSION pSession, RTHCUINTPTR uPtr, SUPDRVMEMREFTYPE eType)
3760{
3761 PSUPDRVBUNDLE pBundle;
3762 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
3763
3764 /*
3765 * Validate input.
3766 */
3767 if (!uPtr)
3768 {
3769 Log(("Illegal address %p\n", (void *)uPtr));
3770 return VERR_INVALID_PARAMETER;
3771 }
3772
3773 /*
3774 * Search for the address.
3775 */
3776 RTSpinlockAcquire(pSession->Spinlock, &SpinlockTmp);
3777 for (pBundle = &pSession->Bundle; pBundle; pBundle = pBundle->pNext)
3778 {
3779 if (pBundle->cUsed > 0)
3780 {
3781 unsigned i;
3782 for (i = 0; i < RT_ELEMENTS(pBundle->aMem); i++)
3783 {
3784 if ( pBundle->aMem[i].eType == eType
3785 && pBundle->aMem[i].MemObj != NIL_RTR0MEMOBJ
3786 && ( (RTHCUINTPTR)RTR0MemObjAddress(pBundle->aMem[i].MemObj) == uPtr
3787 || ( pBundle->aMem[i].MapObjR3 != NIL_RTR0MEMOBJ
3788 && RTR0MemObjAddressR3(pBundle->aMem[i].MapObjR3) == uPtr))
3789 )
3790 {
3791 /* Make a copy of it and release it outside the spinlock. */
3792 SUPDRVMEMREF Mem = pBundle->aMem[i];
3793 pBundle->aMem[i].eType = MEMREF_TYPE_UNUSED;
3794 pBundle->aMem[i].MemObj = NIL_RTR0MEMOBJ;
3795 pBundle->aMem[i].MapObjR3 = NIL_RTR0MEMOBJ;
3796 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
3797
3798 if (Mem.MapObjR3 != NIL_RTR0MEMOBJ)
3799 {
3800 int rc = RTR0MemObjFree(Mem.MapObjR3, false);
3801 AssertRC(rc); /** @todo figure out how to handle this. */
3802 }
3803 if (Mem.MemObj != NIL_RTR0MEMOBJ)
3804 {
3805 int rc = RTR0MemObjFree(Mem.MemObj, true /* fFreeMappings */);
3806 AssertRC(rc); /** @todo figure out how to handle this. */
3807 }
3808 return VINF_SUCCESS;
3809 }
3810 }
3811 }
3812 }
3813 RTSpinlockRelease(pSession->Spinlock, &SpinlockTmp);
3814 Log(("Failed to find %p!!! (eType=%d)\n", (void *)uPtr, eType));
3815 return VERR_INVALID_PARAMETER;
3816}
3817
3818
3819/**
3820 * Opens an image. If it's the first time it's opened the call must upload
3821 * the bits using the supdrvIOCtl_LdrLoad() / SUPDRV_IOCTL_LDR_LOAD function.
3822 *
3823 * This is the 1st step of the loading.
3824 *
3825 * @returns IPRT status code.
3826 * @param pDevExt Device globals.
3827 * @param pSession Session data.
3828 * @param pReq The open request.
3829 */
3830static int supdrvIOCtl_LdrOpen(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDROPEN pReq)
3831{
3832 int rc;
3833 PSUPDRVLDRIMAGE pImage;
3834 void *pv;
3835 size_t cchName = strlen(pReq->u.In.szName); /* (caller checked < 32). */
3836 LogFlow(("supdrvIOCtl_LdrOpen: szName=%s cbImageWithTabs=%d\n", pReq->u.In.szName, pReq->u.In.cbImageWithTabs));
3837
3838 /*
3839 * Check if we got an instance of the image already.
3840 */
3841 supdrvLdrLock(pDevExt);
3842 for (pImage = pDevExt->pLdrImages; pImage; pImage = pImage->pNext)
3843 {
3844 if ( pImage->szName[cchName] == '\0'
3845 && !memcmp(pImage->szName, pReq->u.In.szName, cchName))
3846 {
3847 /** @todo check cbImageBits and cbImageWithTabs here, if they differs that indicates that the images are different. */
3848 pImage->cUsage++;
3849 pReq->u.Out.pvImageBase = pImage->pvImage;
3850 pReq->u.Out.fNeedsLoading = pImage->uState == SUP_IOCTL_LDR_OPEN;
3851 pReq->u.Out.fNativeLoader = pImage->fNative;
3852 supdrvLdrAddUsage(pSession, pImage);
3853 supdrvLdrUnlock(pDevExt);
3854 return VINF_SUCCESS;
3855 }
3856 }
3857 /* (not found - add it!) */
3858
3859 /*
3860 * Allocate memory.
3861 */
3862 pv = RTMemAlloc(RT_OFFSETOF(SUPDRVLDRIMAGE, szName[cchName + 1]));
3863 if (!pv)
3864 {
3865 supdrvLdrUnlock(pDevExt);
3866 Log(("supdrvIOCtl_LdrOpen: RTMemAlloc() failed\n"));
3867 return /*VERR_NO_MEMORY*/ VERR_INTERNAL_ERROR_2;
3868 }
3869
3870 /*
3871 * Setup and link in the LDR stuff.
3872 */
3873 pImage = (PSUPDRVLDRIMAGE)pv;
3874 pImage->pvImage = NULL;
3875 pImage->pvImageAlloc = NULL;
3876 pImage->cbImageWithTabs = pReq->u.In.cbImageWithTabs;
3877 pImage->cbImageBits = pReq->u.In.cbImageBits;
3878 pImage->cSymbols = 0;
3879 pImage->paSymbols = NULL;
3880 pImage->pachStrTab = NULL;
3881 pImage->cbStrTab = 0;
3882 pImage->pfnModuleInit = NULL;
3883 pImage->pfnModuleTerm = NULL;
3884 pImage->pfnServiceReqHandler = NULL;
3885 pImage->uState = SUP_IOCTL_LDR_OPEN;
3886 pImage->cUsage = 1;
3887 pImage->pDevExt = pDevExt;
3888 memcpy(pImage->szName, pReq->u.In.szName, cchName + 1);
3889
3890 /*
3891 * Try load it using the native loader, if that isn't supported, fall back
3892 * on the older method.
3893 */
3894 pImage->fNative = true;
3895 rc = supdrvOSLdrOpen(pDevExt, pImage, pReq->u.In.szFilename);
3896 if (rc == VERR_NOT_SUPPORTED)
3897 {
3898 pImage->pvImageAlloc = RTMemExecAlloc(pImage->cbImageBits + 31);
3899 pImage->pvImage = RT_ALIGN_P(pImage->pvImageAlloc, 32);
3900 pImage->fNative = false;
3901 rc = pImage->pvImageAlloc ? VINF_SUCCESS : VERR_NO_EXEC_MEMORY;
3902 }
3903 if (RT_FAILURE(rc))
3904 {
3905 supdrvLdrUnlock(pDevExt);
3906 RTMemFree(pImage);
3907 Log(("supdrvIOCtl_LdrOpen(%s): failed - %Rrc\n", pReq->u.In.szName, rc));
3908 return rc;
3909 }
3910 Assert(VALID_PTR(pImage->pvImage) || RT_FAILURE(rc));
3911
3912 /*
3913 * Link it.
3914 */
3915 pImage->pNext = pDevExt->pLdrImages;
3916 pDevExt->pLdrImages = pImage;
3917
3918 supdrvLdrAddUsage(pSession, pImage);
3919
3920 pReq->u.Out.pvImageBase = pImage->pvImage;
3921 pReq->u.Out.fNeedsLoading = true;
3922 pReq->u.Out.fNativeLoader = pImage->fNative;
3923 supdrvLdrUnlock(pDevExt);
3924
3925#if defined(RT_OS_WINDOWS) && defined(DEBUG)
3926 SUPR0Printf("VBoxDrv: windbg> .reload /f %s=%#p\n", pImage->szName, pImage->pvImage);
3927#endif
3928 return VINF_SUCCESS;
3929}
3930
3931
3932/**
3933 * Worker that validates a pointer to an image entrypoint.
3934 *
3935 * @returns IPRT status code.
3936 * @param pDevExt The device globals.
3937 * @param pImage The loader image.
3938 * @param pv The pointer into the image.
3939 * @param fMayBeNull Whether it may be NULL.
3940 * @param pszWhat What is this entrypoint? (for logging)
3941 * @param pbImageBits The image bits prepared by ring-3.
3942 *
3943 * @remarks Will leave the lock on failure.
3944 */
3945static int supdrvLdrValidatePointer(PSUPDRVDEVEXT pDevExt, PSUPDRVLDRIMAGE pImage, void *pv,
3946 bool fMayBeNull, const uint8_t *pbImageBits, const char *pszWhat)
3947{
3948 if (!fMayBeNull || pv)
3949 {
3950 if ((uintptr_t)pv - (uintptr_t)pImage->pvImage >= pImage->cbImageBits)
3951 {
3952 supdrvLdrUnlock(pDevExt);
3953 Log(("Out of range (%p LB %#x): %s=%p\n", pImage->pvImage, pImage->cbImageBits, pszWhat, pv));
3954 return VERR_INVALID_PARAMETER;
3955 }
3956
3957 if (pImage->fNative)
3958 {
3959 int rc = supdrvOSLdrValidatePointer(pDevExt, pImage, pv, pbImageBits);
3960 if (RT_FAILURE(rc))
3961 {
3962 supdrvLdrUnlock(pDevExt);
3963 Log(("Bad entry point address: %s=%p (rc=%Rrc)\n", pszWhat, pv, rc));
3964 return rc;
3965 }
3966 }
3967 }
3968 return VINF_SUCCESS;
3969}
3970
3971
3972/**
3973 * Loads the image bits.
3974 *
3975 * This is the 2nd step of the loading.
3976 *
3977 * @returns IPRT status code.
3978 * @param pDevExt Device globals.
3979 * @param pSession Session data.
3980 * @param pReq The request.
3981 */
3982static int supdrvIOCtl_LdrLoad(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRLOAD pReq)
3983{
3984 PSUPDRVLDRUSAGE pUsage;
3985 PSUPDRVLDRIMAGE pImage;
3986 int rc;
3987 LogFlow(("supdrvIOCtl_LdrLoad: pvImageBase=%p cbImageWithBits=%d\n", pReq->u.In.pvImageBase, pReq->u.In.cbImageWithTabs));
3988
3989 /*
3990 * Find the ldr image.
3991 */
3992 supdrvLdrLock(pDevExt);
3993 pUsage = pSession->pLdrUsage;
3994 while (pUsage && pUsage->pImage->pvImage != pReq->u.In.pvImageBase)
3995 pUsage = pUsage->pNext;
3996 if (!pUsage)
3997 {
3998 supdrvLdrUnlock(pDevExt);
3999 Log(("SUP_IOCTL_LDR_LOAD: couldn't find image!\n"));
4000 return VERR_INVALID_HANDLE;
4001 }
4002 pImage = pUsage->pImage;
4003
4004 /*
4005 * Validate input.
4006 */
4007 if ( pImage->cbImageWithTabs != pReq->u.In.cbImageWithTabs
4008 || pImage->cbImageBits != pReq->u.In.cbImageBits)
4009 {
4010 supdrvLdrUnlock(pDevExt);
4011 Log(("SUP_IOCTL_LDR_LOAD: image size mismatch!! %d(prep) != %d(load) or %d != %d\n",
4012 pImage->cbImageWithTabs, pReq->u.In.cbImageWithTabs, pImage->cbImageBits, pReq->u.In.cbImageBits));
4013 return VERR_INVALID_HANDLE;
4014 }
4015
4016 if (pImage->uState != SUP_IOCTL_LDR_OPEN)
4017 {
4018 unsigned uState = pImage->uState;
4019 supdrvLdrUnlock(pDevExt);
4020 if (uState != SUP_IOCTL_LDR_LOAD)
4021 AssertMsgFailed(("SUP_IOCTL_LDR_LOAD: invalid image state %d (%#x)!\n", uState, uState));
4022 return VERR_ALREADY_LOADED;
4023 }
4024
4025 switch (pReq->u.In.eEPType)
4026 {
4027 case SUPLDRLOADEP_NOTHING:
4028 break;
4029
4030 case SUPLDRLOADEP_VMMR0:
4031 rc = supdrvLdrValidatePointer( pDevExt, pImage, pReq->u.In.EP.VMMR0.pvVMMR0, false, pReq->u.In.abImage, "pvVMMR0");
4032 if (RT_SUCCESS(rc))
4033 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.EP.VMMR0.pvVMMR0EntryInt, false, pReq->u.In.abImage, "pvVMMR0EntryInt");
4034 if (RT_SUCCESS(rc))
4035 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.EP.VMMR0.pvVMMR0EntryFast, false, pReq->u.In.abImage, "pvVMMR0EntryFast");
4036 if (RT_SUCCESS(rc))
4037 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.EP.VMMR0.pvVMMR0EntryEx, false, pReq->u.In.abImage, "pvVMMR0EntryEx");
4038 if (RT_FAILURE(rc))
4039 return rc;
4040 break;
4041
4042 case SUPLDRLOADEP_SERVICE:
4043 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.EP.Service.pfnServiceReq, false, pReq->u.In.abImage, "pfnServiceReq");
4044 if (RT_FAILURE(rc))
4045 return rc;
4046 if ( pReq->u.In.EP.Service.apvReserved[0] != NIL_RTR0PTR
4047 || pReq->u.In.EP.Service.apvReserved[1] != NIL_RTR0PTR
4048 || pReq->u.In.EP.Service.apvReserved[2] != NIL_RTR0PTR)
4049 {
4050 supdrvLdrUnlock(pDevExt);
4051 Log(("Out of range (%p LB %#x): apvReserved={%p,%p,%p} MBZ!\n",
4052 pImage->pvImage, pReq->u.In.cbImageWithTabs,
4053 pReq->u.In.EP.Service.apvReserved[0],
4054 pReq->u.In.EP.Service.apvReserved[1],
4055 pReq->u.In.EP.Service.apvReserved[2]));
4056 return VERR_INVALID_PARAMETER;
4057 }
4058 break;
4059
4060 default:
4061 supdrvLdrUnlock(pDevExt);
4062 Log(("Invalid eEPType=%d\n", pReq->u.In.eEPType));
4063 return VERR_INVALID_PARAMETER;
4064 }
4065
4066 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.pfnModuleInit, true, pReq->u.In.abImage, "pfnModuleInit");
4067 if (RT_FAILURE(rc))
4068 return rc;
4069 rc = supdrvLdrValidatePointer(pDevExt, pImage, pReq->u.In.pfnModuleTerm, true, pReq->u.In.abImage, "pfnModuleTerm");
4070 if (RT_FAILURE(rc))
4071 return rc;
4072
4073 /*
4074 * Allocate and copy the tables.
4075 * (No need to do try/except as this is a buffered request.)
4076 */
4077 pImage->cbStrTab = pReq->u.In.cbStrTab;
4078 if (pImage->cbStrTab)
4079 {
4080 pImage->pachStrTab = (char *)RTMemAlloc(pImage->cbStrTab);
4081 if (pImage->pachStrTab)
4082 memcpy(pImage->pachStrTab, &pReq->u.In.abImage[pReq->u.In.offStrTab], pImage->cbStrTab);
4083 else
4084 rc = /*VERR_NO_MEMORY*/ VERR_INTERNAL_ERROR_3;
4085 }
4086
4087 pImage->cSymbols = pReq->u.In.cSymbols;
4088 if (RT_SUCCESS(rc) && pImage->cSymbols)
4089 {
4090 size_t cbSymbols = pImage->cSymbols * sizeof(SUPLDRSYM);
4091 pImage->paSymbols = (PSUPLDRSYM)RTMemAlloc(cbSymbols);
4092 if (pImage->paSymbols)
4093 memcpy(pImage->paSymbols, &pReq->u.In.abImage[pReq->u.In.offSymbols], cbSymbols);
4094 else
4095 rc = /*VERR_NO_MEMORY*/ VERR_INTERNAL_ERROR_4;
4096 }
4097
4098 /*
4099 * Copy the bits / complete native loading.
4100 */
4101 if (RT_SUCCESS(rc))
4102 {
4103 pImage->uState = SUP_IOCTL_LDR_LOAD;
4104 pImage->pfnModuleInit = pReq->u.In.pfnModuleInit;
4105 pImage->pfnModuleTerm = pReq->u.In.pfnModuleTerm;
4106
4107 if (pImage->fNative)
4108 rc = supdrvOSLdrLoad(pDevExt, pImage, pReq->u.In.abImage, pReq);
4109 else
4110 memcpy(pImage->pvImage, &pReq->u.In.abImage[0], pImage->cbImageBits);
4111 }
4112
4113 /*
4114 * Update any entry points.
4115 */
4116 if (RT_SUCCESS(rc))
4117 {
4118 switch (pReq->u.In.eEPType)
4119 {
4120 default:
4121 case SUPLDRLOADEP_NOTHING:
4122 rc = VINF_SUCCESS;
4123 break;
4124 case SUPLDRLOADEP_VMMR0:
4125 rc = supdrvLdrSetVMMR0EPs(pDevExt, pReq->u.In.EP.VMMR0.pvVMMR0, pReq->u.In.EP.VMMR0.pvVMMR0EntryInt,
4126 pReq->u.In.EP.VMMR0.pvVMMR0EntryFast, pReq->u.In.EP.VMMR0.pvVMMR0EntryEx);
4127 break;
4128 case SUPLDRLOADEP_SERVICE:
4129 pImage->pfnServiceReqHandler = pReq->u.In.EP.Service.pfnServiceReq;
4130 rc = VINF_SUCCESS;
4131 break;
4132 }
4133 }
4134
4135 /*
4136 * On success call the module initialization.
4137 */
4138 LogFlow(("supdrvIOCtl_LdrLoad: pfnModuleInit=%p\n", pImage->pfnModuleInit));
4139 if (RT_SUCCESS(rc) && pImage->pfnModuleInit)
4140 {
4141 Log(("supdrvIOCtl_LdrLoad: calling pfnModuleInit=%p\n", pImage->pfnModuleInit));
4142 pDevExt->pLdrInitImage = pImage;
4143 pDevExt->hLdrInitThread = RTThreadNativeSelf();
4144 rc = pImage->pfnModuleInit(pImage);
4145 pDevExt->pLdrInitImage = NULL;
4146 pDevExt->hLdrInitThread = NIL_RTNATIVETHREAD;
4147 if (RT_FAILURE(rc) && pDevExt->pvVMMR0 == pImage->pvImage)
4148 supdrvLdrUnsetVMMR0EPs(pDevExt);
4149 }
4150
4151 if (RT_FAILURE(rc))
4152 {
4153#ifdef VBOX_WITH_DTRACE_R0DRV
4154 /* Inform the tracing component in case ModuleInit registered TPs. */
4155 supdrvVtgModuleUnloading(pDevExt, pImage);
4156#endif
4157
4158 pImage->uState = SUP_IOCTL_LDR_OPEN;
4159 pImage->pfnModuleInit = NULL;
4160 pImage->pfnModuleTerm = NULL;
4161 pImage->pfnServiceReqHandler= NULL;
4162 pImage->cbStrTab = 0;
4163 RTMemFree(pImage->pachStrTab);
4164 pImage->pachStrTab = NULL;
4165 RTMemFree(pImage->paSymbols);
4166 pImage->paSymbols = NULL;
4167 pImage->cSymbols = 0;
4168 }
4169
4170 supdrvLdrUnlock(pDevExt);
4171 return rc;
4172}
4173
4174
4175/**
4176 * Frees a previously loaded (prep'ed) image.
4177 *
4178 * @returns IPRT status code.
4179 * @param pDevExt Device globals.
4180 * @param pSession Session data.
4181 * @param pReq The request.
4182 */
4183static int supdrvIOCtl_LdrFree(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRFREE pReq)
4184{
4185 int rc;
4186 PSUPDRVLDRUSAGE pUsagePrev;
4187 PSUPDRVLDRUSAGE pUsage;
4188 PSUPDRVLDRIMAGE pImage;
4189 LogFlow(("supdrvIOCtl_LdrFree: pvImageBase=%p\n", pReq->u.In.pvImageBase));
4190
4191 /*
4192 * Find the ldr image.
4193 */
4194 supdrvLdrLock(pDevExt);
4195 pUsagePrev = NULL;
4196 pUsage = pSession->pLdrUsage;
4197 while (pUsage && pUsage->pImage->pvImage != pReq->u.In.pvImageBase)
4198 {
4199 pUsagePrev = pUsage;
4200 pUsage = pUsage->pNext;
4201 }
4202 if (!pUsage)
4203 {
4204 supdrvLdrUnlock(pDevExt);
4205 Log(("SUP_IOCTL_LDR_FREE: couldn't find image!\n"));
4206 return VERR_INVALID_HANDLE;
4207 }
4208
4209 /*
4210 * Check if we can remove anything.
4211 */
4212 rc = VINF_SUCCESS;
4213 pImage = pUsage->pImage;
4214 if (pImage->cUsage <= 1 || pUsage->cUsage <= 1)
4215 {
4216 /*
4217 * Check if there are any objects with destructors in the image, if
4218 * so leave it for the session cleanup routine so we get a chance to
4219 * clean things up in the right order and not leave them all dangling.
4220 */
4221 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
4222 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
4223 if (pImage->cUsage <= 1)
4224 {
4225 PSUPDRVOBJ pObj;
4226 for (pObj = pDevExt->pObjs; pObj; pObj = pObj->pNext)
4227 if (RT_UNLIKELY((uintptr_t)pObj->pfnDestructor - (uintptr_t)pImage->pvImage < pImage->cbImageBits))
4228 {
4229 rc = VERR_DANGLING_OBJECTS;
4230 break;
4231 }
4232 }
4233 else
4234 {
4235 PSUPDRVUSAGE pGenUsage;
4236 for (pGenUsage = pSession->pUsage; pGenUsage; pGenUsage = pGenUsage->pNext)
4237 if (RT_UNLIKELY((uintptr_t)pGenUsage->pObj->pfnDestructor - (uintptr_t)pImage->pvImage < pImage->cbImageBits))
4238 {
4239 rc = VERR_DANGLING_OBJECTS;
4240 break;
4241 }
4242 }
4243 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
4244 if (rc == VINF_SUCCESS)
4245 {
4246 /* unlink it */
4247 if (pUsagePrev)
4248 pUsagePrev->pNext = pUsage->pNext;
4249 else
4250 pSession->pLdrUsage = pUsage->pNext;
4251
4252 /* free it */
4253 pUsage->pImage = NULL;
4254 pUsage->pNext = NULL;
4255 RTMemFree(pUsage);
4256
4257 /*
4258 * Dereference the image.
4259 */
4260 if (pImage->cUsage <= 1)
4261 supdrvLdrFree(pDevExt, pImage);
4262 else
4263 pImage->cUsage--;
4264 }
4265 else
4266 {
4267 Log(("supdrvIOCtl_LdrFree: Dangling objects in %p/%s!\n", pImage->pvImage, pImage->szName));
4268 rc = VINF_SUCCESS; /** @todo BRANCH-2.1: remove this after branching. */
4269 }
4270 }
4271 else
4272 {
4273 /*
4274 * Dereference both image and usage.
4275 */
4276 pImage->cUsage--;
4277 pUsage->cUsage--;
4278 }
4279
4280 supdrvLdrUnlock(pDevExt);
4281 return rc;
4282}
4283
4284
4285/**
4286 * Gets the address of a symbol in an open image.
4287 *
4288 * @returns IPRT status code.
4289 * @param pDevExt Device globals.
4290 * @param pSession Session data.
4291 * @param pReq The request buffer.
4292 */
4293static int supdrvIOCtl_LdrGetSymbol(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLDRGETSYMBOL pReq)
4294{
4295 PSUPDRVLDRIMAGE pImage;
4296 PSUPDRVLDRUSAGE pUsage;
4297 uint32_t i;
4298 PSUPLDRSYM paSyms;
4299 const char *pchStrings;
4300 const size_t cbSymbol = strlen(pReq->u.In.szSymbol) + 1;
4301 void *pvSymbol = NULL;
4302 int rc = VERR_GENERAL_FAILURE;
4303 Log3(("supdrvIOCtl_LdrGetSymbol: pvImageBase=%p szSymbol=\"%s\"\n", pReq->u.In.pvImageBase, pReq->u.In.szSymbol));
4304
4305 /*
4306 * Find the ldr image.
4307 */
4308 supdrvLdrLock(pDevExt);
4309 pUsage = pSession->pLdrUsage;
4310 while (pUsage && pUsage->pImage->pvImage != pReq->u.In.pvImageBase)
4311 pUsage = pUsage->pNext;
4312 if (!pUsage)
4313 {
4314 supdrvLdrUnlock(pDevExt);
4315 Log(("SUP_IOCTL_LDR_GET_SYMBOL: couldn't find image!\n"));
4316 return VERR_INVALID_HANDLE;
4317 }
4318 pImage = pUsage->pImage;
4319 if (pImage->uState != SUP_IOCTL_LDR_LOAD)
4320 {
4321 unsigned uState = pImage->uState;
4322 supdrvLdrUnlock(pDevExt);
4323 Log(("SUP_IOCTL_LDR_GET_SYMBOL: invalid image state %d (%#x)!\n", uState, uState)); NOREF(uState);
4324 return VERR_ALREADY_LOADED;
4325 }
4326
4327 /*
4328 * Search the symbol strings.
4329 *
4330 * Note! The int32_t is for native loading on solaris where the data
4331 * and text segments are in very different places.
4332 */
4333 pchStrings = pImage->pachStrTab;
4334 paSyms = pImage->paSymbols;
4335 for (i = 0; i < pImage->cSymbols; i++)
4336 {
4337 if ( paSyms[i].offName + cbSymbol <= pImage->cbStrTab
4338 && !memcmp(pchStrings + paSyms[i].offName, pReq->u.In.szSymbol, cbSymbol))
4339 {
4340 pvSymbol = (uint8_t *)pImage->pvImage + (int32_t)paSyms[i].offSymbol;
4341 rc = VINF_SUCCESS;
4342 break;
4343 }
4344 }
4345 supdrvLdrUnlock(pDevExt);
4346 pReq->u.Out.pvSymbol = pvSymbol;
4347 return rc;
4348}
4349
4350
4351/**
4352 * Gets the address of a symbol in an open image or the support driver.
4353 *
4354 * @returns VINF_SUCCESS on success.
4355 * @returns
4356 * @param pDevExt Device globals.
4357 * @param pSession Session data.
4358 * @param pReq The request buffer.
4359 */
4360static int supdrvIDC_LdrGetSymbol(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPDRVIDCREQGETSYM pReq)
4361{
4362 int rc = VINF_SUCCESS;
4363 const char *pszSymbol = pReq->u.In.pszSymbol;
4364 const char *pszModule = pReq->u.In.pszModule;
4365 size_t cbSymbol;
4366 char const *pszEnd;
4367 uint32_t i;
4368
4369 /*
4370 * Input validation.
4371 */
4372 AssertPtrReturn(pszSymbol, VERR_INVALID_POINTER);
4373 pszEnd = RTStrEnd(pszSymbol, 512);
4374 AssertReturn(pszEnd, VERR_INVALID_PARAMETER);
4375 cbSymbol = pszEnd - pszSymbol + 1;
4376
4377 if (pszModule)
4378 {
4379 AssertPtrReturn(pszModule, VERR_INVALID_POINTER);
4380 pszEnd = RTStrEnd(pszModule, 64);
4381 AssertReturn(pszEnd, VERR_INVALID_PARAMETER);
4382 }
4383 Log3(("supdrvIDC_LdrGetSymbol: pszModule=%p:{%s} pszSymbol=%p:{%s}\n", pszModule, pszModule, pszSymbol, pszSymbol));
4384
4385
4386 if ( !pszModule
4387 || !strcmp(pszModule, "SupDrv"))
4388 {
4389 /*
4390 * Search the support driver export table.
4391 */
4392 for (i = 0; i < RT_ELEMENTS(g_aFunctions); i++)
4393 if (!strcmp(g_aFunctions[i].szName, pszSymbol))
4394 {
4395 pReq->u.Out.pfnSymbol = g_aFunctions[i].pfn;
4396 break;
4397 }
4398 }
4399 else
4400 {
4401 /*
4402 * Find the loader image.
4403 */
4404 PSUPDRVLDRIMAGE pImage;
4405
4406 supdrvLdrLock(pDevExt);
4407
4408 for (pImage = pDevExt->pLdrImages; pImage; pImage = pImage->pNext)
4409 if (!strcmp(pImage->szName, pszModule))
4410 break;
4411 if (pImage && pImage->uState == SUP_IOCTL_LDR_LOAD)
4412 {
4413 /*
4414 * Search the symbol strings.
4415 */
4416 const char *pchStrings = pImage->pachStrTab;
4417 PCSUPLDRSYM paSyms = pImage->paSymbols;
4418 for (i = 0; i < pImage->cSymbols; i++)
4419 {
4420 if ( paSyms[i].offName + cbSymbol <= pImage->cbStrTab
4421 && !memcmp(pchStrings + paSyms[i].offName, pszSymbol, cbSymbol))
4422 {
4423 /*
4424 * Found it! Calc the symbol address and add a reference to the module.
4425 */
4426 pReq->u.Out.pfnSymbol = (PFNRT)((uint8_t *)pImage->pvImage + (int32_t)paSyms[i].offSymbol);
4427 rc = supdrvLdrAddUsage(pSession, pImage);
4428 break;
4429 }
4430 }
4431 }
4432 else
4433 rc = pImage ? VERR_WRONG_ORDER : VERR_MODULE_NOT_FOUND;
4434
4435 supdrvLdrUnlock(pDevExt);
4436 }
4437 return rc;
4438}
4439
4440
4441/**
4442 * Updates the VMMR0 entry point pointers.
4443 *
4444 * @returns IPRT status code.
4445 * @param pDevExt Device globals.
4446 * @param pSession Session data.
4447 * @param pVMMR0 VMMR0 image handle.
4448 * @param pvVMMR0EntryInt VMMR0EntryInt address.
4449 * @param pvVMMR0EntryFast VMMR0EntryFast address.
4450 * @param pvVMMR0EntryEx VMMR0EntryEx address.
4451 * @remark Caller must own the loader mutex.
4452 */
4453static int supdrvLdrSetVMMR0EPs(PSUPDRVDEVEXT pDevExt, void *pvVMMR0, void *pvVMMR0EntryInt, void *pvVMMR0EntryFast, void *pvVMMR0EntryEx)
4454{
4455 int rc = VINF_SUCCESS;
4456 LogFlow(("supdrvLdrSetR0EP pvVMMR0=%p pvVMMR0EntryInt=%p\n", pvVMMR0, pvVMMR0EntryInt));
4457
4458
4459 /*
4460 * Check if not yet set.
4461 */
4462 if (!pDevExt->pvVMMR0)
4463 {
4464 pDevExt->pvVMMR0 = pvVMMR0;
4465 pDevExt->pfnVMMR0EntryInt = pvVMMR0EntryInt;
4466 pDevExt->pfnVMMR0EntryFast = pvVMMR0EntryFast;
4467 pDevExt->pfnVMMR0EntryEx = pvVMMR0EntryEx;
4468 }
4469 else
4470 {
4471 /*
4472 * Return failure or success depending on whether the values match or not.
4473 */
4474 if ( pDevExt->pvVMMR0 != pvVMMR0
4475 || (void *)pDevExt->pfnVMMR0EntryInt != pvVMMR0EntryInt
4476 || (void *)pDevExt->pfnVMMR0EntryFast != pvVMMR0EntryFast
4477 || (void *)pDevExt->pfnVMMR0EntryEx != pvVMMR0EntryEx)
4478 {
4479 AssertMsgFailed(("SUP_IOCTL_LDR_SETR0EP: Already set pointing to a different module!\n"));
4480 rc = VERR_INVALID_PARAMETER;
4481 }
4482 }
4483 return rc;
4484}
4485
4486
4487/**
4488 * Unsets the VMMR0 entry point installed by supdrvLdrSetR0EP.
4489 *
4490 * @param pDevExt Device globals.
4491 */
4492static void supdrvLdrUnsetVMMR0EPs(PSUPDRVDEVEXT pDevExt)
4493{
4494 pDevExt->pvVMMR0 = NULL;
4495 pDevExt->pfnVMMR0EntryInt = NULL;
4496 pDevExt->pfnVMMR0EntryFast = NULL;
4497 pDevExt->pfnVMMR0EntryEx = NULL;
4498}
4499
4500
4501/**
4502 * Adds a usage reference in the specified session of an image.
4503 *
4504 * Called while owning the loader semaphore.
4505 *
4506 * @returns VINF_SUCCESS on success and VERR_NO_MEMORY on failure.
4507 * @param pSession Session in question.
4508 * @param pImage Image which the session is using.
4509 */
4510static int supdrvLdrAddUsage(PSUPDRVSESSION pSession, PSUPDRVLDRIMAGE pImage)
4511{
4512 PSUPDRVLDRUSAGE pUsage;
4513 LogFlow(("supdrvLdrAddUsage: pImage=%p\n", pImage));
4514
4515 /*
4516 * Referenced it already?
4517 */
4518 pUsage = pSession->pLdrUsage;
4519 while (pUsage)
4520 {
4521 if (pUsage->pImage == pImage)
4522 {
4523 pUsage->cUsage++;
4524 return VINF_SUCCESS;
4525 }
4526 pUsage = pUsage->pNext;
4527 }
4528
4529 /*
4530 * Allocate new usage record.
4531 */
4532 pUsage = (PSUPDRVLDRUSAGE)RTMemAlloc(sizeof(*pUsage));
4533 AssertReturn(pUsage, /*VERR_NO_MEMORY*/ VERR_INTERNAL_ERROR_5);
4534 pUsage->cUsage = 1;
4535 pUsage->pImage = pImage;
4536 pUsage->pNext = pSession->pLdrUsage;
4537 pSession->pLdrUsage = pUsage;
4538 return VINF_SUCCESS;
4539}
4540
4541
4542/**
4543 * Frees a load image.
4544 *
4545 * @param pDevExt Pointer to device extension.
4546 * @param pImage Pointer to the image we're gonna free.
4547 * This image must exit!
4548 * @remark The caller MUST own SUPDRVDEVEXT::mtxLdr!
4549 */
4550static void supdrvLdrFree(PSUPDRVDEVEXT pDevExt, PSUPDRVLDRIMAGE pImage)
4551{
4552 PSUPDRVLDRIMAGE pImagePrev;
4553 LogFlow(("supdrvLdrFree: pImage=%p\n", pImage));
4554
4555 /* find it - arg. should've used doubly linked list. */
4556 Assert(pDevExt->pLdrImages);
4557 pImagePrev = NULL;
4558 if (pDevExt->pLdrImages != pImage)
4559 {
4560 pImagePrev = pDevExt->pLdrImages;
4561 while (pImagePrev->pNext != pImage)
4562 pImagePrev = pImagePrev->pNext;
4563 Assert(pImagePrev->pNext == pImage);
4564 }
4565
4566 /* unlink */
4567 if (pImagePrev)
4568 pImagePrev->pNext = pImage->pNext;
4569 else
4570 pDevExt->pLdrImages = pImage->pNext;
4571
4572 /* check if this is VMMR0.r0 unset its entry point pointers. */
4573 if (pDevExt->pvVMMR0 == pImage->pvImage)
4574 supdrvLdrUnsetVMMR0EPs(pDevExt);
4575
4576 /* check for objects with destructors in this image. (Shouldn't happen.) */
4577 if (pDevExt->pObjs)
4578 {
4579 unsigned cObjs = 0;
4580 PSUPDRVOBJ pObj;
4581 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
4582 RTSpinlockAcquire(pDevExt->Spinlock, &SpinlockTmp);
4583 for (pObj = pDevExt->pObjs; pObj; pObj = pObj->pNext)
4584 if (RT_UNLIKELY((uintptr_t)pObj->pfnDestructor - (uintptr_t)pImage->pvImage < pImage->cbImageBits))
4585 {
4586 pObj->pfnDestructor = NULL;
4587 cObjs++;
4588 }
4589 RTSpinlockRelease(pDevExt->Spinlock, &SpinlockTmp);
4590 if (cObjs)
4591 OSDBGPRINT(("supdrvLdrFree: Image '%s' has %d dangling objects!\n", pImage->szName, cObjs));
4592 }
4593
4594 /* call termination function if fully loaded. */
4595 if ( pImage->pfnModuleTerm
4596 && pImage->uState == SUP_IOCTL_LDR_LOAD)
4597 {
4598 LogFlow(("supdrvIOCtl_LdrLoad: calling pfnModuleTerm=%p\n", pImage->pfnModuleTerm));
4599 pImage->pfnModuleTerm(pImage);
4600 }
4601
4602#ifdef VBOX_WITH_DTRACE_R0DRV
4603 /* Inform the tracing component. */
4604 supdrvVtgModuleUnloading(pDevExt, pImage);
4605#endif
4606
4607 /* do native unload if appropriate. */
4608 if (pImage->fNative)
4609 supdrvOSLdrUnload(pDevExt, pImage);
4610
4611 /* free the image */
4612 pImage->cUsage = 0;
4613 pImage->pDevExt = NULL;
4614 pImage->pNext = NULL;
4615 pImage->uState = SUP_IOCTL_LDR_FREE;
4616 RTMemExecFree(pImage->pvImageAlloc, pImage->cbImageBits + 31);
4617 pImage->pvImageAlloc = NULL;
4618 RTMemFree(pImage->pachStrTab);
4619 pImage->pachStrTab = NULL;
4620 RTMemFree(pImage->paSymbols);
4621 pImage->paSymbols = NULL;
4622 RTMemFree(pImage);
4623}
4624
4625
4626/**
4627 * Acquires the loader lock.
4628 *
4629 * @returns IPRT status code.
4630 * @param pDevExt The device extension.
4631 */
4632DECLINLINE(int) supdrvLdrLock(PSUPDRVDEVEXT pDevExt)
4633{
4634#ifdef SUPDRV_USE_MUTEX_FOR_LDR
4635 int rc = RTSemMutexRequest(pDevExt->mtxLdr, RT_INDEFINITE_WAIT);
4636#else
4637 int rc = RTSemFastMutexRequest(pDevExt->mtxLdr);
4638#endif
4639 AssertRC(rc);
4640 return rc;
4641}
4642
4643
4644/**
4645 * Releases the loader lock.
4646 *
4647 * @returns IPRT status code.
4648 * @param pDevExt The device extension.
4649 */
4650DECLINLINE(int) supdrvLdrUnlock(PSUPDRVDEVEXT pDevExt)
4651{
4652#ifdef SUPDRV_USE_MUTEX_FOR_LDR
4653 return RTSemMutexRelease(pDevExt->mtxLdr);
4654#else
4655 return RTSemFastMutexRelease(pDevExt->mtxLdr);
4656#endif
4657}
4658
4659
4660/**
4661 * Implements the service call request.
4662 *
4663 * @returns VBox status code.
4664 * @param pDevExt The device extension.
4665 * @param pSession The calling session.
4666 * @param pReq The request packet, valid.
4667 */
4668static int supdrvIOCtl_CallServiceModule(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPCALLSERVICE pReq)
4669{
4670#if !defined(RT_OS_WINDOWS) || defined(DEBUG)
4671 int rc;
4672
4673 /*
4674 * Find the module first in the module referenced by the calling session.
4675 */
4676 rc = supdrvLdrLock(pDevExt);
4677 if (RT_SUCCESS(rc))
4678 {
4679 PFNSUPR0SERVICEREQHANDLER pfnServiceReqHandler = NULL;
4680 PSUPDRVLDRUSAGE pUsage;
4681
4682 for (pUsage = pSession->pLdrUsage; pUsage; pUsage = pUsage->pNext)
4683 if ( pUsage->pImage->pfnServiceReqHandler
4684 && !strcmp(pUsage->pImage->szName, pReq->u.In.szName))
4685 {
4686 pfnServiceReqHandler = pUsage->pImage->pfnServiceReqHandler;
4687 break;
4688 }
4689 supdrvLdrUnlock(pDevExt);
4690
4691 if (pfnServiceReqHandler)
4692 {
4693 /*
4694 * Call it.
4695 */
4696 if (pReq->Hdr.cbIn == SUP_IOCTL_CALL_SERVICE_SIZE(0))
4697 rc = pfnServiceReqHandler(pSession, pReq->u.In.uOperation, pReq->u.In.u64Arg, NULL);
4698 else
4699 rc = pfnServiceReqHandler(pSession, pReq->u.In.uOperation, pReq->u.In.u64Arg, (PSUPR0SERVICEREQHDR)&pReq->abReqPkt[0]);
4700 }
4701 else
4702 rc = VERR_SUPDRV_SERVICE_NOT_FOUND;
4703 }
4704
4705 /* log it */
4706 if ( RT_FAILURE(rc)
4707 && rc != VERR_INTERRUPTED
4708 && rc != VERR_TIMEOUT)
4709 Log(("SUP_IOCTL_CALL_SERVICE: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
4710 rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
4711 else
4712 Log4(("SUP_IOCTL_CALL_SERVICE: rc=%Rrc op=%u out=%u arg=%RX64 p/t=%RTproc/%RTthrd\n",
4713 rc, pReq->u.In.uOperation, pReq->Hdr.cbOut, pReq->u.In.u64Arg, RTProcSelf(), RTThreadNativeSelf()));
4714 return rc;
4715#else /* RT_OS_WINDOWS && !DEBUG */
4716 return VERR_NOT_IMPLEMENTED;
4717#endif /* RT_OS_WINDOWS && !DEBUG */
4718}
4719
4720
4721/**
4722 * Implements the logger settings request.
4723 *
4724 * @returns VBox status code.
4725 * @param pDevExt The device extension.
4726 * @param pSession The caller's session.
4727 * @param pReq The request.
4728 */
4729static int supdrvIOCtl_LoggerSettings(PSUPDRVDEVEXT pDevExt, PSUPDRVSESSION pSession, PSUPLOGGERSETTINGS pReq)
4730{
4731 const char *pszGroup = &pReq->u.In.szStrings[pReq->u.In.offGroups];
4732 const char *pszFlags = &pReq->u.In.szStrings[pReq->u.In.offFlags];
4733 const char *pszDest = &pReq->u.In.szStrings[pReq->u.In.offDestination];
4734 PRTLOGGER pLogger = NULL;
4735 int rc;
4736
4737 /*
4738 * Some further validation.
4739 */
4740 switch (pReq->u.In.fWhat)
4741 {
4742 case SUPLOGGERSETTINGS_WHAT_SETTINGS:
4743 case SUPLOGGERSETTINGS_WHAT_CREATE:
4744 break;
4745
4746 case SUPLOGGERSETTINGS_WHAT_DESTROY:
4747 if (*pszGroup || *pszFlags || *pszDest)
4748 return VERR_INVALID_PARAMETER;
4749 if (pReq->u.In.fWhich == SUPLOGGERSETTINGS_WHICH_RELEASE)
4750 return VERR_ACCESS_DENIED;
4751 break;
4752
4753 default:
4754 return VERR_INTERNAL_ERROR;
4755 }
4756
4757 /*
4758 * Get the logger.
4759 */
4760 switch (pReq->u.In.fWhich)
4761 {
4762 case SUPLOGGERSETTINGS_WHICH_DEBUG:
4763 pLogger = RTLogGetDefaultInstance();
4764 break;
4765
4766 case SUPLOGGERSETTINGS_WHICH_RELEASE:
4767 pLogger = RTLogRelDefaultInstance();
4768 break;
4769
4770 default:
4771 return VERR_INTERNAL_ERROR;
4772 }
4773
4774 /*
4775 * Do the job.
4776 */
4777 switch (pReq->u.In.fWhat)
4778 {
4779 case SUPLOGGERSETTINGS_WHAT_SETTINGS:
4780 if (pLogger)
4781 {
4782 rc = RTLogFlags(pLogger, pszFlags);
4783 if (RT_SUCCESS(rc))
4784 rc = RTLogGroupSettings(pLogger, pszGroup);
4785 NOREF(pszDest);
4786 }
4787 else
4788 rc = VERR_NOT_FOUND;
4789 break;
4790
4791 case SUPLOGGERSETTINGS_WHAT_CREATE:
4792 {
4793 if (pLogger)
4794 rc = VERR_ALREADY_EXISTS;
4795 else
4796 {
4797 static const char * const s_apszGroups[] = VBOX_LOGGROUP_NAMES;
4798
4799 rc = RTLogCreate(&pLogger,
4800 0 /* fFlags */,
4801 pszGroup,
4802 pReq->u.In.fWhich == SUPLOGGERSETTINGS_WHICH_DEBUG
4803 ? "VBOX_LOG"
4804 : "VBOX_RELEASE_LOG",
4805 RT_ELEMENTS(s_apszGroups),
4806 s_apszGroups,
4807 RTLOGDEST_STDOUT | RTLOGDEST_DEBUGGER,
4808 NULL);
4809 if (RT_SUCCESS(rc))
4810 {
4811 rc = RTLogFlags(pLogger, pszFlags);
4812 NOREF(pszDest);
4813 if (RT_SUCCESS(rc))
4814 {
4815 switch (pReq->u.In.fWhich)
4816 {
4817 case SUPLOGGERSETTINGS_WHICH_DEBUG:
4818 pLogger = RTLogSetDefaultInstance(pLogger);
4819 break;
4820 case SUPLOGGERSETTINGS_WHICH_RELEASE:
4821 pLogger = RTLogRelSetDefaultInstance(pLogger);
4822 break;
4823 }
4824 }
4825 RTLogDestroy(pLogger);
4826 }
4827 }
4828 break;
4829 }
4830
4831 case SUPLOGGERSETTINGS_WHAT_DESTROY:
4832 switch (pReq->u.In.fWhich)
4833 {
4834 case SUPLOGGERSETTINGS_WHICH_DEBUG:
4835 pLogger = RTLogSetDefaultInstance(NULL);
4836 break;
4837 case SUPLOGGERSETTINGS_WHICH_RELEASE:
4838 pLogger = RTLogRelSetDefaultInstance(NULL);
4839 break;
4840 }
4841 rc = RTLogDestroy(pLogger);
4842 break;
4843
4844 default:
4845 {
4846 rc = VERR_INTERNAL_ERROR;
4847 break;
4848 }
4849 }
4850
4851 return rc;
4852}
4853
4854
4855/**
4856 * Creates the GIP.
4857 *
4858 * @returns VBox status code.
4859 * @param pDevExt Instance data. GIP stuff may be updated.
4860 */
4861static int supdrvGipCreate(PSUPDRVDEVEXT pDevExt)
4862{
4863 PSUPGLOBALINFOPAGE pGip;
4864 RTHCPHYS HCPhysGip;
4865 uint32_t u32SystemResolution;
4866 uint32_t u32Interval;
4867 unsigned cCpus;
4868 int rc;
4869
4870
4871 LogFlow(("supdrvGipCreate:\n"));
4872
4873 /* assert order */
4874 Assert(pDevExt->u32SystemTimerGranularityGrant == 0);
4875 Assert(pDevExt->GipMemObj == NIL_RTR0MEMOBJ);
4876 Assert(!pDevExt->pGipTimer);
4877
4878 /*
4879 * Check the CPU count.
4880 */
4881 cCpus = RTMpGetArraySize();
4882 if ( cCpus > RTCPUSET_MAX_CPUS
4883 || cCpus > 256 /*ApicId is used for the mappings*/)
4884 {
4885 SUPR0Printf("VBoxDrv: Too many CPUs (%u) for the GIP (max %u)\n", cCpus, RT_MIN(RTCPUSET_MAX_CPUS, 256));
4886 return VERR_TOO_MANY_CPUS;
4887 }
4888
4889 /*
4890 * Allocate a contiguous set of pages with a default kernel mapping.
4891 */
4892 rc = RTR0MemObjAllocCont(&pDevExt->GipMemObj, RT_UOFFSETOF(SUPGLOBALINFOPAGE, aCPUs[cCpus]), false /*fExecutable*/);
4893 if (RT_FAILURE(rc))
4894 {
4895 OSDBGPRINT(("supdrvGipCreate: failed to allocate the GIP page. rc=%d\n", rc));
4896 return rc;
4897 }
4898 pGip = (PSUPGLOBALINFOPAGE)RTR0MemObjAddress(pDevExt->GipMemObj); AssertPtr(pGip);
4899 HCPhysGip = RTR0MemObjGetPagePhysAddr(pDevExt->GipMemObj, 0); Assert(HCPhysGip != NIL_RTHCPHYS);
4900
4901 /*
4902 * Find a reasonable update interval and initialize the structure.
4903 */
4904 u32Interval = u32SystemResolution = RTTimerGetSystemGranularity();
4905 while (u32Interval < 10000000 /* 10 ms */)
4906 u32Interval += u32SystemResolution;
4907
4908 supdrvGipInit(pDevExt, pGip, HCPhysGip, RTTimeSystemNanoTS(), 1000000000 / u32Interval /*=Hz*/, cCpus);
4909
4910 rc = RTSpinlockCreate(&pGip->Spinlock);
4911 if (RT_FAILURE(rc))
4912 {
4913 supdrvGipDestroy(pDevExt);
4914 return rc;
4915 }
4916
4917 /*
4918 * Create the timer.
4919 * If CPU_ALL isn't supported we'll have to fall back to synchronous mode.
4920 */
4921 if (pGip->u32Mode == SUPGIPMODE_ASYNC_TSC)
4922 {
4923 rc = RTTimerCreateEx(&pDevExt->pGipTimer, u32Interval, RTTIMER_FLAGS_CPU_ALL, supdrvGipAsyncTimer, pDevExt);
4924 if (rc == VERR_NOT_SUPPORTED)
4925 {
4926 OSDBGPRINT(("supdrvGipCreate: omni timer not supported, falling back to synchronous mode\n"));
4927 pGip->u32Mode = SUPGIPMODE_SYNC_TSC;
4928 }
4929 }
4930 if (pGip->u32Mode != SUPGIPMODE_ASYNC_TSC)
4931 rc = RTTimerCreateEx(&pDevExt->pGipTimer, u32Interval, 0, supdrvGipSyncTimer, pDevExt);
4932 if (RT_SUCCESS(rc))
4933 {
4934 rc = RTMpNotificationRegister(supdrvGipMpEvent, pDevExt);
4935 if (RT_SUCCESS(rc))
4936 {
4937 rc = RTMpOnAll(supdrvGipInitOnCpu, pDevExt, pGip);
4938 if (RT_SUCCESS(rc))
4939 {
4940 /*
4941 * We're good.
4942 */
4943 Log(("supdrvGipCreate: %u ns interval.\n", u32Interval));
4944 g_pSUPGlobalInfoPage = pGip;
4945 return VINF_SUCCESS;
4946 }
4947
4948 OSDBGPRINT(("supdrvGipCreate: RTMpOnAll failed with rc=%Rrc\n", rc));
4949 RTMpNotificationDeregister(supdrvGipMpEvent, pDevExt);
4950
4951 }
4952 else
4953 OSDBGPRINT(("supdrvGipCreate: failed to register MP event notfication. rc=%Rrc\n", rc));
4954 }
4955 else
4956 {
4957 OSDBGPRINT(("supdrvGipCreate: failed create GIP timer at %u ns interval. rc=%Rrc\n", u32Interval, rc));
4958 Assert(!pDevExt->pGipTimer);
4959 }
4960 supdrvGipDestroy(pDevExt);
4961 return rc;
4962}
4963
4964
4965/**
4966 * Terminates the GIP.
4967 *
4968 * @param pDevExt Instance data. GIP stuff may be updated.
4969 */
4970static void supdrvGipDestroy(PSUPDRVDEVEXT pDevExt)
4971{
4972 int rc;
4973#ifdef DEBUG_DARWIN_GIP
4974 OSDBGPRINT(("supdrvGipDestroy: pDevExt=%p pGip=%p pGipTimer=%p GipMemObj=%p\n", pDevExt,
4975 pDevExt->GipMemObj != NIL_RTR0MEMOBJ ? RTR0MemObjAddress(pDevExt->GipMemObj) : NULL,
4976 pDevExt->pGipTimer, pDevExt->GipMemObj));
4977#endif
4978
4979 /*
4980 * Invalid the GIP data.
4981 */
4982 if (pDevExt->pGip)
4983 {
4984 supdrvGipTerm(pDevExt->pGip);
4985 if (pDevExt->pGip->Spinlock)
4986 {
4987 RTSpinlockDestroy(pDevExt->pGip->Spinlock);
4988 pDevExt->pGip->Spinlock = NIL_RTSPINLOCK;
4989 }
4990
4991 pDevExt->pGip = NULL;
4992 }
4993 g_pSUPGlobalInfoPage = NULL;
4994
4995 /*
4996 * Destroy the timer and free the GIP memory object.
4997 */
4998 if (pDevExt->pGipTimer)
4999 {
5000 rc = RTTimerDestroy(pDevExt->pGipTimer); AssertRC(rc);
5001 pDevExt->pGipTimer = NULL;
5002 }
5003
5004 if (pDevExt->GipMemObj != NIL_RTR0MEMOBJ)
5005 {
5006 rc = RTR0MemObjFree(pDevExt->GipMemObj, true /* free mappings */); AssertRC(rc);
5007 pDevExt->GipMemObj = NIL_RTR0MEMOBJ;
5008 }
5009
5010 /*
5011 * Finally, make sure we've release the system timer resolution request
5012 * if one actually succeeded and is still pending.
5013 */
5014 if (pDevExt->u32SystemTimerGranularityGrant)
5015 {
5016 rc = RTTimerReleaseSystemGranularity(pDevExt->u32SystemTimerGranularityGrant); AssertRC(rc);
5017 pDevExt->u32SystemTimerGranularityGrant = 0;
5018 }
5019}
5020
5021
5022/**
5023 * Timer callback function sync GIP mode.
5024 * @param pTimer The timer.
5025 * @param pvUser The device extension.
5026 */
5027static DECLCALLBACK(void) supdrvGipSyncTimer(PRTTIMER pTimer, void *pvUser, uint64_t iTick)
5028{
5029 RTCCUINTREG fOldFlags = ASMIntDisableFlags(); /* No interruptions please (real problem on S10). */
5030 PSUPDRVDEVEXT pDevExt = (PSUPDRVDEVEXT)pvUser;
5031 uint64_t u64TSC = ASMReadTSC();
5032 uint64_t NanoTS = RTTimeSystemNanoTS();
5033
5034 supdrvGipUpdate(pDevExt->pGip, NanoTS, u64TSC, NIL_RTCPUID, iTick);
5035
5036 ASMSetFlags(fOldFlags);
5037}
5038
5039
5040/**
5041 * Timer callback function for async GIP mode.
5042 * @param pTimer The timer.
5043 * @param pvUser The device extension.
5044 */
5045static DECLCALLBACK(void) supdrvGipAsyncTimer(PRTTIMER pTimer, void *pvUser, uint64_t iTick)
5046{
5047 RTCCUINTREG fOldFlags = ASMIntDisableFlags(); /* No interruptions please (real problem on S10). */
5048 PSUPDRVDEVEXT pDevExt = (PSUPDRVDEVEXT)pvUser;
5049 RTCPUID idCpu = RTMpCpuId();
5050 uint64_t u64TSC = ASMReadTSC();
5051 uint64_t NanoTS = RTTimeSystemNanoTS();
5052
5053 /** @todo reset the transaction number and whatnot when iTick == 1. */
5054 if (pDevExt->idGipMaster == idCpu)
5055 supdrvGipUpdate(pDevExt->pGip, NanoTS, u64TSC, idCpu, iTick);
5056 else
5057 supdrvGipUpdatePerCpu(pDevExt->pGip, NanoTS, u64TSC, idCpu, ASMGetApicId(), iTick);
5058
5059 ASMSetFlags(fOldFlags);
5060}
5061
5062
5063/**
5064 * Finds our (@a idCpu) entry, or allocates a new one if not found.
5065 *
5066 * @returns Index of the CPU in the cache set.
5067 * @param pGip The GIP.
5068 * @param idCpu The CPU ID.
5069 */
5070static uint32_t supdrvGipCpuIndexFromCpuId(PSUPGLOBALINFOPAGE pGip, RTCPUID idCpu)
5071{
5072 uint32_t i, cTries;
5073
5074 /*
5075 * ASSUMES that CPU IDs are constant.
5076 */
5077 for (i = 0; i < pGip->cCpus; i++)
5078 if (pGip->aCPUs[i].idCpu == idCpu)
5079 return i;
5080
5081 cTries = 0;
5082 do
5083 {
5084 for (i = 0; i < pGip->cCpus; i++)
5085 {
5086 bool fRc;
5087 ASMAtomicCmpXchgSize(&pGip->aCPUs[i].idCpu, idCpu, NIL_RTCPUID, fRc);
5088 if (fRc)
5089 return i;
5090 }
5091 } while (cTries++ < 32);
5092 AssertReleaseFailed();
5093 return i - 1;
5094}
5095
5096
5097/**
5098 * The calling CPU should be accounted as online, update GIP accordingly.
5099 *
5100 * This is used by supdrvGipMpEvent as well as the supdrvGipCreate.
5101 *
5102 * @param pGip The GIP.
5103 * @param idCpu The CPU ID.
5104 */
5105static void supdrvGipMpEventOnline(PSUPGLOBALINFOPAGE pGip, RTCPUID idCpu)
5106{
5107 int iCpuSet = 0;
5108 uint16_t idApic = UINT16_MAX;
5109 uint32_t i = 0;
5110 uint64_t u64NanoTS = 0;
5111 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
5112
5113 AssertRelease(idCpu == RTMpCpuId());
5114 Assert(pGip->cPossibleCpus == RTMpGetCount());
5115
5116 /*
5117 * Do this behind a spinlock with interrupts disabled as this can fire
5118 * on all CPUs simultaneously, see #6110.
5119 */
5120 RTSpinlockAcquireNoInts(pGip->Spinlock, &SpinlockTmp);
5121
5122 /*
5123 * Update the globals.
5124 */
5125 ASMAtomicWriteU16(&pGip->cPresentCpus, RTMpGetPresentCount());
5126 ASMAtomicWriteU16(&pGip->cOnlineCpus, RTMpGetOnlineCount());
5127 iCpuSet = RTMpCpuIdToSetIndex(idCpu);
5128 if (iCpuSet >= 0)
5129 {
5130 Assert(RTCpuSetIsMemberByIndex(&pGip->PossibleCpuSet, iCpuSet));
5131 RTCpuSetAddByIndex(&pGip->OnlineCpuSet, iCpuSet);
5132 RTCpuSetAddByIndex(&pGip->PresentCpuSet, iCpuSet);
5133 }
5134
5135 /*
5136 * Update the entry.
5137 */
5138 u64NanoTS = RTTimeSystemNanoTS() - pGip->u32UpdateIntervalNS;
5139 i = supdrvGipCpuIndexFromCpuId(pGip, idCpu);
5140 supdrvGipInitCpu(pGip, &pGip->aCPUs[i], u64NanoTS);
5141 idApic = ASMGetApicId();
5142 ASMAtomicWriteU16(&pGip->aCPUs[i].idApic, idApic);
5143 ASMAtomicWriteS16(&pGip->aCPUs[i].iCpuSet, (int16_t)iCpuSet);
5144 ASMAtomicWriteSize(&pGip->aCPUs[i].idCpu, idCpu);
5145
5146 /*
5147 * Update the APIC ID and CPU set index mappings.
5148 */
5149 ASMAtomicWriteU16(&pGip->aiCpuFromApicId[idApic], i);
5150 ASMAtomicWriteU16(&pGip->aiCpuFromCpuSetIdx[iCpuSet], i);
5151
5152 /* commit it */
5153 ASMAtomicWriteSize(&pGip->aCPUs[i].enmState, SUPGIPCPUSTATE_ONLINE);
5154
5155 RTSpinlockReleaseNoInts(pGip->Spinlock, &SpinlockTmp);
5156}
5157
5158
5159/**
5160 * The CPU should be accounted as offline, update the GIP accordingly.
5161 *
5162 * This is used by supdrvGipMpEvent.
5163 *
5164 * @param pGip The GIP.
5165 * @param idCpu The CPU ID.
5166 */
5167static void supdrvGipMpEventOffline(PSUPGLOBALINFOPAGE pGip, RTCPUID idCpu)
5168{
5169 int iCpuSet;
5170 unsigned i;
5171
5172 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
5173 RTSpinlockAcquireNoInts(pGip->Spinlock, &SpinlockTmp);
5174
5175 iCpuSet = RTMpCpuIdToSetIndex(idCpu);
5176 AssertReturnVoid(iCpuSet >= 0);
5177
5178 i = pGip->aiCpuFromCpuSetIdx[iCpuSet];
5179 AssertReturnVoid(i < pGip->cCpus);
5180 AssertReturnVoid(pGip->aCPUs[i].idCpu == idCpu);
5181
5182 Assert(RTCpuSetIsMemberByIndex(&pGip->PossibleCpuSet, iCpuSet));
5183 RTCpuSetDelByIndex(&pGip->OnlineCpuSet, iCpuSet);
5184
5185 /* commit it */
5186 ASMAtomicWriteSize(&pGip->aCPUs[i].enmState, SUPGIPCPUSTATE_OFFLINE);
5187
5188 RTSpinlockReleaseNoInts(pGip->Spinlock, &SpinlockTmp);
5189}
5190
5191
5192/**
5193 * Multiprocessor event notification callback.
5194 *
5195 * This is used to make sure that the GIP master gets passed on to
5196 * another CPU. It also updates the associated CPU data.
5197 *
5198 * @param enmEvent The event.
5199 * @param idCpu The cpu it applies to.
5200 * @param pvUser Pointer to the device extension.
5201 *
5202 * @remarks This function -must- fire on the newly online'd CPU for the
5203 * RTMPEVENT_ONLINE case and can fire on any CPU for the
5204 * RTMPEVENT_OFFLINE case.
5205 */
5206static DECLCALLBACK(void) supdrvGipMpEvent(RTMPEVENT enmEvent, RTCPUID idCpu, void *pvUser)
5207{
5208 PSUPDRVDEVEXT pDevExt = (PSUPDRVDEVEXT)pvUser;
5209 PSUPGLOBALINFOPAGE pGip = pDevExt->pGip;
5210
5211 AssertRelease(!RTThreadPreemptIsEnabled(NIL_RTTHREAD));
5212
5213 /*
5214 * Update the GIP CPU data.
5215 */
5216 if (pGip)
5217 {
5218 switch (enmEvent)
5219 {
5220 case RTMPEVENT_ONLINE:
5221 AssertRelease(idCpu == RTMpCpuId());
5222 supdrvGipMpEventOnline(pGip, idCpu);
5223 break;
5224 case RTMPEVENT_OFFLINE:
5225 supdrvGipMpEventOffline(pGip, idCpu);
5226 break;
5227
5228 }
5229 }
5230
5231 /*
5232 * Make sure there is a master GIP.
5233 */
5234 if (enmEvent == RTMPEVENT_OFFLINE)
5235 {
5236 RTCPUID idGipMaster = ASMAtomicReadU32(&pDevExt->idGipMaster);
5237 if (idGipMaster == idCpu)
5238 {
5239 /*
5240 * Find a new GIP master.
5241 */
5242 bool fIgnored;
5243 unsigned i;
5244 RTCPUID idNewGipMaster = NIL_RTCPUID;
5245 RTCPUSET OnlineCpus;
5246 RTMpGetOnlineSet(&OnlineCpus);
5247
5248 for (i = 0; i < RTCPUSET_MAX_CPUS; i++)
5249 {
5250 RTCPUID idCurCpu = RTMpCpuIdFromSetIndex(i);
5251 if ( RTCpuSetIsMember(&OnlineCpus, idCurCpu)
5252 && idCurCpu != idGipMaster)
5253 {
5254 idNewGipMaster = idCurCpu;
5255 break;
5256 }
5257 }
5258
5259 Log(("supdrvGipMpEvent: Gip master %#lx -> %#lx\n", (long)idGipMaster, (long)idNewGipMaster));
5260 ASMAtomicCmpXchgSize(&pDevExt->idGipMaster, idNewGipMaster, idGipMaster, fIgnored);
5261 NOREF(fIgnored);
5262 }
5263 }
5264}
5265
5266
5267/**
5268 * Callback used by supdrvDetermineAsyncTSC to read the TSC on a CPU.
5269 *
5270 * @param idCpu Ignored.
5271 * @param pvUser1 Where to put the TSC.
5272 * @param pvUser2 Ignored.
5273 */
5274static DECLCALLBACK(void) supdrvDetermineAsyncTscWorker(RTCPUID idCpu, void *pvUser1, void *pvUser2)
5275{
5276#if 1
5277 ASMAtomicWriteU64((uint64_t volatile *)pvUser1, ASMReadTSC());
5278#else
5279 *(uint64_t *)pvUser1 = ASMReadTSC();
5280#endif
5281}
5282
5283
5284/**
5285 * Determine if Async GIP mode is required because of TSC drift.
5286 *
5287 * When using the default/normal timer code it is essential that the time stamp counter
5288 * (TSC) runs never backwards, that is, a read operation to the counter should return
5289 * a bigger value than any previous read operation. This is guaranteed by the latest
5290 * AMD CPUs and by newer Intel CPUs which never enter the C2 state (P4). In any other
5291 * case we have to choose the asynchronous timer mode.
5292 *
5293 * @param poffMin Pointer to the determined difference between different cores.
5294 * @return false if the time stamp counters appear to be synchronized, true otherwise.
5295 */
5296static bool supdrvDetermineAsyncTsc(uint64_t *poffMin)
5297{
5298 /*
5299 * Just iterate all the cpus 8 times and make sure that the TSC is
5300 * ever increasing. We don't bother taking TSC rollover into account.
5301 */
5302 int iEndCpu = RTMpGetArraySize();
5303 int iCpu;
5304 int cLoops = 8;
5305 bool fAsync = false;
5306 int rc = VINF_SUCCESS;
5307 uint64_t offMax = 0;
5308 uint64_t offMin = ~(uint64_t)0;
5309 uint64_t PrevTsc = ASMReadTSC();
5310
5311 while (cLoops-- > 0)
5312 {
5313 for (iCpu = 0; iCpu < iEndCpu; iCpu++)
5314 {
5315 uint64_t CurTsc;
5316 rc = RTMpOnSpecific(RTMpCpuIdFromSetIndex(iCpu), supdrvDetermineAsyncTscWorker, &CurTsc, NULL);
5317 if (RT_SUCCESS(rc))
5318 {
5319 if (CurTsc <= PrevTsc)
5320 {
5321 fAsync = true;
5322 offMin = offMax = PrevTsc - CurTsc;
5323 Log(("supdrvDetermineAsyncTsc: iCpu=%d cLoops=%d CurTsc=%llx PrevTsc=%llx\n",
5324 iCpu, cLoops, CurTsc, PrevTsc));
5325 break;
5326 }
5327
5328 /* Gather statistics (except the first time). */
5329 if (iCpu != 0 || cLoops != 7)
5330 {
5331 uint64_t off = CurTsc - PrevTsc;
5332 if (off < offMin)
5333 offMin = off;
5334 if (off > offMax)
5335 offMax = off;
5336 Log2(("%d/%d: off=%llx\n", cLoops, iCpu, off));
5337 }
5338
5339 /* Next */
5340 PrevTsc = CurTsc;
5341 }
5342 else if (rc == VERR_NOT_SUPPORTED)
5343 break;
5344 else
5345 AssertMsg(rc == VERR_CPU_NOT_FOUND || rc == VERR_CPU_OFFLINE, ("%d\n", rc));
5346 }
5347
5348 /* broke out of the loop. */
5349 if (iCpu < iEndCpu)
5350 break;
5351 }
5352
5353 *poffMin = offMin; /* Almost RTMpOnSpecific profiling. */
5354 Log(("supdrvDetermineAsyncTsc: returns %d; iEndCpu=%d rc=%d offMin=%llx offMax=%llx\n",
5355 fAsync, iEndCpu, rc, offMin, offMax));
5356#if !defined(RT_OS_SOLARIS) && !defined(RT_OS_OS2) && !defined(RT_OS_WINDOWS)
5357 OSDBGPRINT(("vboxdrv: fAsync=%d offMin=%#lx offMax=%#lx\n", fAsync, (long)offMin, (long)offMax));
5358#endif
5359 return fAsync;
5360}
5361
5362
5363/**
5364 * Determine the GIP TSC mode.
5365 *
5366 * @returns The most suitable TSC mode.
5367 * @param pDevExt Pointer to the device instance data.
5368 */
5369static SUPGIPMODE supdrvGipDeterminTscMode(PSUPDRVDEVEXT pDevExt)
5370{
5371 /*
5372 * On SMP we're faced with two problems:
5373 * (1) There might be a skew between the CPU, so that cpu0
5374 * returns a TSC that is slightly different from cpu1.
5375 * (2) Power management (and other things) may cause the TSC
5376 * to run at a non-constant speed, and cause the speed
5377 * to be different on the cpus. This will result in (1).
5378 *
5379 * So, on SMP systems we'll have to select the ASYNC update method
5380 * if there are symptoms of these problems.
5381 */
5382 if (RTMpGetCount() > 1)
5383 {
5384 uint32_t uEAX, uEBX, uECX, uEDX;
5385 uint64_t u64DiffCoresIgnored;
5386
5387 /* Permit the user and/or the OS specific bits to force async mode. */
5388 if (supdrvOSGetForcedAsyncTscMode(pDevExt))
5389 return SUPGIPMODE_ASYNC_TSC;
5390
5391 /* Try check for current differences between the cpus. */
5392 if (supdrvDetermineAsyncTsc(&u64DiffCoresIgnored))
5393 return SUPGIPMODE_ASYNC_TSC;
5394
5395 /*
5396 * If the CPU supports power management and is an AMD one we
5397 * won't trust it unless it has the TscInvariant bit is set.
5398 */
5399 /* Check for "AuthenticAMD" */
5400 ASMCpuId(0, &uEAX, &uEBX, &uECX, &uEDX);
5401 if ( uEAX >= 1
5402 && uEBX == X86_CPUID_VENDOR_AMD_EBX
5403 && uECX == X86_CPUID_VENDOR_AMD_ECX
5404 && uEDX == X86_CPUID_VENDOR_AMD_EDX)
5405 {
5406 /* Check for APM support and that TscInvariant is cleared. */
5407 ASMCpuId(0x80000000, &uEAX, &uEBX, &uECX, &uEDX);
5408 if (uEAX >= 0x80000007)
5409 {
5410 ASMCpuId(0x80000007, &uEAX, &uEBX, &uECX, &uEDX);
5411 if ( !(uEDX & RT_BIT(8))/* TscInvariant */
5412 && (uEDX & 0x3e)) /* STC|TM|THERMTRIP|VID|FID. Ignore TS. */
5413 return SUPGIPMODE_ASYNC_TSC;
5414 }
5415 }
5416 }
5417 return SUPGIPMODE_SYNC_TSC;
5418}
5419
5420
5421/**
5422 * Initializes per-CPU GIP information.
5423 *
5424 * @param pGip Pointer to the read-write kernel mapping of the GIP.
5425 * @param pCpu Pointer to which GIP CPU to initalize.
5426 * @param u64NanoTS The current nanosecond timestamp.
5427 */
5428static void supdrvGipInitCpu(PSUPGLOBALINFOPAGE pGip, PSUPGIPCPU pCpu, uint64_t u64NanoTS)
5429{
5430 pCpu->u32TransactionId = 2;
5431 pCpu->u64NanoTS = u64NanoTS;
5432 pCpu->u64TSC = ASMReadTSC();
5433
5434 ASMAtomicWriteSize(&pCpu->enmState, SUPGIPCPUSTATE_INVALID);
5435 ASMAtomicWriteSize(&pCpu->idCpu, NIL_RTCPUID);
5436 ASMAtomicWriteS16(&pCpu->iCpuSet, -1);
5437 ASMAtomicWriteU16(&pCpu->idApic, UINT16_MAX);
5438
5439 /*
5440 * We don't know the following values until we've executed updates.
5441 * So, we'll just pretend it's a 4 GHz CPU and adjust the history it on
5442 * the 2nd timer callout.
5443 */
5444 pCpu->u64CpuHz = _4G + 1; /* tstGIP-2 depends on this. */
5445 pCpu->u32UpdateIntervalTSC
5446 = pCpu->au32TSCHistory[0]
5447 = pCpu->au32TSCHistory[1]
5448 = pCpu->au32TSCHistory[2]
5449 = pCpu->au32TSCHistory[3]
5450 = pCpu->au32TSCHistory[4]
5451 = pCpu->au32TSCHistory[5]
5452 = pCpu->au32TSCHistory[6]
5453 = pCpu->au32TSCHistory[7]
5454 = (uint32_t)(_4G / pGip->u32UpdateHz);
5455}
5456
5457
5458/**
5459 * Initializes the GIP data.
5460 *
5461 * @param pDevExt Pointer to the device instance data.
5462 * @param pGip Pointer to the read-write kernel mapping of the GIP.
5463 * @param HCPhys The physical address of the GIP.
5464 * @param u64NanoTS The current nanosecond timestamp.
5465 * @param uUpdateHz The update frequency.
5466 * @param cCpus The CPU count.
5467 */
5468static void supdrvGipInit(PSUPDRVDEVEXT pDevExt, PSUPGLOBALINFOPAGE pGip, RTHCPHYS HCPhys,
5469 uint64_t u64NanoTS, unsigned uUpdateHz, unsigned cCpus)
5470{
5471 size_t const cbGip = RT_ALIGN_Z(RT_OFFSETOF(SUPGLOBALINFOPAGE, aCPUs[cCpus]), PAGE_SIZE);
5472 unsigned i;
5473#ifdef DEBUG_DARWIN_GIP
5474 OSDBGPRINT(("supdrvGipInit: pGip=%p HCPhys=%lx u64NanoTS=%llu uUpdateHz=%d cCpus=%u\n", pGip, (long)HCPhys, u64NanoTS, uUpdateHz, cCpus));
5475#else
5476 LogFlow(("supdrvGipInit: pGip=%p HCPhys=%lx u64NanoTS=%llu uUpdateHz=%d cCpus=%u\n", pGip, (long)HCPhys, u64NanoTS, uUpdateHz, cCpus));
5477#endif
5478
5479 /*
5480 * Initialize the structure.
5481 */
5482 memset(pGip, 0, cbGip);
5483 pGip->u32Magic = SUPGLOBALINFOPAGE_MAGIC;
5484 pGip->u32Version = SUPGLOBALINFOPAGE_VERSION;
5485 pGip->u32Mode = supdrvGipDeterminTscMode(pDevExt);
5486 pGip->cCpus = (uint16_t)cCpus;
5487 pGip->cPages = (uint16_t)(cbGip / PAGE_SIZE);
5488 pGip->u32UpdateHz = uUpdateHz;
5489 pGip->u32UpdateIntervalNS = 1000000000 / uUpdateHz;
5490 pGip->u64NanoTSLastUpdateHz = u64NanoTS;
5491 RTCpuSetEmpty(&pGip->OnlineCpuSet);
5492 RTCpuSetEmpty(&pGip->PresentCpuSet);
5493 RTMpGetSet(&pGip->PossibleCpuSet);
5494 pGip->cOnlineCpus = RTMpGetOnlineCount();
5495 pGip->cPresentCpus = RTMpGetPresentCount();
5496 pGip->cPossibleCpus = RTMpGetCount();
5497 pGip->idCpuMax = RTMpGetMaxCpuId();
5498 pGip->Spinlock = NULL;
5499 for (i = 0; i < RT_ELEMENTS(pGip->aiCpuFromApicId); i++)
5500 pGip->aiCpuFromApicId[i] = 0;
5501 for (i = 0; i < RT_ELEMENTS(pGip->aiCpuFromCpuSetIdx); i++)
5502 pGip->aiCpuFromCpuSetIdx[i] = UINT16_MAX;
5503
5504 for (i = 0; i < cCpus; i++)
5505 supdrvGipInitCpu(pGip, &pGip->aCPUs[i], u64NanoTS);
5506
5507 /*
5508 * Link it to the device extension.
5509 */
5510 pDevExt->pGip = pGip;
5511 pDevExt->HCPhysGip = HCPhys;
5512 pDevExt->cGipUsers = 0;
5513}
5514
5515
5516/**
5517 * On CPU initialization callback for RTMpOnAll.
5518 *
5519 * @param idCpu The CPU ID.
5520 * @param pvUser1 The device extension.
5521 * @param pvUser2 The GIP.
5522 */
5523static DECLCALLBACK(void) supdrvGipInitOnCpu(RTCPUID idCpu, void *pvUser1, void *pvUser2)
5524{
5525 /* This is good enough, even though it will update some of the globals a
5526 bit to much. */
5527 supdrvGipMpEventOnline((PSUPGLOBALINFOPAGE)pvUser2, idCpu);
5528}
5529
5530
5531/**
5532 * Invalidates the GIP data upon termination.
5533 *
5534 * @param pGip Pointer to the read-write kernel mapping of the GIP.
5535 */
5536static void supdrvGipTerm(PSUPGLOBALINFOPAGE pGip)
5537{
5538 unsigned i;
5539 pGip->u32Magic = 0;
5540 for (i = 0; i < RT_ELEMENTS(pGip->aCPUs); i++)
5541 {
5542 pGip->aCPUs[i].u64NanoTS = 0;
5543 pGip->aCPUs[i].u64TSC = 0;
5544 pGip->aCPUs[i].iTSCHistoryHead = 0;
5545 }
5546}
5547
5548
5549/**
5550 * Worker routine for supdrvGipUpdate and supdrvGipUpdatePerCpu that
5551 * updates all the per cpu data except the transaction id.
5552 *
5553 * @param pGip The GIP.
5554 * @param pGipCpu Pointer to the per cpu data.
5555 * @param u64NanoTS The current time stamp.
5556 * @param u64TSC The current TSC.
5557 * @param iTick The current timer tick.
5558 */
5559static void supdrvGipDoUpdateCpu(PSUPGLOBALINFOPAGE pGip, PSUPGIPCPU pGipCpu, uint64_t u64NanoTS, uint64_t u64TSC, uint64_t iTick)
5560{
5561 uint64_t u64TSCDelta;
5562 uint32_t u32UpdateIntervalTSC;
5563 uint32_t u32UpdateIntervalTSCSlack;
5564 unsigned iTSCHistoryHead;
5565 uint64_t u64CpuHz;
5566 uint32_t u32TransactionId;
5567
5568 /* Delta between this and the previous update. */
5569 ASMAtomicUoWriteU32(&pGipCpu->u32PrevUpdateIntervalNS, (uint32_t)(u64NanoTS - pGipCpu->u64NanoTS));
5570
5571 /*
5572 * Update the NanoTS.
5573 */
5574 ASMAtomicWriteU64(&pGipCpu->u64NanoTS, u64NanoTS);
5575
5576 /*
5577 * Calc TSC delta.
5578 */
5579 /** @todo validate the NanoTS delta, don't trust the OS to call us when it should... */
5580 u64TSCDelta = u64TSC - pGipCpu->u64TSC;
5581 ASMAtomicWriteU64(&pGipCpu->u64TSC, u64TSC);
5582
5583 if (u64TSCDelta >> 32)
5584 {
5585 u64TSCDelta = pGipCpu->u32UpdateIntervalTSC;
5586 pGipCpu->cErrors++;
5587 }
5588
5589 /*
5590 * On the 2nd and 3rd callout, reset the history with the current TSC
5591 * interval since the values entered by supdrvGipInit are totally off.
5592 * The interval on the 1st callout completely unreliable, the 2nd is a bit
5593 * better, while the 3rd should be most reliable.
5594 */
5595 u32TransactionId = pGipCpu->u32TransactionId;
5596 if (RT_UNLIKELY( ( u32TransactionId == 5
5597 || u32TransactionId == 7)
5598 && ( iTick == 2
5599 || iTick == 3) ))
5600 {
5601 unsigned i;
5602 for (i = 0; i < RT_ELEMENTS(pGipCpu->au32TSCHistory); i++)
5603 ASMAtomicUoWriteU32(&pGipCpu->au32TSCHistory[i], (uint32_t)u64TSCDelta);
5604 }
5605
5606 /*
5607 * TSC History.
5608 */
5609 Assert(RT_ELEMENTS(pGipCpu->au32TSCHistory) == 8);
5610 iTSCHistoryHead = (pGipCpu->iTSCHistoryHead + 1) & 7;
5611 ASMAtomicWriteU32(&pGipCpu->iTSCHistoryHead, iTSCHistoryHead);
5612 ASMAtomicWriteU32(&pGipCpu->au32TSCHistory[iTSCHistoryHead], (uint32_t)u64TSCDelta);
5613
5614 /*
5615 * UpdateIntervalTSC = average of last 8,2,1 intervals depending on update HZ.
5616 */
5617 if (pGip->u32UpdateHz >= 1000)
5618 {
5619 uint32_t u32;
5620 u32 = pGipCpu->au32TSCHistory[0];
5621 u32 += pGipCpu->au32TSCHistory[1];
5622 u32 += pGipCpu->au32TSCHistory[2];
5623 u32 += pGipCpu->au32TSCHistory[3];
5624 u32 >>= 2;
5625 u32UpdateIntervalTSC = pGipCpu->au32TSCHistory[4];
5626 u32UpdateIntervalTSC += pGipCpu->au32TSCHistory[5];
5627 u32UpdateIntervalTSC += pGipCpu->au32TSCHistory[6];
5628 u32UpdateIntervalTSC += pGipCpu->au32TSCHistory[7];
5629 u32UpdateIntervalTSC >>= 2;
5630 u32UpdateIntervalTSC += u32;
5631 u32UpdateIntervalTSC >>= 1;
5632
5633 /* Value chosen for a 2GHz Athlon64 running linux 2.6.10/11, . */
5634 u32UpdateIntervalTSCSlack = u32UpdateIntervalTSC >> 14;
5635 }
5636 else if (pGip->u32UpdateHz >= 90)
5637 {
5638 u32UpdateIntervalTSC = (uint32_t)u64TSCDelta;
5639 u32UpdateIntervalTSC += pGipCpu->au32TSCHistory[(iTSCHistoryHead - 1) & 7];
5640 u32UpdateIntervalTSC >>= 1;
5641
5642 /* value chosen on a 2GHz thinkpad running windows */
5643 u32UpdateIntervalTSCSlack = u32UpdateIntervalTSC >> 7;
5644 }
5645 else
5646 {
5647 u32UpdateIntervalTSC = (uint32_t)u64TSCDelta;
5648
5649 /* This value hasn't be checked yet.. waiting for OS/2 and 33Hz timers.. :-) */
5650 u32UpdateIntervalTSCSlack = u32UpdateIntervalTSC >> 6;
5651 }
5652 ASMAtomicWriteU32(&pGipCpu->u32UpdateIntervalTSC, u32UpdateIntervalTSC + u32UpdateIntervalTSCSlack);
5653
5654 /*
5655 * CpuHz.
5656 */
5657 u64CpuHz = ASMMult2xU32RetU64(u32UpdateIntervalTSC, pGip->u32UpdateHz);
5658 ASMAtomicWriteU64(&pGipCpu->u64CpuHz, u64CpuHz);
5659}
5660
5661
5662/**
5663 * Updates the GIP.
5664 *
5665 * @param pGip Pointer to the GIP.
5666 * @param u64NanoTS The current nanosecond timesamp.
5667 * @param u64TSC The current TSC timesamp.
5668 * @param idCpu The CPU ID.
5669 * @param iTick The current timer tick.
5670 */
5671static void supdrvGipUpdate(PSUPGLOBALINFOPAGE pGip, uint64_t u64NanoTS, uint64_t u64TSC, RTCPUID idCpu, uint64_t iTick)
5672{
5673 /*
5674 * Determine the relevant CPU data.
5675 */
5676 PSUPGIPCPU pGipCpu;
5677 if (pGip->u32Mode != SUPGIPMODE_ASYNC_TSC)
5678 pGipCpu = &pGip->aCPUs[0];
5679 else
5680 {
5681 unsigned iCpu = pGip->aiCpuFromApicId[ASMGetApicId()];
5682 if (RT_UNLIKELY(iCpu >= pGip->cCpus))
5683 return;
5684 pGipCpu = &pGip->aCPUs[iCpu];
5685 if (RT_UNLIKELY(pGipCpu->idCpu != idCpu))
5686 return;
5687 }
5688
5689 /*
5690 * Start update transaction.
5691 */
5692 if (!(ASMAtomicIncU32(&pGipCpu->u32TransactionId) & 1))
5693 {
5694 /* this can happen on win32 if we're taking to long and there are more CPUs around. shouldn't happen though. */
5695 AssertMsgFailed(("Invalid transaction id, %#x, not odd!\n", pGipCpu->u32TransactionId));
5696 ASMAtomicIncU32(&pGipCpu->u32TransactionId);
5697 pGipCpu->cErrors++;
5698 return;
5699 }
5700
5701 /*
5702 * Recalc the update frequency every 0x800th time.
5703 */
5704 if (!(pGipCpu->u32TransactionId & (GIP_UPDATEHZ_RECALC_FREQ * 2 - 2)))
5705 {
5706 if (pGip->u64NanoTSLastUpdateHz)
5707 {
5708#ifdef RT_ARCH_AMD64 /** @todo fix 64-bit div here to work on x86 linux. */
5709 uint64_t u64Delta = u64NanoTS - pGip->u64NanoTSLastUpdateHz;
5710 uint32_t u32UpdateHz = (uint32_t)((UINT64_C(1000000000) * GIP_UPDATEHZ_RECALC_FREQ) / u64Delta);
5711 if (u32UpdateHz <= 2000 && u32UpdateHz >= 30)
5712 {
5713 ASMAtomicWriteU32(&pGip->u32UpdateHz, u32UpdateHz);
5714 ASMAtomicWriteU32(&pGip->u32UpdateIntervalNS, 1000000000 / u32UpdateHz);
5715 }
5716#endif
5717 }
5718 ASMAtomicWriteU64(&pGip->u64NanoTSLastUpdateHz, u64NanoTS);
5719 }
5720
5721 /*
5722 * Update the data.
5723 */
5724 supdrvGipDoUpdateCpu(pGip, pGipCpu, u64NanoTS, u64TSC, iTick);
5725
5726 /*
5727 * Complete transaction.
5728 */
5729 ASMAtomicIncU32(&pGipCpu->u32TransactionId);
5730}
5731
5732
5733/**
5734 * Updates the per cpu GIP data for the calling cpu.
5735 *
5736 * @param pGip Pointer to the GIP.
5737 * @param u64NanoTS The current nanosecond timesamp.
5738 * @param u64TSC The current TSC timesamp.
5739 * @param idCpu The CPU ID.
5740 * @param idApic The APIC id for the CPU index.
5741 * @param iTick The current timer tick.
5742 */
5743static void supdrvGipUpdatePerCpu(PSUPGLOBALINFOPAGE pGip, uint64_t u64NanoTS, uint64_t u64TSC,
5744 RTCPUID idCpu, uint8_t idApic, uint64_t iTick)
5745{
5746 uint32_t iCpu;
5747
5748 /*
5749 * Avoid a potential race when a CPU online notification doesn't fire on
5750 * the onlined CPU but the tick creeps in before the event notification is
5751 * run.
5752 */
5753 if (RT_UNLIKELY(iTick == 1))
5754 {
5755 iCpu = supdrvGipCpuIndexFromCpuId(pGip, idCpu);
5756 if (pGip->aCPUs[iCpu].enmState == SUPGIPCPUSTATE_OFFLINE)
5757 supdrvGipMpEventOnline(pGip, idCpu);
5758 }
5759
5760 iCpu = pGip->aiCpuFromApicId[idApic];
5761 if (RT_LIKELY(iCpu < pGip->cCpus))
5762 {
5763 PSUPGIPCPU pGipCpu = &pGip->aCPUs[iCpu];
5764 if (pGipCpu->idCpu == idCpu)
5765 {
5766 /*
5767 * Start update transaction.
5768 */
5769 if (!(ASMAtomicIncU32(&pGipCpu->u32TransactionId) & 1))
5770 {
5771 AssertMsgFailed(("Invalid transaction id, %#x, not odd!\n", pGipCpu->u32TransactionId));
5772 ASMAtomicIncU32(&pGipCpu->u32TransactionId);
5773 pGipCpu->cErrors++;
5774 return;
5775 }
5776
5777 /*
5778 * Update the data.
5779 */
5780 supdrvGipDoUpdateCpu(pGip, pGipCpu, u64NanoTS, u64TSC, iTick);
5781
5782 /*
5783 * Complete transaction.
5784 */
5785 ASMAtomicIncU32(&pGipCpu->u32TransactionId);
5786 }
5787 }
5788}
5789
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette