VirtualBox

source: vbox/trunk/src/VBox/Runtime/r0drv/linux/alloc-r0drv-linux.c@ 7554

Last change on this file since 7554 was 7531, checked in by vboxsync, 17 years ago

vboxdrv: set_pages_attr is not available for 2.6.25 anymore

  • Property svn:eol-style set to native
  • Property svn:keywords set to Id
File size: 9.3 KB
Line 
1/* $Id: alloc-r0drv-linux.c 7531 2008-03-25 11:02:24Z vboxsync $ */
2/** @file
3 * innotek Portable Runtime - Memory Allocation, Ring-0 Driver, Linux.
4 */
5
6/*
7 * Copyright (C) 2006-2007 innotek GmbH
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27
28/*******************************************************************************
29* Header Files *
30*******************************************************************************/
31#include "the-linux-kernel.h"
32#include <iprt/mem.h>
33#include <iprt/assert.h>
34#include "r0drv/alloc-r0drv.h"
35
36#if defined(RT_ARCH_AMD64) || defined(__DOXYGEN__)
37/**
38 * We need memory in the module range (~2GB to ~0); this can only be obtained
39 * through APIs that are not exported (see module_alloc()).
40 *
41 * So, we'll have to create a quick and dirty heap here using BSS memory.
42 * Very annoying and it's going to restrict us!
43 */
44# define RTMEMALLOC_EXEC_HEAP
45#endif
46#ifdef RTMEMALLOC_EXEC_HEAP
47# include <iprt/heap.h>
48# include <iprt/spinlock.h>
49# include <iprt/err.h>
50#endif
51
52
53/*******************************************************************************
54* Global Variables *
55*******************************************************************************/
56#ifdef RTMEMALLOC_EXEC_HEAP
57/** The heap. */
58static RTHEAPSIMPLE g_HeapExec = NIL_RTHEAPSIMPLE;
59/** Spinlock protecting the heap. */
60static RTSPINLOCK g_HeapExecSpinlock = NIL_RTSPINLOCK;
61
62
63/**
64 * API for cleaning up the heap spinlock on IPRT termination.
65 * This is as RTMemExecDonate specific to AMD64 Linux/GNU.
66 */
67void rtR0MemExecCleanup(void)
68{
69 RTSpinlockDestroy(g_HeapExecSpinlock);
70 g_HeapExecSpinlock = NIL_RTSPINLOCK;
71}
72
73
74/**
75 * Donate read+write+execute memory to the exec heap.
76 *
77 * This API is specific to AMD64 and Linux/GNU. A kernel module that desires to
78 * use RTMemExecAlloc on AMD64 Linux/GNU will have to donate some statically
79 * allocated memory in the module if it wishes for GCC generated code to work.
80 * GCC can only generate modules that work in the address range ~2GB to ~0
81 * currently.
82 *
83 * The API only accept one single donation.
84 *
85 * @returns IPRT status code.
86 * @param pvMemory Pointer to the memory block.
87 * @param cb The size of the memory block.
88 */
89RTR0DECL(int) RTR0MemExecDonate(void *pvMemory, size_t cb)
90{
91 int rc;
92 AssertReturn(g_HeapExec == NIL_RTHEAPSIMPLE, VERR_WRONG_ORDER);
93
94 rc = RTSpinlockCreate(&g_HeapExecSpinlock);
95 if (RT_SUCCESS(rc))
96 {
97 rc = RTHeapSimpleInit(&g_HeapExec, pvMemory, cb);
98 if (RT_FAILURE(rc))
99 rtR0MemExecCleanup();
100 }
101 return rc;
102}
103#endif /* RTMEMALLOC_EXEC_HEAP */
104
105
106
107/**
108 * OS specific allocation function.
109 */
110PRTMEMHDR rtMemAlloc(size_t cb, uint32_t fFlags)
111{
112 /*
113 * Allocate.
114 */
115 PRTMEMHDR pHdr;
116 if (fFlags & RTMEMHDR_FLAG_EXEC)
117 {
118#if defined(RT_ARCH_AMD64)
119# ifdef RTMEMALLOC_EXEC_HEAP
120 if (g_HeapExec != NIL_RTHEAPSIMPLE)
121 {
122 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
123 RTSpinlockAcquireNoInts(g_HeapExecSpinlock, &SpinlockTmp);
124 pHdr = (PRTMEMHDR)RTHeapSimpleAlloc(g_HeapExec, cb + sizeof(*pHdr), 0);
125 RTSpinlockReleaseNoInts(g_HeapExecSpinlock, &SpinlockTmp);
126 fFlags |= RTMEMHDR_FLAG_EXEC_HEAP;
127 }
128 else
129# endif
130 pHdr = (PRTMEMHDR)__vmalloc(cb + sizeof(*pHdr), GFP_KERNEL | __GFP_HIGHMEM, PAGE_KERNEL_EXEC);
131
132#elif defined(PAGE_KERNEL_EXEC) && defined(CONFIG_X86_PAE)
133 pHdr = (PRTMEMHDR)__vmalloc(cb + sizeof(*pHdr), GFP_KERNEL | __GFP_HIGHMEM,
134 __pgprot(cpu_has_pge ? _PAGE_KERNEL_EXEC | _PAGE_GLOBAL : _PAGE_KERNEL_EXEC));
135#else
136 pHdr = (PRTMEMHDR)vmalloc(cb + sizeof(*pHdr));
137#endif
138 }
139 else
140 {
141 if (cb <= PAGE_SIZE)
142 {
143 fFlags |= RTMEMHDR_FLAG_KMALLOC;
144 pHdr = kmalloc(cb + sizeof(*pHdr), GFP_KERNEL);
145 }
146 else
147 pHdr = vmalloc(cb + sizeof(*pHdr));
148 }
149
150 /*
151 * Initialize.
152 */
153 if (pHdr)
154 {
155 pHdr->u32Magic = RTMEMHDR_MAGIC;
156 pHdr->fFlags = fFlags;
157 pHdr->cb = cb;
158 pHdr->cbReq = cb;
159 }
160 return pHdr;
161}
162
163
164/**
165 * OS specific free function.
166 */
167void rtMemFree(PRTMEMHDR pHdr)
168{
169 pHdr->u32Magic += 1;
170 if (pHdr->fFlags & RTMEMHDR_FLAG_KMALLOC)
171 kfree(pHdr);
172#ifdef RTMEMALLOC_EXEC_HEAP
173 else if (pHdr->fFlags & RTMEMHDR_FLAG_EXEC_HEAP)
174 {
175 RTSPINLOCKTMP SpinlockTmp = RTSPINLOCKTMP_INITIALIZER;
176 RTSpinlockAcquireNoInts(g_HeapExecSpinlock, &SpinlockTmp);
177 RTHeapSimpleFree(g_HeapExec, pHdr);
178 RTSpinlockReleaseNoInts(g_HeapExecSpinlock, &SpinlockTmp);
179 }
180#endif
181 else
182 vfree(pHdr);
183}
184
185
/**
 * Compute order. Some functions allocate 2^order pages.
 *
 * The result is the smallest order for which 2^order >= cPages, i.e.
 * ceil(log2(cPages)).  An input of 0 yields order 0.
 *
 * @returns order.
 * @param   cPages      Number of pages.
 */
static int CalcPowerOf2Order(unsigned long cPages)
{
    int           iOrder = 0;
    unsigned long cTmp;

    /* Position of the highest set bit, i.e. floor(log2(cPages)). */
    for (cTmp = cPages >> 1; cTmp != 0; cTmp >>= 1)
        ++iOrder;

    /*
     * Round up when any bit below the highest one is set.  The mask is built
     * from an unsigned long constant: shifting a plain int 1 is undefined
     * once iOrder reaches 31, which a 64-bit page count can do.
     */
    if (cPages & ~(1UL << iOrder))
        ++iOrder;

    return iOrder;
}
204
205
206/**
207 * Allocates physical contiguous memory (below 4GB).
208 * The allocation is page aligned and the content is undefined.
209 *
210 * @returns Pointer to the memory block. This is page aligned.
211 * @param pPhys Where to store the physical address.
212 * @param cb The allocation size in bytes. This is always
213 * rounded up to PAGE_SIZE.
214 */
215RTR0DECL(void *) RTMemContAlloc(PRTCCPHYS pPhys, size_t cb)
216{
217 int cOrder;
218 unsigned cPages;
219 struct page *paPages;
220
221 /*
222 * validate input.
223 */
224 Assert(VALID_PTR(pPhys));
225 Assert(cb > 0);
226
227 /*
228 * Allocate page pointer array.
229 */
230 cb = RT_ALIGN_Z(cb, PAGE_SIZE);
231 cPages = cb >> PAGE_SHIFT;
232 cOrder = CalcPowerOf2Order(cPages);
233#ifdef RT_ARCH_AMD64 /** @todo check out if there is a correct way of getting memory below 4GB (physically). */
234 paPages = alloc_pages(GFP_DMA, cOrder);
235#else
236 paPages = alloc_pages(GFP_USER, cOrder);
237#endif
238 if (paPages)
239 {
240 /*
241 * Reserve the pages and mark them executable.
242 */
243 unsigned iPage;
244 for (iPage = 0; iPage < cPages; iPage++)
245 {
246 Assert(!PageHighMem(&paPages[iPage]));
247 if (iPage + 1 < cPages)
248 {
249 AssertMsg( (uintptr_t)phys_to_virt(page_to_phys(&paPages[iPage])) + PAGE_SIZE
250 == (uintptr_t)phys_to_virt(page_to_phys(&paPages[iPage + 1]))
251 && page_to_phys(&paPages[iPage]) + PAGE_SIZE
252 == page_to_phys(&paPages[iPage + 1]),
253 ("iPage=%i cPages=%u [0]=%#llx,%p [1]=%#llx,%p\n", iPage, cPages,
254 (long long)page_to_phys(&paPages[iPage]), phys_to_virt(page_to_phys(&paPages[iPage])),
255 (long long)page_to_phys(&paPages[iPage + 1]), phys_to_virt(page_to_phys(&paPages[iPage + 1])) ));
256 }
257
258 SetPageReserved(&paPages[iPage]);
259#if LINUX_VERSION_CODE > KERNEL_VERSION(2, 4, 20) /** @todo find the exact kernel where change_page_attr was introduced. */
260 MY_SET_PAGES_EXEC(&paPages[iPage], 1);
261#endif
262 }
263 *pPhys = page_to_phys(paPages);
264 return phys_to_virt(page_to_phys(paPages));
265 }
266
267 return NULL;
268}
269
270
271/**
272 * Frees memory allocated ysing RTMemContAlloc().
273 *
274 * @param pv Pointer to return from RTMemContAlloc().
275 * @param cb The cb parameter passed to RTMemContAlloc().
276 */
277RTR0DECL(void) RTMemContFree(void *pv, size_t cb)
278{
279 if (pv)
280 {
281 int cOrder;
282 unsigned cPages;
283 unsigned iPage;
284 struct page *paPages;
285
286 /* validate */
287 AssertMsg(!((uintptr_t)pv & PAGE_OFFSET_MASK), ("pv=%p\n", pv));
288 Assert(cb > 0);
289
290 /* calc order and get pages */
291 cb = RT_ALIGN_Z(cb, PAGE_SIZE);
292 cPages = cb >> PAGE_SHIFT;
293 cOrder = CalcPowerOf2Order(cPages);
294 paPages = virt_to_page(pv);
295
296 /*
297 * Restore page attributes freeing the pages.
298 */
299 for (iPage = 0; iPage < cPages; iPage++)
300 {
301 ClearPageReserved(&paPages[iPage]);
302#if LINUX_VERSION_CODE > KERNEL_VERSION(2, 4, 20) /** @todo find the exact kernel where change_page_attr was introduced. */
303 MY_SET_PAGES_NOEXEC(&paPages[iPage], 1);
304#endif
305 }
306 __free_pages(paPages, cOrder);
307 }
308}
309
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette