VirtualBox

source: vbox/trunk/src/VBox/HostDrivers/VBoxPci/linux/VBoxPci-linux.c@ 70562

Last change on this file since 70562 was 69744, checked in by vboxsync, 7 years ago

VBoxPci-linux.c: use kernel_write instead of vfs_write as of Linux 4.14.
bugref:9057: VBoxPci: vfs_write() no longer exported by Linux kernel

As of Linux 4.14 vfs_write() is no longer exported for use by modules. Other
users have been converted to use kernel_write(), which is a wrapper around
vfs_write() with some added boiler-plate calls to make it safe to use on
kernel addresses too. It seems to me like we should probably already have
been using kernel_write(), but I prefer to leave that decision to someone who
knows the code, so this change switches over for 4.14 and later.

Fixes: ticketref:17267:comment:6

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 33.8 KB
Line 
1/* $Id: VBoxPci-linux.c 69744 2017-11-18 20:10:33Z vboxsync $ */
2/** @file
3 * VBoxPci - PCI Driver (Host), Linux Specific Code.
4 */
5
6/*
7 * Copyright (C) 2011-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27
28/*********************************************************************************************************************************
29* Header Files *
30*********************************************************************************************************************************/
31#include "the-linux-kernel.h"
32#include "version-generated.h"
33#include "revision-generated.h"
34#include "product-generated.h"
35
36#define LOG_GROUP LOG_GROUP_DEV_PCI_RAW
37#include <VBox/log.h>
38#include <VBox/err.h>
39#include <iprt/process.h>
40#include <iprt/initterm.h>
41#include <iprt/string.h>
42#include <iprt/mem.h>
43
44#include "VBoxPciInternal.h"
45
46#ifdef VBOX_WITH_IOMMU
47# include <linux/dmar.h>
48# include <linux/intel-iommu.h>
49# include <linux/pci.h>
50# if LINUX_VERSION_CODE < KERNEL_VERSION(3, 1, 0) && \
51 (LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 41) || LINUX_VERSION_CODE >= KERNEL_VERSION(3, 0, 0))
52# include <asm/amd_iommu.h>
53# else
54# include <linux/amd-iommu.h>
55# endif
56# if LINUX_VERSION_CODE < KERNEL_VERSION(3, 2, 0)
57# define IOMMU_PRESENT() iommu_found()
58# define IOMMU_DOMAIN_ALLOC() iommu_domain_alloc()
59# else
60# define IOMMU_PRESENT() iommu_present(&pci_bus_type)
61# define IOMMU_DOMAIN_ALLOC() iommu_domain_alloc(&pci_bus_type)
62# endif
63#endif /* VBOX_WITH_IOMMU */
64
65
66/*********************************************************************************************************************************
67* Internal Functions *
68*********************************************************************************************************************************/
69static int VBoxPciLinuxInit(void);
70static void VBoxPciLinuxUnload(void);
71
72
73/*********************************************************************************************************************************
74* Global Variables *
75*********************************************************************************************************************************/
76static VBOXRAWPCIGLOBALS g_VBoxPciGlobals;
77
78module_init(VBoxPciLinuxInit);
79module_exit(VBoxPciLinuxUnload);
80
81MODULE_AUTHOR(VBOX_VENDOR);
82MODULE_DESCRIPTION(VBOX_PRODUCT " PCI access Driver");
83MODULE_LICENSE("GPL");
84#ifdef MODULE_VERSION
85MODULE_VERSION(VBOX_VERSION_STRING " r" RT_XSTR(VBOX_SVN_REV));
86#endif
87
88
89#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 20)
90# define PCI_DEV_GET(v,d,p) pci_get_device(v,d,p)
91# define PCI_DEV_PUT(x) pci_dev_put(x)
92# define PCI_DEV_GET_SLOT(bus, devfn) pci_get_bus_and_slot(bus, devfn)
93#else
94# define PCI_DEV_GET(v,d,p) pci_find_device(v,d,p)
95# define PCI_DEV_PUT(x) do { } while (0)
96# define PCI_DEV_GET_SLOT(bus, devfn) pci_find_slot(bus, devfn)
97#endif
98
99/**
100 * Name of module used to attach to the host PCI device, when
101 * PCI device passthrough is used.
102 */
103#define PCI_STUB_MODULE "pci-stub"
104/* For some reasons my kernel names module for find_module() this way,
105 * while device name seems to be above one.
106 */
107#define PCI_STUB_MODULE_NAME "pci_stub"
108
109/**
110 * Our driver name.
111 */
112#define DRIVER_NAME "vboxpci"
113
114/*
115 * Currently we keep the device bound to pci stub driver, so
116 * dev_printk() &co would report that instead of our name. They also
117 * expect non-NULL dev pointer in older kernels.
118 */
119#define vbpci_printk(level, pdev, format, arg...) \
120 printk(level DRIVER_NAME "%s%s: " format, \
121 pdev ? " " : "", pdev ? pci_name(pdev) : "", \
122 ## arg)
123
124
125/**
126 * Initialize module.
127 *
128 * @returns appropriate status code.
129 */
130static int __init VBoxPciLinuxInit(void)
131{
132 int rc;
133 /*
134 * Initialize IPRT.
135 */
136 rc = RTR0Init(0);
137
138 if (RT_FAILURE(rc))
139 goto error;
140
141
142 LogRel(("VBoxPciLinuxInit\n"));
143
144 RT_ZERO(g_VBoxPciGlobals);
145
146 rc = vboxPciInit(&g_VBoxPciGlobals);
147 if (RT_FAILURE(rc))
148 {
149 LogRel(("cannot do VBoxPciInit: %Rc\n", rc));
150 goto error;
151 }
152
153#if defined(CONFIG_PCI_STUB)
154 /* nothing to do, pci_stub module part of the kernel */
155 g_VBoxPciGlobals.fPciStubModuleAvail = true;
156
157#elif defined(CONFIG_PCI_STUB_MODULE)
158 if (request_module(PCI_STUB_MODULE) == 0)
159 {
160# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 30)
161 /* find_module() is static before Linux 2.6.30 */
162 mutex_lock(&module_mutex);
163 g_VBoxPciGlobals.pciStubModule = find_module(PCI_STUB_MODULE_NAME);
164 mutex_unlock(&module_mutex);
165 if (g_VBoxPciGlobals.pciStubModule)
166 {
167 if (try_module_get(g_VBoxPciGlobals.pciStubModule))
168 g_VBoxPciGlobals.fPciStubModuleAvail = true;
169 }
170 else
171 printk(KERN_INFO "vboxpci: find_module %s failed\n", PCI_STUB_MODULE);
172# endif
173 }
174 else
175 printk(KERN_INFO "vboxpci: cannot load %s\n", PCI_STUB_MODULE);
176
177#else
178 printk(KERN_INFO "vboxpci: %s module not available, cannot detach PCI devices\n",
179 PCI_STUB_MODULE);
180#endif
181
182#ifdef VBOX_WITH_IOMMU
183 if (IOMMU_PRESENT())
184 printk(KERN_INFO "vboxpci: IOMMU found\n");
185 else
186 printk(KERN_INFO "vboxpci: IOMMU not found (not registered)\n");
187#else
188 printk(KERN_INFO "vboxpci: IOMMU not found (not compiled)\n");
189#endif
190
191 return 0;
192
193 error:
194 return -RTErrConvertToErrno(rc);
195}
196
197/**
198 * Unload the module.
199 */
200static void __exit VBoxPciLinuxUnload(void)
201{
202 LogRel(("VBoxPciLinuxLinuxUnload\n"));
203
204 /*
205 * Undo the work done during start (in reverse order).
206 */
207 vboxPciShutdown(&g_VBoxPciGlobals);
208
209 RTR0Term();
210
211 if (g_VBoxPciGlobals.pciStubModule)
212 {
213 module_put(g_VBoxPciGlobals.pciStubModule);
214 g_VBoxPciGlobals.pciStubModule = NULL;
215 }
216
217 Log(("VBoxPciLinuxUnload - done\n"));
218}
219
220static int vboxPciLinuxDevRegisterWithIommu(PVBOXRAWPCIINS pIns)
221{
222#ifdef VBOX_WITH_IOMMU
223 int rc = VINF_SUCCESS;
224 struct pci_dev *pPciDev = pIns->pPciDev;
225 PVBOXRAWPCIDRVVM pData = VBOX_DRV_VMDATA(pIns);
226 IPRT_LINUX_SAVE_EFL_AC();
227
228 if (RT_LIKELY(pData))
229 {
230 if (RT_LIKELY(pData->pIommuDomain))
231 {
232 /** @todo KVM checks IOMMU_CAP_CACHE_COHERENCY and sets
233 * flag IOMMU_CACHE later used when mapping physical
234 * addresses, which could improve performance.
235 */
236 int rcLnx = iommu_attach_device(pData->pIommuDomain, &pPciDev->dev);
237 if (!rcLnx)
238 {
239 vbpci_printk(KERN_DEBUG, pPciDev, "attached to IOMMU\n");
240 pIns->fIommuUsed = true;
241 rc = VINF_SUCCESS;
242 }
243 else
244 {
245 vbpci_printk(KERN_DEBUG, pPciDev, "failed to attach to IOMMU, error %d\n", rcLnx);
246 rc = VERR_INTERNAL_ERROR;
247 }
248 }
249 else
250 {
251 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "cannot attach to IOMMU, no domain\n");
252 rc = VERR_NOT_FOUND;
253 }
254 }
255 else
256 {
257 vbpci_printk(KERN_DEBUG, pPciDev, "cannot attach to IOMMU, no VM data\n");
258 rc = VERR_INVALID_PARAMETER;
259 }
260
261 IPRT_LINUX_RESTORE_EFL_AC();
262 return rc;
263#else
264 return VERR_NOT_SUPPORTED;
265#endif
266}
267
268static int vboxPciLinuxDevUnregisterWithIommu(PVBOXRAWPCIINS pIns)
269{
270#ifdef VBOX_WITH_IOMMU
271 int rc = VINF_SUCCESS;
272 struct pci_dev *pPciDev = pIns->pPciDev;
273 PVBOXRAWPCIDRVVM pData = VBOX_DRV_VMDATA(pIns);
274 IPRT_LINUX_SAVE_EFL_AC();
275
276 if (RT_LIKELY(pData))
277 {
278 if (RT_LIKELY(pData->pIommuDomain))
279 {
280 if (pIns->fIommuUsed)
281 {
282 iommu_detach_device(pData->pIommuDomain, &pIns->pPciDev->dev);
283 vbpci_printk(KERN_DEBUG, pPciDev, "detached from IOMMU\n");
284 pIns->fIommuUsed = false;
285 }
286 }
287 else
288 {
289 vbpci_printk(KERN_DEBUG, pPciDev,
290 "cannot detach from IOMMU, no domain\n");
291 rc = VERR_NOT_FOUND;
292 }
293 }
294 else
295 {
296 vbpci_printk(KERN_DEBUG, pPciDev,
297 "cannot detach from IOMMU, no VM data\n");
298 rc = VERR_INVALID_PARAMETER;
299 }
300
301 IPRT_LINUX_RESTORE_EFL_AC();
302 return rc;
303#else
304 return VERR_NOT_SUPPORTED;
305#endif
306}
307
308static int vboxPciLinuxDevReset(PVBOXRAWPCIINS pIns)
309{
310 int rc = VINF_SUCCESS;
311 IPRT_LINUX_SAVE_EFL_AC();
312
313 if (RT_LIKELY(pIns->pPciDev))
314 {
315#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 28)
316 if (pci_reset_function(pIns->pPciDev))
317 {
318 vbpci_printk(KERN_DEBUG, pIns->pPciDev,
319 "pci_reset_function() failed\n");
320 rc = VERR_INTERNAL_ERROR;
321 }
322#else
323 rc = VERR_NOT_SUPPORTED;
324#endif
325 }
326 else
327 rc = VERR_INVALID_PARAMETER;
328
329 IPRT_LINUX_RESTORE_EFL_AC();
330 return rc;
331}
332
333static struct file* vboxPciFileOpen(const char* path, int flags)
334{
335 struct file* filp = NULL;
336 int err = 0;
337
338 filp = filp_open(path, flags, 0);
339
340 if (IS_ERR(filp))
341 {
342 err = PTR_ERR(filp);
343 printk(KERN_DEBUG "vboxPciFileOpen: error %d\n", err);
344 return NULL;
345 }
346
347 if (!filp->f_op || !filp->f_op->write)
348 {
349 printk(KERN_DEBUG "Not writable FS\n");
350 filp_close(filp, NULL);
351 return NULL;
352 }
353
354 return filp;
355}
356
357static void vboxPciFileClose(struct file* file)
358{
359 filp_close(file, NULL);
360}
361
362static int vboxPciFileWrite(struct file* file, unsigned long long offset, unsigned char* data, unsigned int size)
363{
364 int ret;
365 mm_segment_t fs_save;
366
367 fs_save = get_fs();
368 set_fs(get_ds());
369#if LINUX_VERSION_CODE >= KERNEL_VERSION(4, 14, 0)
370 ret = kernel_write(file, data, size, &offset);
371#else
372 ret = vfs_write(file, data, size, &offset);
373#endif
374 set_fs(fs_save);
375 if (ret < 0)
376 printk(KERN_DEBUG "vboxPciFileWrite: error %d\n", ret);
377
378 return ret;
379}
380
381static int vboxPciLinuxDevDetachHostDriver(PVBOXRAWPCIINS pIns)
382{
383 struct pci_dev *pPciDev = NULL;
384 uint8_t uBus = (pIns->HostPciAddress) >> 8;
385 uint8_t uDevFn = (pIns->HostPciAddress) & 0xff;
386 const char* currentDriver;
387 uint16_t uVendor, uDevice;
388 bool fDetach = 0;
389
390 if (!g_VBoxPciGlobals.fPciStubModuleAvail)
391 {
392 printk(KERN_INFO "vboxpci: stub module %s not detected: cannot detach\n",
393 PCI_STUB_MODULE);
394 return VERR_ACCESS_DENIED;
395 }
396
397 pPciDev = PCI_DEV_GET_SLOT(uBus, uDevFn);
398
399 if (!pPciDev)
400 {
401 printk(KERN_INFO "vboxpci: device at %02x:%02x.%d not found\n",
402 uBus, uDevFn>>3, uDevFn&7);
403 return VERR_NOT_FOUND;
404 }
405
406 uVendor = pPciDev->vendor;
407 uDevice = pPciDev->device;
408
409 currentDriver = pPciDev->driver ? pPciDev->driver->name : NULL;
410
411 printk(KERN_DEBUG "vboxpci: detected device: %04x:%04x at %02x:%02x.%d, driver %s\n",
412 uVendor, uDevice, uBus, uDevFn>>3, uDevFn&7,
413 currentDriver ? currentDriver : "<none>");
414
415 fDetach = (currentDriver == NULL || (strcmp(currentDriver, PCI_STUB_MODULE) != 0));
416
417 /* Init previous driver data. */
418 pIns->szPrevDriver[0] = '\0';
419
420 if (fDetach && currentDriver)
421 {
422 /* Dangerous: if device name for some reasons contains slashes - arbitrary file could be written to. */
423 if (strchr(currentDriver, '/') != 0)
424 {
425 printk(KERN_DEBUG "vboxpci: ERROR: %s contains invalid symbols\n", currentDriver);
426 return VERR_ACCESS_DENIED;
427 }
428 /** @todo RTStrCopy not exported. */
429 strncpy(pIns->szPrevDriver, currentDriver, sizeof(pIns->szPrevDriver));
430 }
431
432 PCI_DEV_PUT(pPciDev);
433 pPciDev = NULL;
434
435 if (fDetach)
436 {
437 char* szCmdBuf;
438 char* szFileBuf;
439 struct file* pFile;
440 int iCmdLen;
441 const int cMaxBuf = 128;
442 const struct cred *pOldCreds;
443 struct cred *pNewCreds;
444
445 /*
446 * Now perform kernel analog of:
447 *
448 * echo -n "10de 040a" > /sys/bus/pci/drivers/pci-stub/new_id
449 * echo -n 0000:03:00.0 > /sys/bus/pci/drivers/nvidia/unbind
450 * echo -n 0000:03:00.0 > /sys/bus/pci/drivers/pci-stub/bind
451 *
452 * We do this way, as this interface is presumingly more stable than
453 * in-kernel ones.
454 */
455 szCmdBuf = kmalloc(cMaxBuf, GFP_KERNEL);
456 szFileBuf = kmalloc(cMaxBuf, GFP_KERNEL);
457 if (!szCmdBuf || !szFileBuf)
458 goto done;
459
460 /* Somewhat ugly hack - override current credentials */
461#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 29)
462 pNewCreds = prepare_creds();
463 if (!pNewCreds)
464 goto done;
465
466# if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 5, 0)
467 pNewCreds->fsuid = GLOBAL_ROOT_UID;
468# else
469 pNewCreds->fsuid = 0;
470# endif
471 pOldCreds = override_creds(pNewCreds);
472#endif
473
474 RTStrPrintf(szFileBuf, cMaxBuf,
475 "/sys/bus/pci/drivers/%s/new_id",
476 PCI_STUB_MODULE);
477 pFile = vboxPciFileOpen(szFileBuf, O_WRONLY);
478 if (pFile)
479 {
480 iCmdLen = RTStrPrintf(szCmdBuf, cMaxBuf,
481 "%04x %04x",
482 uVendor, uDevice);
483 /* Don't write trailing \0 */
484 vboxPciFileWrite(pFile, 0, szCmdBuf, iCmdLen);
485 vboxPciFileClose(pFile);
486 }
487 else
488 printk(KERN_DEBUG "vboxpci: cannot open %s\n", szFileBuf);
489
490 iCmdLen = RTStrPrintf(szCmdBuf, cMaxBuf,
491 "0000:%02x:%02x.%d",
492 uBus, uDevFn>>3, uDevFn&7);
493
494 /* Unbind if bound to smth */
495 if (pIns->szPrevDriver[0])
496 {
497 RTStrPrintf(szFileBuf, cMaxBuf,
498 "/sys/bus/pci/drivers/%s/unbind",
499 pIns->szPrevDriver);
500 pFile = vboxPciFileOpen(szFileBuf, O_WRONLY);
501 if (pFile)
502 {
503
504 /* Don't write trailing \0 */
505 vboxPciFileWrite(pFile, 0, szCmdBuf, iCmdLen);
506 vboxPciFileClose(pFile);
507 }
508 else
509 printk(KERN_DEBUG "vboxpci: cannot open %s\n", szFileBuf);
510 }
511
512 RTStrPrintf(szFileBuf, cMaxBuf,
513 "/sys/bus/pci/drivers/%s/bind",
514 PCI_STUB_MODULE);
515 pFile = vboxPciFileOpen(szFileBuf, O_WRONLY);
516 if (pFile)
517 {
518 /* Don't write trailing \0 */
519 vboxPciFileWrite(pFile, 0, szCmdBuf, iCmdLen);
520 vboxPciFileClose(pFile);
521 }
522 else
523 printk(KERN_DEBUG "vboxpci: cannot open %s\n", szFileBuf);
524
525#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 29)
526 revert_creds(pOldCreds);
527 put_cred(pNewCreds);
528#endif
529
530 done:
531 kfree(szCmdBuf);
532 kfree(szFileBuf);
533 }
534
535 return 0;
536}
537
538static int vboxPciLinuxDevReattachHostDriver(PVBOXRAWPCIINS pIns)
539{
540 struct pci_dev *pPciDev = pIns->pPciDev;
541
542 if (!pPciDev)
543 return VINF_SUCCESS;
544
545 if (pIns->szPrevDriver[0])
546 {
547 char* szCmdBuf;
548 char* szFileBuf;
549 struct file* pFile;
550 int iCmdLen;
551 const int cMaxBuf = 128;
552 const struct cred *pOldCreds;
553 struct cred *pNewCreds;
554 uint8_t uBus = (pIns->HostPciAddress) >> 8;
555 uint8_t uDevFn = (pIns->HostPciAddress) & 0xff;
556
557 vbpci_printk(KERN_DEBUG, pPciDev,
558 "reattaching old host driver %s\n", pIns->szPrevDriver);
559 /*
560 * Now perform kernel analog of:
561 *
562 * echo -n 0000:03:00.0 > /sys/bus/pci/drivers/pci-stub/unbind
563 * echo -n 0000:03:00.0 > /sys/bus/pci/drivers/nvidia/bind
564 */
565 szCmdBuf = kmalloc(cMaxBuf, GFP_KERNEL);
566 szFileBuf = kmalloc(cMaxBuf, GFP_KERNEL);
567
568 if (!szCmdBuf || !szFileBuf)
569 goto done;
570
571 iCmdLen = RTStrPrintf(szCmdBuf, cMaxBuf,
572 "0000:%02x:%02x.%d",
573 uBus, uDevFn>>3, uDevFn&7);
574
575 /* Somewhat ugly hack - override current credentials */
576#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 29)
577 pNewCreds = prepare_creds();
578 if (!pNewCreds)
579 goto done;
580
581# if LINUX_VERSION_CODE >= KERNEL_VERSION(3, 5, 0)
582 pNewCreds->fsuid = GLOBAL_ROOT_UID;
583# else
584 pNewCreds->fsuid = 0;
585# endif
586 pOldCreds = override_creds(pNewCreds);
587#endif
588 RTStrPrintf(szFileBuf, cMaxBuf,
589 "/sys/bus/pci/drivers/%s/unbind",
590 PCI_STUB_MODULE);
591 pFile = vboxPciFileOpen(szFileBuf, O_WRONLY);
592 if (pFile)
593 {
594
595 /* Don't write trailing \0 */
596 vboxPciFileWrite(pFile, 0, szCmdBuf, iCmdLen);
597 vboxPciFileClose(pFile);
598 }
599 else
600 printk(KERN_DEBUG "vboxpci: cannot open %s\n", szFileBuf);
601
602 RTStrPrintf(szFileBuf, cMaxBuf,
603 "/sys/bus/pci/drivers/%s/bind",
604 pIns->szPrevDriver);
605 pFile = vboxPciFileOpen(szFileBuf, O_WRONLY);
606 if (pFile)
607 {
608
609 /* Don't write trailing \0 */
610 vboxPciFileWrite(pFile, 0, szCmdBuf, iCmdLen);
611 vboxPciFileClose(pFile);
612 pIns->szPrevDriver[0] = '\0';
613 }
614 else
615 printk(KERN_DEBUG "vboxpci: cannot open %s\n", szFileBuf);
616
617#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 29)
618 revert_creds(pOldCreds);
619 put_cred(pNewCreds);
620#endif
621
622 done:
623 kfree(szCmdBuf);
624 kfree(szFileBuf);
625 }
626
627 return VINF_SUCCESS;
628}
629
630DECLHIDDEN(int) vboxPciOsDevInit(PVBOXRAWPCIINS pIns, uint32_t fFlags)
631{
632 struct pci_dev *pPciDev = NULL;
633 int rc = VINF_SUCCESS;
634 IPRT_LINUX_SAVE_EFL_AC();
635
636 if (fFlags & PCIRAWDRIVERRFLAG_DETACH_HOST_DRIVER)
637 {
638 rc = vboxPciLinuxDevDetachHostDriver(pIns);
639 if (RT_FAILURE(rc))
640 {
641 printk(KERN_DEBUG "Cannot detach host driver for device %x: %d\n",
642 pIns->HostPciAddress, rc);
643 }
644 }
645
646 if (RT_SUCCESS(rc))
647 {
648 pPciDev = PCI_DEV_GET_SLOT((pIns->HostPciAddress) >> 8,
649 (pIns->HostPciAddress) & 0xff);
650
651 if (RT_LIKELY(pPciDev))
652 {
653 int rcLnx = pci_enable_device(pPciDev);
654
655 if (!rcLnx)
656 {
657 pIns->pPciDev = pPciDev;
658 vbpci_printk(KERN_DEBUG, pPciDev, "%s\n", __func__);
659
660#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 1)
661 if (pci_enable_msi(pPciDev) == 0)
662 pIns->fMsiUsed = true;
663#endif
664
665 /** @todo
666 * pci_enable_msix(pPciDev, entries, nvec)
667 *
668 * In fact, if device uses interrupts, and cannot be forced to use MSI or MSI-X
669 * we have to refuse using it, as we cannot work with shared PCI interrupts (unless we're lucky
670 * to grab unshared PCI interrupt).
671 */
672 }
673 else
674 rc = RTErrConvertFromErrno(RT_ABS(rcLnx));
675 }
676 else
677 rc = VERR_NOT_FOUND;
678 }
679
680 IPRT_LINUX_RESTORE_EFL_AC();
681 return rc;
682}
683
684DECLHIDDEN(int) vboxPciOsDevDeinit(PVBOXRAWPCIINS pIns, uint32_t fFlags)
685{
686 int rc = VINF_SUCCESS;
687 struct pci_dev *pPciDev = pIns->pPciDev;
688 IPRT_LINUX_SAVE_EFL_AC();
689
690 vbpci_printk(KERN_DEBUG, pPciDev, "%s\n", __func__);
691
692 if (RT_LIKELY(pPciDev))
693 {
694 int iRegion;
695 for (iRegion = 0; iRegion < 7; ++iRegion)
696 {
697 if (pIns->aRegionR0Mapping[iRegion])
698 {
699 iounmap(pIns->aRegionR0Mapping[iRegion]);
700 pIns->aRegionR0Mapping[iRegion] = 0;
701 pci_release_region(pPciDev, iRegion);
702 }
703 }
704
705 vboxPciLinuxDevUnregisterWithIommu(pIns);
706
707#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 1)
708 if (pIns->fMsiUsed)
709 pci_disable_msi(pPciDev);
710#endif
711 // pci_disable_msix(pPciDev);
712 pci_disable_device(pPciDev);
713 vboxPciLinuxDevReattachHostDriver(pIns);
714
715 PCI_DEV_PUT(pPciDev);
716 pIns->pPciDev = NULL;
717 }
718 else
719 rc = VERR_INVALID_PARAMETER;
720
721 IPRT_LINUX_RESTORE_EFL_AC();
722 return rc;
723}
724
725DECLHIDDEN(int) vboxPciOsDevDestroy(PVBOXRAWPCIINS pIns)
726{
727 return VINF_SUCCESS;
728}
729
730DECLHIDDEN(int) vboxPciOsDevGetRegionInfo(PVBOXRAWPCIINS pIns,
731 int32_t iRegion,
732 RTHCPHYS *pRegionStart,
733 uint64_t *pu64RegionSize,
734 bool *pfPresent,
735 uint32_t *pfFlags)
736{
737 int rc = VINF_SUCCESS;
738 struct pci_dev *pPciDev = pIns->pPciDev;
739 IPRT_LINUX_SAVE_EFL_AC();
740
741 if (RT_LIKELY(pPciDev))
742 {
743 int fFlags = pci_resource_flags(pPciDev, iRegion);
744
745 if ( ((fFlags & (IORESOURCE_MEM | IORESOURCE_IO)) == 0)
746 || ((fFlags & IORESOURCE_DISABLED) != 0))
747 {
748 *pfPresent = false;
749 rc = VERR_INVALID_PARAMETER;
750 }
751 else
752 {
753 uint32_t fResFlags = 0;
754 *pfPresent = true;
755
756 if (fFlags & IORESOURCE_MEM)
757 fResFlags |= PCIRAW_ADDRESS_SPACE_MEM;
758
759 if (fFlags & IORESOURCE_IO)
760 fResFlags |= PCIRAW_ADDRESS_SPACE_IO;
761
762#ifdef IORESOURCE_MEM_64
763 if (fFlags & IORESOURCE_MEM_64)
764 fResFlags |= PCIRAW_ADDRESS_SPACE_BAR64;
765#endif
766
767 if (fFlags & IORESOURCE_PREFETCH)
768 fResFlags |= PCIRAW_ADDRESS_SPACE_MEM_PREFETCH;
769
770 *pfFlags = fResFlags;
771 *pRegionStart = pci_resource_start(pPciDev, iRegion);
772 *pu64RegionSize = pci_resource_len (pPciDev, iRegion);
773
774 vbpci_printk(KERN_DEBUG, pPciDev,
775 "region %d: %s %llx+%lld\n",
776 iRegion, (fFlags & IORESOURCE_MEM) ? "mmio" : "pio",
777 *pRegionStart, *pu64RegionSize);
778 }
779 }
780 else
781 {
782 *pfPresent = false;
783 rc = VERR_INVALID_PARAMETER;
784 }
785
786 IPRT_LINUX_RESTORE_EFL_AC();
787 return rc;
788}
789
790DECLHIDDEN(int) vboxPciOsDevMapRegion(PVBOXRAWPCIINS pIns,
791 int32_t iRegion,
792 RTHCPHYS RegionStart,
793 uint64_t u64RegionSize,
794 uint32_t fFlags,
795 RTR0PTR *pRegionBase)
796{
797 int rc = VINF_SUCCESS;
798 struct pci_dev *pPciDev = pIns->pPciDev;
799 IPRT_LINUX_SAVE_EFL_AC();
800
801 if (!pPciDev || iRegion < 0 || iRegion > 0)
802 {
803 if (pPciDev)
804 vbpci_printk(KERN_DEBUG, pPciDev, "invalid region %d\n", iRegion);
805
806 IPRT_LINUX_RESTORE_EFL_AC();
807 return VERR_INVALID_PARAMETER;
808 }
809
810 vbpci_printk(KERN_DEBUG, pPciDev, "reg=%d start=%llx size=%lld\n",
811 iRegion, RegionStart, u64RegionSize);
812
813 if ( (pci_resource_flags(pPciDev, iRegion) & IORESOURCE_IO)
814 || RegionStart != pci_resource_start(pPciDev, iRegion)
815 || u64RegionSize != pci_resource_len(pPciDev, iRegion))
816 {
817 IPRT_LINUX_RESTORE_EFL_AC();
818 return VERR_INVALID_PARAMETER;
819 }
820
821 /*
822 * XXX: Current code never calls unmap. To avoid leaking mappings
823 * only request and map resources once.
824 */
825 if (!pIns->aRegionR0Mapping[iRegion])
826 {
827 int rcLnx;
828 *pRegionBase = pIns->aRegionR0Mapping[iRegion];
829
830 rcLnx = pci_request_region(pPciDev, iRegion, "vboxpci");
831 if (!rcLnx)
832 {
833 /* For now no caching, try to optimize later. */
834 RTR0PTR R0PtrMapping = ioremap_nocache(pci_resource_start(pPciDev, iRegion),
835 pci_resource_len(pPciDev, iRegion));
836
837 if (R0PtrMapping != NIL_RTR0PTR)
838 pIns->aRegionR0Mapping[iRegion] = R0PtrMapping;
839 else
840 {
841 vbpci_printk(KERN_DEBUG, pPciDev, "ioremap_nocache() failed\n");
842 pci_release_region(pPciDev, iRegion);
843 rc = VERR_MAP_FAILED;
844 }
845 }
846 else
847 rc = VERR_RESOURCE_BUSY;
848 }
849
850 if (RT_SUCCESS(rc))
851 *pRegionBase = pIns->aRegionR0Mapping[iRegion];
852
853 IPRT_LINUX_RESTORE_EFL_AC();
854 return rc;
855}
856
857DECLHIDDEN(int) vboxPciOsDevUnmapRegion(PVBOXRAWPCIINS pIns,
858 int32_t iRegion,
859 RTHCPHYS RegionStart,
860 uint64_t u64RegionSize,
861 RTR0PTR RegionBase)
862{
863 /* XXX: Current code never calls unmap. */
864 return VERR_NOT_IMPLEMENTED;
865}
866
867DECLHIDDEN(int) vboxPciOsDevPciCfgWrite(PVBOXRAWPCIINS pIns, uint32_t Register, PCIRAWMEMLOC *pValue)
868{
869 struct pci_dev *pPciDev = pIns->pPciDev;
870 int rc = VINF_SUCCESS;
871 IPRT_LINUX_SAVE_EFL_AC();
872
873 if (RT_LIKELY(pPciDev))
874 {
875 switch (pValue->cb)
876 {
877 case 1:
878 pci_write_config_byte(pPciDev, Register, pValue->u.u8);
879 break;
880 case 2:
881 pci_write_config_word(pPciDev, Register, pValue->u.u16);
882 break;
883 case 4:
884 pci_write_config_dword(pPciDev, Register, pValue->u.u32);
885 break;
886 }
887 }
888 else
889 rc = VERR_INVALID_PARAMETER;
890
891 IPRT_LINUX_RESTORE_EFL_AC();
892 return rc;
893}
894
895DECLHIDDEN(int) vboxPciOsDevPciCfgRead(PVBOXRAWPCIINS pIns, uint32_t Register, PCIRAWMEMLOC *pValue)
896{
897 struct pci_dev *pPciDev = pIns->pPciDev;
898 int rc = VINF_SUCCESS;
899
900 if (RT_LIKELY(pPciDev))
901 {
902 IPRT_LINUX_SAVE_EFL_AC();
903
904 switch (pValue->cb)
905 {
906 case 1:
907 pci_read_config_byte(pPciDev, Register, &pValue->u.u8);
908 break;
909 case 2:
910 pci_read_config_word(pPciDev, Register, &pValue->u.u16);
911 break;
912 case 4:
913 pci_read_config_dword(pPciDev, Register, &pValue->u.u32);
914 break;
915 }
916
917 IPRT_LINUX_RESTORE_EFL_AC();
918 }
919 else
920 rc = VERR_INVALID_PARAMETER;
921
922 return rc;
923}
924
925/**
926 * Interrupt service routine.
927 *
928 * @returns In 2.6 we indicate whether we've handled the IRQ or not.
929 *
930 * @param iIrq The IRQ number.
931 * @param pvDevId The device ID, a pointer to PVBOXRAWPCIINS.
932 * @param pRegs Register set. Removed in 2.6.19.
933 */
934#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 19) && !defined(DOXYGEN_RUNNING)
935static irqreturn_t vboxPciOsIrqHandler(int iIrq, void *pvDevId)
936#else
937static irqreturn_t vboxPciOsIrqHandler(int iIrq, void *pvDevId, struct pt_regs *pRegs)
938#endif
939{
940 PVBOXRAWPCIINS pIns = (PVBOXRAWPCIINS)pvDevId;
941 bool fTaken = true;
942
943 if (pIns && pIns->IrqHandler.pfnIrqHandler)
944 fTaken = pIns->IrqHandler.pfnIrqHandler(pIns->IrqHandler.pIrqContext, iIrq);
945#ifndef VBOX_WITH_SHARED_PCI_INTERRUPTS
946 /* If we don't allow interrupts sharing, we consider all interrupts as non-shared, thus targetted to us. */
947 fTaken = true;
948#endif
949
950 return fTaken;
951}
952
953DECLHIDDEN(int) vboxPciOsDevRegisterIrqHandler(PVBOXRAWPCIINS pIns, PFNRAWPCIISR pfnHandler, void* pIrqContext, int32_t *piHostIrq)
954{
955 int rc;
956 int32_t iIrq = pIns->pPciDev->irq;
957 IPRT_LINUX_SAVE_EFL_AC();
958
959 if (iIrq == 0)
960 {
961 vbpci_printk(KERN_NOTICE, pIns->pPciDev, "no irq assigned\n");
962 IPRT_LINUX_RESTORE_EFL_AC();
963 return VERR_INVALID_PARAMETER;
964 }
965
966 rc = request_irq(iIrq,
967 vboxPciOsIrqHandler,
968#ifdef VBOX_WITH_SHARED_PCI_INTERRUPTS
969 /* Allow interrupts sharing. */
970# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 20)
971 IRQF_SHARED,
972# else
973 SA_SHIRQ,
974# endif
975
976#else
977
978 /* We don't allow interrupts sharing */
979 /* XXX overhaul */
980# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 20) && LINUX_VERSION_CODE < KERNEL_VERSION(4, 1, 0)
981 IRQF_DISABLED, /* keep irqs disabled when calling the action handler */
982# else
983 0,
984# endif
985#endif
986 DRIVER_NAME,
987 pIns);
988 if (rc)
989 {
990 vbpci_printk(KERN_DEBUG, pIns->pPciDev,
991 "could not request irq %d, error %d\n", iIrq, rc);
992 IPRT_LINUX_RESTORE_EFL_AC();
993 return VERR_RESOURCE_BUSY;
994 }
995
996 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "got irq %d\n", iIrq);
997 *piHostIrq = iIrq;
998
999 IPRT_LINUX_RESTORE_EFL_AC();
1000 return VINF_SUCCESS;
1001}
1002
1003DECLHIDDEN(int) vboxPciOsDevUnregisterIrqHandler(PVBOXRAWPCIINS pIns, int32_t iHostIrq)
1004{
1005 IPRT_LINUX_SAVE_EFL_AC();
1006
1007 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "freeing irq %d\n", iHostIrq);
1008 free_irq(iHostIrq, pIns);
1009
1010 IPRT_LINUX_RESTORE_EFL_AC();
1011 return VINF_SUCCESS;
1012}
1013
1014DECLHIDDEN(int) vboxPciOsDevPowerStateChange(PVBOXRAWPCIINS pIns, PCIRAWPOWERSTATE aState)
1015{
1016 int rc;
1017
1018 switch (aState)
1019 {
1020 case PCIRAW_POWER_ON:
1021 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "PCIRAW_POWER_ON\n");
1022 /* Reset device, just in case. */
1023 vboxPciLinuxDevReset(pIns);
1024 /* register us with IOMMU */
1025 rc = vboxPciLinuxDevRegisterWithIommu(pIns);
1026 break;
1027 case PCIRAW_POWER_RESET:
1028 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "PCIRAW_POWER_RESET\n");
1029 rc = vboxPciLinuxDevReset(pIns);
1030 break;
1031 case PCIRAW_POWER_OFF:
1032 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "PCIRAW_POWER_OFF\n");
1033 /* unregister us from IOMMU */
1034 rc = vboxPciLinuxDevUnregisterWithIommu(pIns);
1035 break;
1036 case PCIRAW_POWER_SUSPEND:
1037 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "PCIRAW_POWER_SUSPEND\n");
1038 rc = VINF_SUCCESS;
1039 /// @todo what do we do here?
1040 break;
1041 case PCIRAW_POWER_RESUME:
1042 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "PCIRAW_POWER_RESUME\n");
1043 rc = VINF_SUCCESS;
1044 /// @todo what do we do here?
1045 break;
1046 default:
1047 vbpci_printk(KERN_DEBUG, pIns->pPciDev, "unknown power state %u\n", aState);
1048 /* to make compiler happy */
1049 rc = VERR_NOT_SUPPORTED;
1050 break;
1051 }
1052
1053 return rc;
1054}
1055
1056
1057#ifdef VBOX_WITH_IOMMU
1058/** Callback for FNRAWPCICONTIGPHYSMEMINFO. */
1059static DECLCALLBACK(int) vboxPciOsContigMemInfo(PRAWPCIPERVM pVmCtx, RTHCPHYS HostStart, RTGCPHYS GuestStart,
1060 uint64_t cMemSize, PCIRAWMEMINFOACTION Action)
1061{
1062 struct iommu_domain* domain = ((PVBOXRAWPCIDRVVM)(pVmCtx->pDriverData))->pIommuDomain;
1063 int rc = VINF_SUCCESS;
1064 IPRT_LINUX_SAVE_EFL_AC();
1065
1066 switch (Action)
1067 {
1068 case PCIRAW_MEMINFO_MAP:
1069 {
1070 int flags, r;
1071
1072 if (iommu_iova_to_phys(domain, GuestStart))
1073 break;
1074
1075 flags = IOMMU_READ | IOMMU_WRITE;
1076 /** @todo flags |= IOMMU_CACHE; */
1077
1078 r = iommu_map(domain, GuestStart, HostStart, get_order(cMemSize), flags);
1079 if (r)
1080 {
1081 printk(KERN_ERR "vboxPciOsContigMemInfo:"
1082 "iommu failed to map pfn=%llx\n", HostStart);
1083 rc = VERR_GENERAL_FAILURE;
1084 break;
1085 }
1086 rc = VINF_SUCCESS;
1087 break;
1088 }
1089 case PCIRAW_MEMINFO_UNMAP:
1090 {
1091 int order;
1092 order = iommu_unmap(domain, GuestStart, get_order(cMemSize));
1093 NOREF(order);
1094 break;
1095 }
1096
1097 default:
1098 printk(KERN_DEBUG "Unsupported action: %d\n", (int)Action);
1099 rc = VERR_NOT_SUPPORTED;
1100 break;
1101 }
1102
1103 IPRT_LINUX_RESTORE_EFL_AC();
1104 return rc;
1105}
1106#endif
1107
1108DECLHIDDEN(int) vboxPciOsInitVm(PVBOXRAWPCIDRVVM pThis, PVM pVM, PRAWPCIPERVM pVmData)
1109{
1110 int rc = VINF_SUCCESS;
1111
1112#ifdef VBOX_WITH_IOMMU
1113 IPRT_LINUX_SAVE_EFL_AC();
1114
1115 if (IOMMU_PRESENT())
1116 {
1117 pThis->pIommuDomain = IOMMU_DOMAIN_ALLOC();
1118 if (!pThis->pIommuDomain)
1119 {
1120 vbpci_printk(KERN_DEBUG, NULL, "cannot allocate IOMMU domain\n");
1121 rc = VERR_NO_MEMORY;
1122 }
1123 else
1124 {
1125 pVmData->pfnContigMemInfo = vboxPciOsContigMemInfo;
1126
1127 vbpci_printk(KERN_DEBUG, NULL, "created IOMMU domain %p\n",
1128 pThis->pIommuDomain);
1129 }
1130 }
1131
1132 IPRT_LINUX_RESTORE_EFL_AC();
1133#endif
1134 return rc;
1135}
1136
1137DECLHIDDEN(void) vboxPciOsDeinitVm(PVBOXRAWPCIDRVVM pThis, PVM pVM)
1138{
1139#ifdef VBOX_WITH_IOMMU
1140 IPRT_LINUX_SAVE_EFL_AC();
1141
1142 if (pThis->pIommuDomain)
1143 {
1144 vbpci_printk(KERN_DEBUG, NULL, "freeing IOMMU domain %p\n",
1145 pThis->pIommuDomain);
1146 iommu_domain_free(pThis->pIommuDomain);
1147 pThis->pIommuDomain = NULL;
1148 }
1149
1150 IPRT_LINUX_RESTORE_EFL_AC();
1151#endif
1152}
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette