VirtualBox

source: vbox/trunk/src/VBox/Devices/Network/DevVirtioNet.cpp@ 74579

Last change on this file since 74579 was 73415, checked in by vboxsync, 6 years ago

Build fix for r124028

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 84.8 KB
Line 
1/* $Id: DevVirtioNet.cpp 73415 2018-07-31 17:21:54Z vboxsync $ */
2/** @file
3 * DevVirtioNet - Virtio Network Device
4 */
5
6/*
7 * Copyright (C) 2009-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_DEV_VIRTIO_NET
23#define VNET_GC_SUPPORT
24#define VNET_WITH_GSO
25#define VNET_WITH_MERGEABLE_RX_BUFS
26
27#include <VBox/vmm/pdmdev.h>
28#include <VBox/vmm/pdmnetifs.h>
29#include <iprt/asm.h>
30#include <iprt/net.h>
31#include <iprt/semaphore.h>
32#ifdef IN_RING3
33# include <iprt/mem.h>
34# include <iprt/uuid.h>
35#endif /* IN_RING3 */
36#include <VBox/VBoxPktDmp.h>
37#include "VBoxDD.h"
38#include "../VirtIO/Virtio.h"
39
40
41/*********************************************************************************************************************************
42* Defined Constants And Macros *
43*********************************************************************************************************************************/
44#ifndef VBOX_DEVICE_STRUCT_TESTCASE
45
46#define INSTANCE(pThis) pThis->VPCI.szInstance
47#define STATUS pThis->config.uStatus
48
49#ifdef IN_RING3
50
51#define VNET_PCI_CLASS 0x0200
52#define VNET_N_QUEUES 3
53#define VNET_NAME_FMT "VNet%d"
54
55#if 0
56/* Virtio Block Device */
57#define VNET_PCI_CLASS 0x0180
58#define VNET_N_QUEUES 2
59#define VNET_NAME_FMT "VBlk%d"
60#endif
61
62#endif /* IN_RING3 */
63
64#endif /* VBOX_DEVICE_STRUCT_TESTCASE */
65
66/*
67 * Commenting out VNET_TX_DELAY enables async transmission in a dedicated thread.
68 * When VNET_TX_DELAY is defined, a timer handler does the job.
69 */
70//#define VNET_TX_DELAY 150 /**< 150 microseconds */
71#define VNET_MAX_FRAME_SIZE 65535 + 18 /**< Max IP packet size + Ethernet header with VLAN tag */
72#define VNET_MAC_FILTER_LEN 32
73#define VNET_MAX_VID (1 << 12)
74
75/** @name Virtio net features
76 * @{ */
77#define VNET_F_CSUM 0x00000001 /**< Host handles pkts w/ partial csum */
78#define VNET_F_GUEST_CSUM 0x00000002 /**< Guest handles pkts w/ partial csum */
79#define VNET_F_MAC 0x00000020 /**< Host has given MAC address. */
80#define VNET_F_GSO 0x00000040 /**< Host handles pkts w/ any GSO type */
81#define VNET_F_GUEST_TSO4 0x00000080 /**< Guest can handle TSOv4 in. */
82#define VNET_F_GUEST_TSO6 0x00000100 /**< Guest can handle TSOv6 in. */
83#define VNET_F_GUEST_ECN 0x00000200 /**< Guest can handle TSO[6] w/ ECN in. */
84#define VNET_F_GUEST_UFO 0x00000400 /**< Guest can handle UFO in. */
85#define VNET_F_HOST_TSO4 0x00000800 /**< Host can handle TSOv4 in. */
86#define VNET_F_HOST_TSO6 0x00001000 /**< Host can handle TSOv6 in. */
87#define VNET_F_HOST_ECN 0x00002000 /**< Host can handle TSO[6] w/ ECN in. */
88#define VNET_F_HOST_UFO 0x00004000 /**< Host can handle UFO in. */
89#define VNET_F_MRG_RXBUF 0x00008000 /**< Host can merge receive buffers. */
90#define VNET_F_STATUS 0x00010000 /**< virtio_net_config.status available */
91#define VNET_F_CTRL_VQ 0x00020000 /**< Control channel available */
92#define VNET_F_CTRL_RX 0x00040000 /**< Control channel RX mode support */
93#define VNET_F_CTRL_VLAN 0x00080000 /**< Control channel VLAN filtering */
94/** @} */
95
96#define VNET_S_LINK_UP 1
97
98
99/*********************************************************************************************************************************
100* Structures and Typedefs *
101*********************************************************************************************************************************/
102#ifdef _MSC_VER
103struct VNetPCIConfig
104#else /* !_MSC_VER */
105struct __attribute__ ((__packed__)) VNetPCIConfig /** @todo r=bird: Use #pragma pack if necessary, that's portable! */
106#endif /* !_MSC_VER */
107{
108 RTMAC mac;
109 uint16_t uStatus;
110};
111AssertCompileMemberOffset(struct VNetPCIConfig, uStatus, 6);
112
113/**
114 * Device state structure. Holds the current state of device.
115 *
116 * @extends VPCISTATE
117 * @implements PDMINETWORKDOWN
118 * @implements PDMINETWORKCONFIG
119 */
120typedef struct VNetState_st
121{
122 /* VPCISTATE must be the first member! */
123 VPCISTATE VPCI;
124
125// PDMCRITSECT csRx; /**< Protects RX queue. */
126
127 PDMINETWORKDOWN INetworkDown;
128 PDMINETWORKCONFIG INetworkConfig;
129 R3PTRTYPE(PPDMIBASE) pDrvBase; /**< Attached network driver. */
130 R3PTRTYPE(PPDMINETWORKUP) pDrv; /**< Connector of attached network driver. */
131
132 R3PTRTYPE(PPDMQUEUE) pCanRxQueueR3; /**< Rx wakeup signaller - R3. */
133 R0PTRTYPE(PPDMQUEUE) pCanRxQueueR0; /**< Rx wakeup signaller - R0. */
134 RCPTRTYPE(PPDMQUEUE) pCanRxQueueRC; /**< Rx wakeup signaller - RC. */
135# if HC_ARCH_BITS == 64
136 uint32_t padding;
137# endif
138
139 /**< Link Up(/Restore) Timer. */
140 PTMTIMERR3 pLinkUpTimer;
141
142#ifdef VNET_TX_DELAY
143 /**< Transmit Delay Timer - R3. */
144 PTMTIMERR3 pTxTimerR3;
145 /**< Transmit Delay Timer - R0. */
146 PTMTIMERR0 pTxTimerR0;
147 /**< Transmit Delay Timer - GC. */
148 PTMTIMERRC pTxTimerRC;
149
150# if HC_ARCH_BITS == 64
151 uint32_t padding2;
152# endif
153
154 uint32_t u32i;
155 uint32_t u32AvgDiff;
156 uint32_t u32MinDiff;
157 uint32_t u32MaxDiff;
158 uint64_t u64NanoTS;
159#else /* !VNET_TX_DELAY */
160 /** The support driver session handle. */
161 R3R0PTRTYPE(PSUPDRVSESSION) pSupDrvSession;
162 /** The event semaphore TX thread waits on. */
163 SUPSEMEVENT hTxEvent;
164 R3PTRTYPE(PPDMTHREAD) pTxThread;
165#endif /* !VNET_TX_DELAY */
166
167 /** Indicates transmission in progress -- only one thread is allowed. */
168 uint32_t uIsTransmitting;
169
170 /** PCI config area holding MAC address as well as TBD. */
171 struct VNetPCIConfig config;
172 /** MAC address obtained from the configuration. */
173 RTMAC macConfigured;
174 /** True if physical cable is attached in configuration. */
175 bool fCableConnected;
176 /** Link up delay (in milliseconds). */
177 uint32_t cMsLinkUpDelay;
178
179 uint32_t alignment;
180
181 /** Number of packet being sent/received to show in debug log. */
182 uint32_t u32PktNo;
183
184 /** N/A: */
185 bool volatile fMaybeOutOfSpace;
186
187 /** Promiscuous mode -- RX filter accepts all packets. */
188 bool fPromiscuous;
189 /** AllMulti mode -- RX filter accepts all multicast packets. */
190 bool fAllMulti;
191 /** The number of actually used slots in aMacTable. */
192 uint32_t nMacFilterEntries;
193 /** Array of MAC addresses accepted by RX filter. */
194 RTMAC aMacFilter[VNET_MAC_FILTER_LEN];
195 /** Bit array of VLAN filter, one bit per VLAN ID. */
196 uint8_t aVlanFilter[VNET_MAX_VID / sizeof(uint8_t)];
197
198 R3PTRTYPE(PVQUEUE) pRxQueue;
199 R3PTRTYPE(PVQUEUE) pTxQueue;
200 R3PTRTYPE(PVQUEUE) pCtlQueue;
201 /* Receive-blocking-related fields ***************************************/
202
203 /** EMT: Gets signalled when more RX descriptors become available. */
204 RTSEMEVENT hEventMoreRxDescAvail;
205
206 /** @name Statistic
207 * @{ */
208 STAMCOUNTER StatReceiveBytes;
209 STAMCOUNTER StatTransmitBytes;
210 STAMCOUNTER StatReceiveGSO;
211 STAMCOUNTER StatTransmitPackets;
212 STAMCOUNTER StatTransmitGSO;
213 STAMCOUNTER StatTransmitCSum;
214#if defined(VBOX_WITH_STATISTICS)
215 STAMPROFILE StatReceive;
216 STAMPROFILE StatReceiveStore;
217 STAMPROFILEADV StatTransmit;
218 STAMPROFILE StatTransmitSend;
219 STAMPROFILE StatRxOverflow;
220 STAMCOUNTER StatRxOverflowWakeup;
221 STAMCOUNTER StatTransmitByNetwork;
222 STAMCOUNTER StatTransmitByThread;
223#endif /* VBOX_WITH_STATISTICS */
224 /** @} */
225} VNETSTATE;
226/** Pointer to a virtual I/O network device state. */
227typedef VNETSTATE *PVNETSTATE;
228
229#ifndef VBOX_DEVICE_STRUCT_TESTCASE
230
231#define VNETHDR_F_NEEDS_CSUM 1 // Use u16CSumStart, u16CSumOffset
232
233#define VNETHDR_GSO_NONE 0 // Not a GSO frame
234#define VNETHDR_GSO_TCPV4 1 // GSO frame, IPv4 TCP (TSO)
235#define VNETHDR_GSO_UDP 3 // GSO frame, IPv4 UDP (UFO)
236#define VNETHDR_GSO_TCPV6 4 // GSO frame, IPv6 TCP
237#define VNETHDR_GSO_ECN 0x80 // TCP has ECN set
238
239struct VNetHdr
240{
241 uint8_t u8Flags;
242 uint8_t u8GSOType;
243 uint16_t u16HdrLen;
244 uint16_t u16GSOSize;
245 uint16_t u16CSumStart;
246 uint16_t u16CSumOffset;
247};
248typedef struct VNetHdr VNETHDR;
249typedef VNETHDR *PVNETHDR;
250AssertCompileSize(VNETHDR, 10);
251
252struct VNetHdrMrx
253{
254 VNETHDR Hdr;
255 uint16_t u16NumBufs;
256};
257typedef struct VNetHdrMrx VNETHDRMRX;
258typedef VNETHDRMRX *PVNETHDRMRX;
259AssertCompileSize(VNETHDRMRX, 12);
260
261AssertCompileMemberOffset(VNETSTATE, VPCI, 0);
262
263#define VNET_OK 0
264#define VNET_ERROR 1
265typedef uint8_t VNETCTLACK;
266
267#define VNET_CTRL_CLS_RX_MODE 0
268#define VNET_CTRL_CMD_RX_MODE_PROMISC 0
269#define VNET_CTRL_CMD_RX_MODE_ALLMULTI 1
270
271#define VNET_CTRL_CLS_MAC 1
272#define VNET_CTRL_CMD_MAC_TABLE_SET 0
273
274#define VNET_CTRL_CLS_VLAN 2
275#define VNET_CTRL_CMD_VLAN_ADD 0
276#define VNET_CTRL_CMD_VLAN_DEL 1
277
278
279struct VNetCtlHdr
280{
281 uint8_t u8Class;
282 uint8_t u8Command;
283};
284typedef struct VNetCtlHdr VNETCTLHDR;
285typedef VNETCTLHDR *PVNETCTLHDR;
286AssertCompileSize(VNETCTLHDR, 2);
287
288#ifdef IN_RING3
289
290/** Returns true if large packets are written into several RX buffers. */
291DECLINLINE(bool) vnetMergeableRxBuffers(PVNETSTATE pThis)
292{
293 return !!(pThis->VPCI.uGuestFeatures & VNET_F_MRG_RXBUF);
294}
295
296DECLINLINE(int) vnetCsEnter(PVNETSTATE pThis, int rcBusy)
297{
298 return vpciCsEnter(&pThis->VPCI, rcBusy);
299}
300
301DECLINLINE(void) vnetCsLeave(PVNETSTATE pThis)
302{
303 vpciCsLeave(&pThis->VPCI);
304}
305
306#endif /* IN_RING3 */
307
308DECLINLINE(int) vnetCsRxEnter(PVNETSTATE pThis, int rcBusy)
309{
310 RT_NOREF_PV(pThis);
311 RT_NOREF_PV(rcBusy);
312 // STAM_PROFILE_START(&pThis->CTXSUFF(StatCsRx), a);
313 // int rc = PDMCritSectEnter(&pThis->csRx, rcBusy);
314 // STAM_PROFILE_STOP(&pThis->CTXSUFF(StatCsRx), a);
315 // return rc;
316 return VINF_SUCCESS;
317}
318
319DECLINLINE(void) vnetCsRxLeave(PVNETSTATE pThis)
320{
321 RT_NOREF_PV(pThis);
322 // PDMCritSectLeave(&pThis->csRx);
323}
324
325#ifdef IN_RING3
326/**
327 * Dump a packet to debug log.
328 *
329 * @param pThis The device state structure.
330 * @param pbPacket The packet.
331 * @param cb The size of the packet.
332 * @param pszText A string denoting direction of packet transfer.
333 */
334DECLINLINE(void) vnetPacketDump(PVNETSTATE pThis, const uint8_t *pbPacket, size_t cb, const char *pszText)
335{
336# ifdef DEBUG
337# if 0
338 Log(("%s %s packet #%d (%d bytes):\n",
339 INSTANCE(pThis), pszText, ++pThis->u32PktNo, cb));
340 Log3(("%.*Rhxd\n", cb, pbPacket));
341# else
342 vboxEthPacketDump(INSTANCE(pThis), pszText, pbPacket, (uint32_t)cb);
343# endif
344# else
345 RT_NOREF4(pThis, pbPacket, cb, pszText);
346# endif
347}
348#endif /* IN_RING3 */
349
350/**
351 * Print features given in uFeatures to debug log.
352 *
353 * @param pThis The device state structure.
354 * @param fFeatures Descriptions of which features to print.
355 * @param pcszText A string to print before the list of features.
356 */
357DECLINLINE(void) vnetPrintFeatures(PVNETSTATE pThis, uint32_t fFeatures, const char *pcszText)
358{
359#ifdef DEBUG
360 static struct
361 {
362 uint32_t uMask;
363 const char *pcszDesc;
364 } const s_aFeatures[] =
365 {
366 { VNET_F_CSUM, "host handles pkts w/ partial csum" },
367 { VNET_F_GUEST_CSUM, "guest handles pkts w/ partial csum" },
368 { VNET_F_MAC, "host has given MAC address" },
369 { VNET_F_GSO, "host handles pkts w/ any GSO type" },
370 { VNET_F_GUEST_TSO4, "guest can handle TSOv4 in" },
371 { VNET_F_GUEST_TSO6, "guest can handle TSOv6 in" },
372 { VNET_F_GUEST_ECN, "guest can handle TSO[6] w/ ECN in" },
373 { VNET_F_GUEST_UFO, "guest can handle UFO in" },
374 { VNET_F_HOST_TSO4, "host can handle TSOv4 in" },
375 { VNET_F_HOST_TSO6, "host can handle TSOv6 in" },
376 { VNET_F_HOST_ECN, "host can handle TSO[6] w/ ECN in" },
377 { VNET_F_HOST_UFO, "host can handle UFO in" },
378 { VNET_F_MRG_RXBUF, "host can merge receive buffers" },
379 { VNET_F_STATUS, "virtio_net_config.status available" },
380 { VNET_F_CTRL_VQ, "control channel available" },
381 { VNET_F_CTRL_RX, "control channel RX mode support" },
382 { VNET_F_CTRL_VLAN, "control channel VLAN filtering" }
383 };
384
385 Log3(("%s %s:\n", INSTANCE(pThis), pcszText));
386 for (unsigned i = 0; i < RT_ELEMENTS(s_aFeatures); ++i)
387 {
388 if (s_aFeatures[i].uMask & fFeatures)
389 Log3(("%s --> %s\n", INSTANCE(pThis), s_aFeatures[i].pcszDesc));
390 }
391#else /* !DEBUG */
392 RT_NOREF3(pThis, fFeatures, pcszText);
393#endif /* !DEBUG */
394}
395
396static DECLCALLBACK(uint32_t) vnetIoCb_GetHostFeatures(void *pvState)
397{
398 RT_NOREF_PV(pvState);
399
400 /* We support:
401 * - Host-provided MAC address
402 * - Link status reporting in config space
403 * - Control queue
404 * - RX mode setting
405 * - MAC filter table
406 * - VLAN filter
407 */
408 return VNET_F_MAC
409 | VNET_F_STATUS
410 | VNET_F_CTRL_VQ
411 | VNET_F_CTRL_RX
412 | VNET_F_CTRL_VLAN
413#ifdef VNET_WITH_GSO
414 | VNET_F_CSUM
415 | VNET_F_HOST_TSO4
416 | VNET_F_HOST_TSO6
417 | VNET_F_HOST_UFO
418 | VNET_F_GUEST_CSUM /* We expect the guest to accept partial TCP checksums (see @bugref{4796}) */
419 | VNET_F_GUEST_TSO4
420 | VNET_F_GUEST_TSO6
421 | VNET_F_GUEST_UFO
422#endif
423#ifdef VNET_WITH_MERGEABLE_RX_BUFS
424 | VNET_F_MRG_RXBUF
425#endif
426 ;
427}
428
429static DECLCALLBACK(uint32_t) vnetIoCb_GetHostMinimalFeatures(void *pvState)
430{
431 RT_NOREF_PV(pvState);
432 return VNET_F_MAC;
433}
434
435static DECLCALLBACK(void) vnetIoCb_SetHostFeatures(void *pvState, uint32_t fFeatures)
436{
437 /** @todo Nothing to do here yet */
438 PVNETSTATE pThis = (PVNETSTATE)pvState;
439 LogFlow(("%s vnetIoCb_SetHostFeatures: uFeatures=%x\n", INSTANCE(pThis), fFeatures));
440 vnetPrintFeatures(pThis, fFeatures, "The guest negotiated the following features");
441}
442
443static DECLCALLBACK(int) vnetIoCb_GetConfig(void *pvState, uint32_t offCfg, uint32_t cb, void *data)
444{
445 PVNETSTATE pThis = (PVNETSTATE)pvState;
446 if (offCfg + cb > sizeof(struct VNetPCIConfig))
447 {
448 Log(("%s vnetIoCb_GetConfig: Read beyond the config structure is attempted (offCfg=%#x cb=%x).\n", INSTANCE(pThis), offCfg, cb));
449 return VERR_IOM_IOPORT_UNUSED;
450 }
451 memcpy(data, (uint8_t *)&pThis->config + offCfg, cb);
452 return VINF_SUCCESS;
453}
454
455static DECLCALLBACK(int) vnetIoCb_SetConfig(void *pvState, uint32_t offCfg, uint32_t cb, void *data)
456{
457 PVNETSTATE pThis = (PVNETSTATE)pvState;
458 if (offCfg + cb > sizeof(struct VNetPCIConfig))
459 {
460 Log(("%s vnetIoCb_SetConfig: Write beyond the config structure is attempted (offCfg=%#x cb=%x).\n", INSTANCE(pThis), offCfg, cb));
461 if (offCfg < sizeof(struct VNetPCIConfig))
462 memcpy((uint8_t *)&pThis->config + offCfg, data,
463 sizeof(struct VNetPCIConfig) - offCfg);
464 return VINF_SUCCESS;
465 }
466 memcpy((uint8_t *)&pThis->config + offCfg, data, cb);
467 return VINF_SUCCESS;
468}
469
470/**
471 * Hardware reset. Revert all registers to initial values.
472 *
473 * @param pThis The device state structure.
474 */
475static DECLCALLBACK(int) vnetIoCb_Reset(void *pvState)
476{
477 PVNETSTATE pThis = (PVNETSTATE)pvState;
478 Log(("%s Reset triggered\n", INSTANCE(pThis)));
479
480 int rc = vnetCsRxEnter(pThis, VERR_SEM_BUSY);
481 if (RT_UNLIKELY(rc != VINF_SUCCESS))
482 {
483 LogRel(("vnetIoCb_Reset failed to enter RX critical section!\n"));
484 return rc;
485 }
486 vpciReset(&pThis->VPCI);
487 vnetCsRxLeave(pThis);
488
489 /// @todo Implement reset
490 if (pThis->fCableConnected)
491 STATUS = VNET_S_LINK_UP;
492 else
493 STATUS = 0;
494 Log(("%s vnetIoCb_Reset: Link is %s\n", INSTANCE(pThis), pThis->fCableConnected ? "up" : "down"));
495
496 /*
497 * By default we pass all packets up since the older guests cannot control
498 * virtio mode.
499 */
500 pThis->fPromiscuous = true;
501 pThis->fAllMulti = false;
502 pThis->nMacFilterEntries = 0;
503 memset(pThis->aMacFilter, 0, VNET_MAC_FILTER_LEN * sizeof(RTMAC));
504 memset(pThis->aVlanFilter, 0, sizeof(pThis->aVlanFilter));
505 pThis->uIsTransmitting = 0;
506#ifndef IN_RING3
507 return VINF_IOM_R3_IOPORT_WRITE;
508#else
509 if (pThis->pDrv)
510 pThis->pDrv->pfnSetPromiscuousMode(pThis->pDrv, true);
511 return VINF_SUCCESS;
512#endif
513}
514
515#ifdef IN_RING3
516
517/**
518 * Wakeup the RX thread.
519 */
520static void vnetWakeupReceive(PPDMDEVINS pDevIns)
521{
522 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
523 if ( pThis->fMaybeOutOfSpace
524 && pThis->hEventMoreRxDescAvail != NIL_RTSEMEVENT)
525 {
526 STAM_COUNTER_INC(&pThis->StatRxOverflowWakeup);
527 Log(("%s Waking up Out-of-RX-space semaphore\n", INSTANCE(pThis)));
528/**
529 * @todo r=bird: We can wake stuff up from ring-0 too, see vmsvga, nvme,
530 * buslogic, lsilogic, ata, ahci, xhci. Also, please address similar
531 * TODO in E1000.
532 *
533 * The API Is SUPSem*, btw.
534 */
535 RTSemEventSignal(pThis->hEventMoreRxDescAvail);
536 }
537}
538
539
540/**
541 * Helper function that raises an interrupt if the guest is ready to receive it.
542 */
543int vnetRaiseInterrupt(PVNETSTATE pThis, int rcBusy, uint8_t u8IntCause)
544{
545 if (pThis->VPCI.uStatus & VPCI_STATUS_DRV_OK)
546 return vpciRaiseInterrupt(&pThis->VPCI, rcBusy, u8IntCause);
547 return rcBusy;
548}
549
550
551/**
552 * Takes down the link temporarily if it's current status is up.
553 *
554 * This is used during restore and when replumbing the network link.
555 *
556 * The temporary link outage is supposed to indicate to the OS that all network
557 * connections have been lost and that it for instance is appropriate to
558 * renegotiate any DHCP lease.
559 *
560 * @param pThis The Virtual I/O network device state.
561 */
562static void vnetTempLinkDown(PVNETSTATE pThis)
563{
564 if (STATUS & VNET_S_LINK_UP)
565 {
566 STATUS &= ~VNET_S_LINK_UP;
567 vnetRaiseInterrupt(pThis, VERR_SEM_BUSY, VPCI_ISR_CONFIG);
568 /* Restore the link back in 5 seconds. */
569 int rc = TMTimerSetMillies(pThis->pLinkUpTimer, pThis->cMsLinkUpDelay);
570 AssertRC(rc);
571 Log(("%s vnetTempLinkDown: Link is down temporarily\n", INSTANCE(pThis)));
572 }
573}
574
575
576/**
577 * @callback_method_impl{FNTMTIMERDEV, Link Up Timer handler.}
578 */
579static DECLCALLBACK(void) vnetLinkUpTimer(PPDMDEVINS pDevIns, PTMTIMER pTimer, void *pvUser)
580{
581 RT_NOREF(pTimer);
582 PVNETSTATE pThis = (PVNETSTATE)pvUser;
583
584 int rc = vnetCsEnter(pThis, VERR_SEM_BUSY);
585 if (RT_UNLIKELY(rc != VINF_SUCCESS))
586 return;
587 STATUS |= VNET_S_LINK_UP;
588 vnetRaiseInterrupt(pThis, VERR_SEM_BUSY, VPCI_ISR_CONFIG);
589 vnetWakeupReceive(pDevIns);
590 vnetCsLeave(pThis);
591 Log(("%s vnetLinkUpTimer: Link is up\n", INSTANCE(pThis)));
592 if (pThis->pDrv)
593 pThis->pDrv->pfnNotifyLinkChanged(pThis->pDrv, PDMNETWORKLINKSTATE_UP);
594}
595
596
597/**
598 * @callback_method_impl{FNPDMQUEUEDEV, Handler for the wakeup signaller queue.}
599 */
600static DECLCALLBACK(bool) vnetCanRxQueueConsumer(PPDMDEVINS pDevIns, PPDMQUEUEITEMCORE pItem)
601{
602 RT_NOREF(pItem);
603 vnetWakeupReceive(pDevIns);
604 return true;
605}
606
607#endif /* IN_RING3 */
608
609/**
610 * This function is called when the driver becomes ready.
611 *
612 * @param pThis The device state structure.
613 */
614static DECLCALLBACK(void) vnetIoCb_Ready(void *pvState)
615{
616 PVNETSTATE pThis = (PVNETSTATE)pvState;
617 Log(("%s Driver became ready, waking up RX thread...\n", INSTANCE(pThis)));
618/**
619 * @todo r=bird: We can wake stuff up from ring-0 too, see vmsvga, nvme,
620 * buslogic, lsilogic, ata, ahci, xhci. Also, please address similar
621 * TODO in E1000.
622 *
623 * The API Is SUPSem*, btw.
624 */
625#ifdef IN_RING3
626 vnetWakeupReceive(pThis->VPCI.CTX_SUFF(pDevIns));
627#else
628 PPDMQUEUEITEMCORE pItem = PDMQueueAlloc(pThis->CTX_SUFF(pCanRxQueue));
629 if (pItem)
630 PDMQueueInsert(pThis->CTX_SUFF(pCanRxQueue), pItem);
631#endif
632}
633
634
635/**
636 * I/O port callbacks.
637 */
638static const VPCIIOCALLBACKS g_IOCallbacks =
639{
640 vnetIoCb_GetHostFeatures,
641 vnetIoCb_GetHostMinimalFeatures,
642 vnetIoCb_SetHostFeatures,
643 vnetIoCb_GetConfig,
644 vnetIoCb_SetConfig,
645 vnetIoCb_Reset,
646 vnetIoCb_Ready,
647};
648
649
650/**
651 * @callback_method_impl{FNIOMIOPORTIN}
652 */
653PDMBOTHCBDECL(int) vnetIOPortIn(PPDMDEVINS pDevIns, void *pvUser, RTIOPORT port, uint32_t *pu32, unsigned cb)
654{
655 return vpciIOPortIn(pDevIns, pvUser, port, pu32, cb, &g_IOCallbacks);
656}
657
658
659/**
660 * @callback_method_impl{FNIOMIOPORTOUT}
661 */
662PDMBOTHCBDECL(int) vnetIOPortOut(PPDMDEVINS pDevIns, void *pvUser, RTIOPORT port, uint32_t u32, unsigned cb)
663{
664 return vpciIOPortOut(pDevIns, pvUser, port, u32, cb, &g_IOCallbacks);
665}
666
667
668#ifdef IN_RING3
669
670/**
671 * Check if the device can receive data now.
672 * This must be called before the pfnRecieve() method is called.
673 *
674 * @remarks As a side effect this function enables queue notification
675 * if it cannot receive because the queue is empty.
676 * It disables notification if it can receive.
677 *
678 * @returns VERR_NET_NO_BUFFER_SPACE if it cannot.
679 * @param pInterface Pointer to the interface structure containing the called function pointer.
680 * @thread RX
681 */
682static int vnetCanReceive(PVNETSTATE pThis)
683{
684 int rc = vnetCsRxEnter(pThis, VERR_SEM_BUSY);
685 AssertRCReturn(rc, rc);
686
687 LogFlow(("%s vnetCanReceive\n", INSTANCE(pThis)));
688 if (!(pThis->VPCI.uStatus & VPCI_STATUS_DRV_OK))
689 rc = VERR_NET_NO_BUFFER_SPACE;
690 else if (!vqueueIsReady(&pThis->VPCI, pThis->pRxQueue))
691 rc = VERR_NET_NO_BUFFER_SPACE;
692 else if (vqueueIsEmpty(&pThis->VPCI, pThis->pRxQueue))
693 {
694 vringSetNotification(&pThis->VPCI, &pThis->pRxQueue->VRing, true);
695 rc = VERR_NET_NO_BUFFER_SPACE;
696 }
697 else
698 {
699 vringSetNotification(&pThis->VPCI, &pThis->pRxQueue->VRing, false);
700 rc = VINF_SUCCESS;
701 }
702
703 LogFlow(("%s vnetCanReceive -> %Rrc\n", INSTANCE(pThis), rc));
704 vnetCsRxLeave(pThis);
705 return rc;
706}
707
708/**
709 * @interface_method_impl{PDMINETWORKDOWN,pfnWaitReceiveAvail}
710 */
711static DECLCALLBACK(int) vnetNetworkDown_WaitReceiveAvail(PPDMINETWORKDOWN pInterface, RTMSINTERVAL cMillies)
712{
713 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkDown);
714 LogFlow(("%s vnetNetworkDown_WaitReceiveAvail(cMillies=%u)\n", INSTANCE(pThis), cMillies));
715 int rc = vnetCanReceive(pThis);
716
717 if (RT_SUCCESS(rc))
718 return VINF_SUCCESS;
719 if (RT_UNLIKELY(cMillies == 0))
720 return VERR_NET_NO_BUFFER_SPACE;
721
722 rc = VERR_INTERRUPTED;
723 ASMAtomicXchgBool(&pThis->fMaybeOutOfSpace, true);
724 STAM_PROFILE_START(&pThis->StatRxOverflow, a);
725
726 VMSTATE enmVMState;
727 while (RT_LIKELY( (enmVMState = PDMDevHlpVMState(pThis->VPCI.CTX_SUFF(pDevIns))) == VMSTATE_RUNNING
728 || enmVMState == VMSTATE_RUNNING_LS))
729 {
730 int rc2 = vnetCanReceive(pThis);
731 if (RT_SUCCESS(rc2))
732 {
733 rc = VINF_SUCCESS;
734 break;
735 }
736 Log(("%s vnetNetworkDown_WaitReceiveAvail: waiting cMillies=%u...\n", INSTANCE(pThis), cMillies));
737 RTSemEventWait(pThis->hEventMoreRxDescAvail, cMillies);
738 }
739 STAM_PROFILE_STOP(&pThis->StatRxOverflow, a);
740 ASMAtomicXchgBool(&pThis->fMaybeOutOfSpace, false);
741
742 LogFlow(("%s vnetNetworkDown_WaitReceiveAvail -> %d\n", INSTANCE(pThis), rc));
743 return rc;
744}
745
746
747/**
748 * @interface_method_impl{PDMIBASE,pfnQueryInterface}
749 */
750static DECLCALLBACK(void *) vnetQueryInterface(struct PDMIBASE *pInterface, const char *pszIID)
751{
752 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, VPCI.IBase);
753 Assert(&pThis->VPCI.IBase == pInterface);
754
755 PDMIBASE_RETURN_INTERFACE(pszIID, PDMINETWORKDOWN, &pThis->INetworkDown);
756 PDMIBASE_RETURN_INTERFACE(pszIID, PDMINETWORKCONFIG, &pThis->INetworkConfig);
757 return vpciQueryInterface(pInterface, pszIID);
758}
759
760/**
761 * Returns true if it is a broadcast packet.
762 *
763 * @returns true if destination address indicates broadcast.
764 * @param pvBuf The ethernet packet.
765 */
766DECLINLINE(bool) vnetIsBroadcast(const void *pvBuf)
767{
768 static const uint8_t s_abBcastAddr[] = { 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF };
769 return memcmp(pvBuf, s_abBcastAddr, sizeof(s_abBcastAddr)) == 0;
770}
771
772/**
773 * Returns true if it is a multicast packet.
774 *
775 * @remarks returns true for broadcast packets as well.
776 * @returns true if destination address indicates multicast.
777 * @param pvBuf The ethernet packet.
778 */
779DECLINLINE(bool) vnetIsMulticast(const void *pvBuf)
780{
781 return (*(char*)pvBuf) & 1;
782}
783
784/**
785 * Determines if the packet is to be delivered to upper layer.
786 *
787 * @returns true if packet is intended for this node.
788 * @param pThis Pointer to the state structure.
789 * @param pvBuf The ethernet packet.
790 * @param cb Number of bytes available in the packet.
791 */
792static bool vnetAddressFilter(PVNETSTATE pThis, const void *pvBuf, size_t cb)
793{
794 if (pThis->fPromiscuous)
795 return true;
796
797 /* Ignore everything outside of our VLANs */
798 uint16_t *u16Ptr = (uint16_t*)pvBuf;
799 /* Compare TPID with VLAN Ether Type */
800 if ( u16Ptr[6] == RT_H2BE_U16(0x8100)
801 && !ASMBitTest(pThis->aVlanFilter, RT_BE2H_U16(u16Ptr[7]) & 0xFFF))
802 {
803 Log4(("%s vnetAddressFilter: not our VLAN, returning false\n", INSTANCE(pThis)));
804 return false;
805 }
806
807 if (vnetIsBroadcast(pvBuf))
808 return true;
809
810 if (pThis->fAllMulti && vnetIsMulticast(pvBuf))
811 return true;
812
813 if (!memcmp(pThis->config.mac.au8, pvBuf, sizeof(RTMAC)))
814 return true;
815 Log4(("%s vnetAddressFilter: %RTmac (conf) != %RTmac (dest)\n", INSTANCE(pThis), pThis->config.mac.au8, pvBuf));
816
817 for (unsigned i = 0; i < pThis->nMacFilterEntries; i++)
818 if (!memcmp(&pThis->aMacFilter[i], pvBuf, sizeof(RTMAC)))
819 return true;
820
821 Log2(("%s vnetAddressFilter: failed all tests, returning false, packet dump follows:\n", INSTANCE(pThis)));
822 vnetPacketDump(pThis, (const uint8_t *)pvBuf, cb, "<-- Incoming");
823
824 return false;
825}
826
827/**
828 * Pad and store received packet.
829 *
830 * @remarks Make sure that the packet appears to upper layer as one coming
831 * from real Ethernet: pad it and insert FCS.
832 *
833 * @returns VBox status code.
834 * @param pThis The device state structure.
835 * @param pvBuf The available data.
836 * @param cb Number of bytes available in the buffer.
837 * @thread RX
838 */
839static int vnetHandleRxPacket(PVNETSTATE pThis, const void *pvBuf, size_t cb,
840 PCPDMNETWORKGSO pGso)
841{
842 VNETHDRMRX Hdr;
843 unsigned uHdrLen;
844 RTGCPHYS addrHdrMrx = 0;
845
846 if (pGso)
847 {
848 Log2(("%s vnetHandleRxPacket: gso type=%x cbHdrsTotal=%u cbHdrsSeg=%u mss=%u off1=0x%x off2=0x%x\n",
849 INSTANCE(pThis), pGso->u8Type, pGso->cbHdrsTotal, pGso->cbHdrsSeg, pGso->cbMaxSeg, pGso->offHdr1, pGso->offHdr2));
850 Hdr.Hdr.u8Flags = VNETHDR_F_NEEDS_CSUM;
851 switch (pGso->u8Type)
852 {
853 case PDMNETWORKGSOTYPE_IPV4_TCP:
854 Hdr.Hdr.u8GSOType = VNETHDR_GSO_TCPV4;
855 Hdr.Hdr.u16CSumOffset = RT_OFFSETOF(RTNETTCP, th_sum);
856 break;
857 case PDMNETWORKGSOTYPE_IPV6_TCP:
858 Hdr.Hdr.u8GSOType = VNETHDR_GSO_TCPV6;
859 Hdr.Hdr.u16CSumOffset = RT_OFFSETOF(RTNETTCP, th_sum);
860 break;
861 case PDMNETWORKGSOTYPE_IPV4_UDP:
862 Hdr.Hdr.u8GSOType = VNETHDR_GSO_UDP;
863 Hdr.Hdr.u16CSumOffset = RT_OFFSETOF(RTNETUDP, uh_sum);
864 break;
865 default:
866 return VERR_INVALID_PARAMETER;
867 }
868 Hdr.Hdr.u16HdrLen = pGso->cbHdrsTotal;
869 Hdr.Hdr.u16GSOSize = pGso->cbMaxSeg;
870 Hdr.Hdr.u16CSumStart = pGso->offHdr2;
871 STAM_REL_COUNTER_INC(&pThis->StatReceiveGSO);
872 }
873 else
874 {
875 Hdr.Hdr.u8Flags = 0;
876 Hdr.Hdr.u8GSOType = VNETHDR_GSO_NONE;
877 }
878
879 if (vnetMergeableRxBuffers(pThis))
880 uHdrLen = sizeof(VNETHDRMRX);
881 else
882 uHdrLen = sizeof(VNETHDR);
883
884 vnetPacketDump(pThis, (const uint8_t *)pvBuf, cb, "<-- Incoming");
885
886 unsigned int uOffset = 0;
887 unsigned int nElem;
888 for (nElem = 0; uOffset < cb; nElem++)
889 {
890 VQUEUEELEM elem;
891 unsigned int nSeg = 0, uElemSize = 0, cbReserved = 0;
892
893 if (!vqueueGet(&pThis->VPCI, pThis->pRxQueue, &elem))
894 {
895 /*
896 * @todo: It is possible to run out of RX buffers if only a few
897 * were added and we received a big packet.
898 */
899 Log(("%s vnetHandleRxPacket: Suddenly there is no space in receive queue!\n", INSTANCE(pThis)));
900 return VERR_INTERNAL_ERROR;
901 }
902
903 if (elem.nIn < 1)
904 {
905 Log(("%s vnetHandleRxPacket: No writable descriptors in receive queue!\n", INSTANCE(pThis)));
906 return VERR_INTERNAL_ERROR;
907 }
908
909 if (nElem == 0)
910 {
911 if (vnetMergeableRxBuffers(pThis))
912 {
913 addrHdrMrx = elem.aSegsIn[nSeg].addr;
914 cbReserved = uHdrLen;
915 }
916 else
917 {
918 /* The very first segment of the very first element gets the header. */
919 if (elem.aSegsIn[nSeg].cb != sizeof(VNETHDR))
920 {
921 Log(("%s vnetHandleRxPacket: The first descriptor does match the header size!\n", INSTANCE(pThis)));
922 return VERR_INTERNAL_ERROR;
923 }
924 elem.aSegsIn[nSeg++].pv = &Hdr;
925 }
926 uElemSize += uHdrLen;
927 }
928 while (nSeg < elem.nIn && uOffset < cb)
929 {
930 unsigned int uSize = (unsigned int)RT_MIN(elem.aSegsIn[nSeg].cb - (nSeg?0:cbReserved),
931 cb - uOffset);
932 elem.aSegsIn[nSeg++].pv = (uint8_t*)pvBuf + uOffset;
933 uOffset += uSize;
934 uElemSize += uSize;
935 }
936 STAM_PROFILE_START(&pThis->StatReceiveStore, a);
937 vqueuePut(&pThis->VPCI, pThis->pRxQueue, &elem, uElemSize, cbReserved);
938 STAM_PROFILE_STOP(&pThis->StatReceiveStore, a);
939 if (!vnetMergeableRxBuffers(pThis))
940 break;
941 cbReserved = 0;
942 }
943 if (vnetMergeableRxBuffers(pThis))
944 {
945 Hdr.u16NumBufs = nElem;
946 int rc = PDMDevHlpPCIPhysWrite(pThis->VPCI.CTX_SUFF(pDevIns), addrHdrMrx,
947 &Hdr, sizeof(Hdr));
948 if (RT_FAILURE(rc))
949 {
950 Log(("%s vnetHandleRxPacket: Failed to write merged RX buf header: %Rrc\n", INSTANCE(pThis), rc));
951 return rc;
952 }
953 }
954 vqueueSync(&pThis->VPCI, pThis->pRxQueue);
955 if (uOffset < cb)
956 {
957 Log(("%s vnetHandleRxPacket: Packet did not fit into RX queue (packet size=%u)!\n", INSTANCE(pThis), cb));
958 return VERR_TOO_MUCH_DATA;
959 }
960
961 return VINF_SUCCESS;
962}
963
964/**
965 * @interface_method_impl{PDMINETWORKDOWN,pfnReceiveGso}
966 */
967static DECLCALLBACK(int) vnetNetworkDown_ReceiveGso(PPDMINETWORKDOWN pInterface,
968 const void *pvBuf, size_t cb,
969 PCPDMNETWORKGSO pGso)
970{
971 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkDown);
972
973 if (pGso)
974 {
975 uint32_t uFeatures = pThis->VPCI.uGuestFeatures;
976
977 switch (pGso->u8Type)
978 {
979 case PDMNETWORKGSOTYPE_IPV4_TCP:
980 uFeatures &= VNET_F_GUEST_TSO4;
981 break;
982 case PDMNETWORKGSOTYPE_IPV6_TCP:
983 uFeatures &= VNET_F_GUEST_TSO6;
984 break;
985 case PDMNETWORKGSOTYPE_IPV4_UDP:
986 case PDMNETWORKGSOTYPE_IPV6_UDP:
987 uFeatures &= VNET_F_GUEST_UFO;
988 break;
989 default:
990 uFeatures = 0;
991 break;
992 }
993 if (!uFeatures)
994 {
995 Log2(("%s vnetNetworkDown_ReceiveGso: GSO type (0x%x) not supported\n", INSTANCE(pThis), pGso->u8Type));
996 return VERR_NOT_SUPPORTED;
997 }
998 }
999
1000 Log2(("%s vnetNetworkDown_ReceiveGso: pvBuf=%p cb=%u pGso=%p\n", INSTANCE(pThis), pvBuf, cb, pGso));
1001 int rc = vnetCanReceive(pThis);
1002 if (RT_FAILURE(rc))
1003 return rc;
1004
1005 /* Drop packets if VM is not running or cable is disconnected. */
1006 VMSTATE enmVMState = PDMDevHlpVMState(pThis->VPCI.CTX_SUFF(pDevIns));
1007 if (( enmVMState != VMSTATE_RUNNING
1008 && enmVMState != VMSTATE_RUNNING_LS)
1009 || !(STATUS & VNET_S_LINK_UP))
1010 return VINF_SUCCESS;
1011
1012 STAM_PROFILE_START(&pThis->StatReceive, a);
1013 vpciSetReadLed(&pThis->VPCI, true);
1014 if (vnetAddressFilter(pThis, pvBuf, cb))
1015 {
1016 rc = vnetCsRxEnter(pThis, VERR_SEM_BUSY);
1017 if (RT_SUCCESS(rc))
1018 {
1019 rc = vnetHandleRxPacket(pThis, pvBuf, cb, pGso);
1020 STAM_REL_COUNTER_ADD(&pThis->StatReceiveBytes, cb);
1021 vnetCsRxLeave(pThis);
1022 }
1023 }
1024 vpciSetReadLed(&pThis->VPCI, false);
1025 STAM_PROFILE_STOP(&pThis->StatReceive, a);
1026 return rc;
1027}
1028
1029/**
1030 * @interface_method_impl{PDMINETWORKDOWN,pfnReceive}
1031 */
1032static DECLCALLBACK(int) vnetNetworkDown_Receive(PPDMINETWORKDOWN pInterface, const void *pvBuf, size_t cb)
1033{
1034 return vnetNetworkDown_ReceiveGso(pInterface, pvBuf, cb, NULL);
1035}
1036
1037/**
1038 * Gets the current Media Access Control (MAC) address.
1039 *
1040 * @returns VBox status code.
1041 * @param pInterface Pointer to the interface structure containing the called function pointer.
1042 * @param pMac Where to store the MAC address.
1043 * @thread EMT
1044 */
1045static DECLCALLBACK(int) vnetGetMac(PPDMINETWORKCONFIG pInterface, PRTMAC pMac)
1046{
1047 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkConfig);
1048 memcpy(pMac, pThis->config.mac.au8, sizeof(RTMAC));
1049 return VINF_SUCCESS;
1050}
1051
1052/**
1053 * Gets the new link state.
1054 *
1055 * @returns The current link state.
1056 * @param pInterface Pointer to the interface structure containing the called function pointer.
1057 * @thread EMT
1058 */
1059static DECLCALLBACK(PDMNETWORKLINKSTATE) vnetGetLinkState(PPDMINETWORKCONFIG pInterface)
1060{
1061 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkConfig);
1062 if (STATUS & VNET_S_LINK_UP)
1063 return PDMNETWORKLINKSTATE_UP;
1064 return PDMNETWORKLINKSTATE_DOWN;
1065}
1066
1067
1068/**
1069 * Sets the new link state.
1070 *
1071 * @returns VBox status code.
1072 * @param pInterface Pointer to the interface structure containing the called function pointer.
1073 * @param enmState The new link state
1074 */
1075static DECLCALLBACK(int) vnetSetLinkState(PPDMINETWORKCONFIG pInterface, PDMNETWORKLINKSTATE enmState)
1076{
1077 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkConfig);
1078 bool fOldUp = !!(STATUS & VNET_S_LINK_UP);
1079 bool fNewUp = enmState == PDMNETWORKLINKSTATE_UP;
1080
1081 Log(("%s vnetSetLinkState: enmState=%d\n", INSTANCE(pThis), enmState));
1082 if (enmState == PDMNETWORKLINKSTATE_DOWN_RESUME)
1083 {
1084 if (fOldUp)
1085 {
1086 /*
1087 * We bother to bring the link down only if it was up previously. The UP link state
1088 * notification will be sent when the link actually goes up in vnetLinkUpTimer().
1089 */
1090 vnetTempLinkDown(pThis);
1091 if (pThis->pDrv)
1092 pThis->pDrv->pfnNotifyLinkChanged(pThis->pDrv, enmState);
1093 }
1094 }
1095 else if (fNewUp != fOldUp)
1096 {
1097 if (fNewUp)
1098 {
1099 Log(("%s Link is up\n", INSTANCE(pThis)));
1100 pThis->fCableConnected = true;
1101 STATUS |= VNET_S_LINK_UP;
1102 vnetRaiseInterrupt(pThis, VERR_SEM_BUSY, VPCI_ISR_CONFIG);
1103 }
1104 else
1105 {
1106 /* The link was brought down explicitly, make sure it won't come up by timer. */
1107 TMTimerStop(pThis->pLinkUpTimer);
1108 Log(("%s Link is down\n", INSTANCE(pThis)));
1109 pThis->fCableConnected = false;
1110 STATUS &= ~VNET_S_LINK_UP;
1111 vnetRaiseInterrupt(pThis, VERR_SEM_BUSY, VPCI_ISR_CONFIG);
1112 }
1113 if (pThis->pDrv)
1114 pThis->pDrv->pfnNotifyLinkChanged(pThis->pDrv, enmState);
1115 }
1116 return VINF_SUCCESS;
1117}
1118
1119static DECLCALLBACK(void) vnetQueueReceive(void *pvState, PVQUEUE pQueue)
1120{
1121 RT_NOREF(pQueue);
1122 PVNETSTATE pThis = (PVNETSTATE)pvState;
1123 Log(("%s Receive buffers has been added, waking up receive thread.\n", INSTANCE(pThis)));
1124 vnetWakeupReceive(pThis->VPCI.CTX_SUFF(pDevIns));
1125}
1126
1127/**
1128 * Sets up the GSO context according to the Virtio header.
1129 *
1130 * @param pGso The GSO context to setup.
1131 * @param pCtx The context descriptor.
1132 */
1133DECLINLINE(PPDMNETWORKGSO) vnetSetupGsoCtx(PPDMNETWORKGSO pGso, VNETHDR const *pHdr)
1134{
1135 pGso->u8Type = PDMNETWORKGSOTYPE_INVALID;
1136
1137 if (pHdr->u8GSOType & VNETHDR_GSO_ECN)
1138 {
1139 AssertMsgFailed(("Unsupported flag in virtio header: ECN\n"));
1140 return NULL;
1141 }
1142 switch (pHdr->u8GSOType & ~VNETHDR_GSO_ECN)
1143 {
1144 case VNETHDR_GSO_TCPV4:
1145 pGso->u8Type = PDMNETWORKGSOTYPE_IPV4_TCP;
1146 pGso->cbHdrsSeg = pHdr->u16HdrLen;
1147 break;
1148 case VNETHDR_GSO_TCPV6:
1149 pGso->u8Type = PDMNETWORKGSOTYPE_IPV6_TCP;
1150 pGso->cbHdrsSeg = pHdr->u16HdrLen;
1151 break;
1152 case VNETHDR_GSO_UDP:
1153 pGso->u8Type = PDMNETWORKGSOTYPE_IPV4_UDP;
1154 pGso->cbHdrsSeg = pHdr->u16CSumStart;
1155 break;
1156 default:
1157 return NULL;
1158 }
1159 if (pHdr->u8Flags & VNETHDR_F_NEEDS_CSUM)
1160 pGso->offHdr2 = pHdr->u16CSumStart;
1161 else
1162 {
1163 AssertMsgFailed(("GSO without checksum offloading!\n"));
1164 return NULL;
1165 }
1166 pGso->offHdr1 = sizeof(RTNETETHERHDR);
1167 pGso->cbHdrsTotal = pHdr->u16HdrLen;
1168 pGso->cbMaxSeg = pHdr->u16GSOSize;
1169 return pGso;
1170}
1171
1172DECLINLINE(uint16_t) vnetCSum16(const void *pvBuf, size_t cb)
1173{
1174 uint32_t csum = 0;
1175 uint16_t *pu16 = (uint16_t *)pvBuf;
1176
1177 while (cb > 1)
1178 {
1179 csum += *pu16++;
1180 cb -= 2;
1181 }
1182 if (cb)
1183 csum += *(uint8_t*)pu16;
1184 while (csum >> 16)
1185 csum = (csum >> 16) + (csum & 0xFFFF);
1186 return ~csum;
1187}
1188
1189DECLINLINE(void) vnetCompleteChecksum(uint8_t *pBuf, size_t cbSize, uint16_t uStart, uint16_t uOffset)
1190{
1191 AssertReturnVoid(uStart < cbSize);
1192 AssertReturnVoid(uStart + uOffset + sizeof(uint16_t) <= cbSize);
1193 *(uint16_t*)(pBuf + uStart + uOffset) = vnetCSum16(pBuf + uStart, cbSize - uStart);
1194}
1195
1196static bool vnetReadHeader(PVNETSTATE pThis, RTGCPHYS GCPhys, PVNETHDR pHdr, uint32_t cbMax)
1197{
1198 int rc = PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns), GCPhys, pHdr, sizeof(*pHdr));
1199 if (RT_FAILURE(rc))
1200 return false;
1201
1202 Log4(("virtio-net: header flags=%x gso-type=%x len=%x gso-size=%x csum-start=%x csum-offset=%x cb=%x\n",
1203 pHdr->u8Flags, pHdr->u8GSOType, pHdr->u16HdrLen, pHdr->u16GSOSize, pHdr->u16CSumStart, pHdr->u16CSumOffset, cbMax));
1204
1205 if (pHdr->u8GSOType)
1206 {
1207 uint32_t u32MinHdrSize;
1208
1209 /* Segmentation offloading cannot be done without checksumming. */
1210 if (RT_UNLIKELY(!(pHdr->u8Flags & VNETHDR_F_NEEDS_CSUM)))
1211 return false;
1212 /* We do not support ECN. */
1213 if (RT_UNLIKELY(pHdr->u8GSOType & VNETHDR_GSO_ECN))
1214 return false;
1215 switch (pHdr->u8GSOType)
1216 {
1217 case VNETHDR_GSO_TCPV4:
1218 case VNETHDR_GSO_TCPV6:
1219 u32MinHdrSize = sizeof(RTNETTCP);
1220 break;
1221 case VNETHDR_GSO_UDP:
1222 u32MinHdrSize = 0;
1223 break;
1224 default:
1225 return false;
1226 }
1227 /* Header+MSS must not exceed the packet size. */
1228 if (RT_UNLIKELY(u32MinHdrSize + pHdr->u16CSumStart + pHdr->u16GSOSize > cbMax))
1229 return false;
1230 }
1231 /* Checksum must fit into the frame (validating both checksum fields). */
1232 if ( (pHdr->u8Flags & VNETHDR_F_NEEDS_CSUM)
1233 && sizeof(uint16_t) + pHdr->u16CSumStart + pHdr->u16CSumOffset > cbMax)
1234 return false;
1235 Log4(("virtio-net: return true\n"));
1236 return true;
1237}
1238
1239static int vnetTransmitFrame(PVNETSTATE pThis, PPDMSCATTERGATHER pSgBuf, PPDMNETWORKGSO pGso, PVNETHDR pHdr)
1240{
1241 vnetPacketDump(pThis, (uint8_t *)pSgBuf->aSegs[0].pvSeg, pSgBuf->cbUsed, "--> Outgoing");
1242 if (pGso)
1243 {
1244 /* Some guests (RHEL) may report HdrLen excluding transport layer header! */
1245 /*
1246 * We cannot use cdHdrs provided by the guest because of different ways
1247 * it gets filled out by different versions of kernels.
1248 */
1249 //if (pGso->cbHdrs < pHdr->u16CSumStart + pHdr->u16CSumOffset + 2)
1250 {
1251 Log4(("%s vnetTransmitPendingPackets: HdrLen before adjustment %d.\n",
1252 INSTANCE(pThis), pGso->cbHdrsTotal));
1253 switch (pGso->u8Type)
1254 {
1255 case PDMNETWORKGSOTYPE_IPV4_TCP:
1256 case PDMNETWORKGSOTYPE_IPV6_TCP:
1257 pGso->cbHdrsTotal = pHdr->u16CSumStart +
1258 ((PRTNETTCP)(((uint8_t*)pSgBuf->aSegs[0].pvSeg) + pHdr->u16CSumStart))->th_off * 4;
1259 pGso->cbHdrsSeg = pGso->cbHdrsTotal;
1260 break;
1261 case PDMNETWORKGSOTYPE_IPV4_UDP:
1262 pGso->cbHdrsTotal = (uint8_t)(pHdr->u16CSumStart + sizeof(RTNETUDP));
1263 pGso->cbHdrsSeg = pHdr->u16CSumStart;
1264 break;
1265 }
1266 /* Update GSO structure embedded into the frame */
1267 ((PPDMNETWORKGSO)pSgBuf->pvUser)->cbHdrsTotal = pGso->cbHdrsTotal;
1268 ((PPDMNETWORKGSO)pSgBuf->pvUser)->cbHdrsSeg = pGso->cbHdrsSeg;
1269 Log4(("%s vnetTransmitPendingPackets: adjusted HdrLen to %d.\n",
1270 INSTANCE(pThis), pGso->cbHdrsTotal));
1271 }
1272 Log2(("%s vnetTransmitPendingPackets: gso type=%x cbHdrsTotal=%u cbHdrsSeg=%u mss=%u off1=0x%x off2=0x%x\n",
1273 INSTANCE(pThis), pGso->u8Type, pGso->cbHdrsTotal, pGso->cbHdrsSeg, pGso->cbMaxSeg, pGso->offHdr1, pGso->offHdr2));
1274 STAM_REL_COUNTER_INC(&pThis->StatTransmitGSO);
1275 }
1276 else if (pHdr->u8Flags & VNETHDR_F_NEEDS_CSUM)
1277 {
1278 STAM_REL_COUNTER_INC(&pThis->StatTransmitCSum);
1279 /*
1280 * This is not GSO frame but checksum offloading is requested.
1281 */
1282 vnetCompleteChecksum((uint8_t*)pSgBuf->aSegs[0].pvSeg, pSgBuf->cbUsed,
1283 pHdr->u16CSumStart, pHdr->u16CSumOffset);
1284 }
1285
1286 return pThis->pDrv->pfnSendBuf(pThis->pDrv, pSgBuf, false);
1287}
1288
1289static void vnetTransmitPendingPackets(PVNETSTATE pThis, PVQUEUE pQueue, bool fOnWorkerThread)
1290{
1291 /*
1292 * Only one thread is allowed to transmit at a time, others should skip
1293 * transmission as the packets will be picked up by the transmitting
1294 * thread.
1295 */
1296 if (!ASMAtomicCmpXchgU32(&pThis->uIsTransmitting, 1, 0))
1297 return;
1298
1299 if ((pThis->VPCI.uStatus & VPCI_STATUS_DRV_OK) == 0)
1300 {
1301 Log(("%s Ignoring transmit requests from non-existent driver (status=0x%x).\n", INSTANCE(pThis), pThis->VPCI.uStatus));
1302 return;
1303 }
1304
1305 if (!pThis->fCableConnected)
1306 {
1307 Log(("%s Ignoring transmit requests while cable is disconnected.\n", INSTANCE(pThis)));
1308 return;
1309 }
1310
1311 PPDMINETWORKUP pDrv = pThis->pDrv;
1312 if (pDrv)
1313 {
1314 int rc = pDrv->pfnBeginXmit(pDrv, fOnWorkerThread);
1315 Assert(rc == VINF_SUCCESS || rc == VERR_TRY_AGAIN);
1316 if (rc == VERR_TRY_AGAIN)
1317 {
1318 ASMAtomicWriteU32(&pThis->uIsTransmitting, 0);
1319 return;
1320 }
1321 }
1322
1323 unsigned int uHdrLen;
1324 if (vnetMergeableRxBuffers(pThis))
1325 uHdrLen = sizeof(VNETHDRMRX);
1326 else
1327 uHdrLen = sizeof(VNETHDR);
1328
1329 Log3(("%s vnetTransmitPendingPackets: About to transmit %d pending packets\n",
1330 INSTANCE(pThis), vringReadAvailIndex(&pThis->VPCI, &pThis->pTxQueue->VRing) - pThis->pTxQueue->uNextAvailIndex));
1331
1332 vpciSetWriteLed(&pThis->VPCI, true);
1333
1334 /*
1335 * Do not remove descriptors from available ring yet, try to allocate the
1336 * buffer first.
1337 */
1338 VQUEUEELEM elem; /* This bugger is big! ~48KB on 64-bit hosts. */
1339 while (vqueuePeek(&pThis->VPCI, pQueue, &elem))
1340 {
1341 unsigned int uOffset = 0;
1342 if (elem.nOut < 2 || elem.aSegsOut[0].cb != uHdrLen)
1343 {
1344 Log(("%s vnetQueueTransmit: The first segment is not the header! (%u < 2 || %u != %u).\n",
1345 INSTANCE(pThis), elem.nOut, elem.aSegsOut[0].cb, uHdrLen));
1346 break; /* For now we simply ignore the header, but it must be there anyway! */
1347 }
1348 RT_UNTRUSTED_VALIDATED_FENCE();
1349
1350 VNETHDR Hdr;
1351 unsigned int uSize = 0;
1352 STAM_PROFILE_ADV_START(&pThis->StatTransmit, a);
1353
1354 /* Compute total frame size. */
1355 for (unsigned int i = 1; i < elem.nOut && uSize < VNET_MAX_FRAME_SIZE; i++)
1356 uSize += elem.aSegsOut[i].cb;
1357 Log5(("%s vnetTransmitPendingPackets: complete frame is %u bytes.\n", INSTANCE(pThis), uSize));
1358 Assert(uSize <= VNET_MAX_FRAME_SIZE);
1359
1360 /* Truncate oversized frames. */
1361 if (uSize > VNET_MAX_FRAME_SIZE)
1362 uSize = VNET_MAX_FRAME_SIZE;
1363 if (pThis->pDrv && vnetReadHeader(pThis, elem.aSegsOut[0].addr, &Hdr, uSize))
1364 {
1365 RT_UNTRUSTED_VALIDATED_FENCE();
1366 STAM_REL_COUNTER_INC(&pThis->StatTransmitPackets);
1367 STAM_PROFILE_START(&pThis->StatTransmitSend, a);
1368
1369 PDMNETWORKGSO Gso;
1370 PDMNETWORKGSO *pGso = vnetSetupGsoCtx(&Gso, &Hdr);
1371
1372 /** @todo Optimize away the extra copying! (lazy bird) */
1373 PPDMSCATTERGATHER pSgBuf;
1374 int rc = pThis->pDrv->pfnAllocBuf(pThis->pDrv, uSize, pGso, &pSgBuf);
1375 if (RT_SUCCESS(rc))
1376 {
1377 Assert(pSgBuf->cSegs == 1);
1378 pSgBuf->cbUsed = uSize;
1379
1380 /* Assemble a complete frame. */
1381 for (unsigned int i = 1; i < elem.nOut && uSize > 0; i++)
1382 {
1383 unsigned int cbSegment = RT_MIN(uSize, elem.aSegsOut[i].cb);
1384 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns), elem.aSegsOut[i].addr,
1385 ((uint8_t*)pSgBuf->aSegs[0].pvSeg) + uOffset,
1386 cbSegment);
1387 uOffset += cbSegment;
1388 uSize -= cbSegment;
1389 }
1390 rc = vnetTransmitFrame(pThis, pSgBuf, pGso, &Hdr);
1391 }
1392 else
1393 {
1394 Log4(("virtio-net: failed to allocate SG buffer: size=%u rc=%Rrc\n", uSize, rc));
1395 STAM_PROFILE_STOP(&pThis->StatTransmitSend, a);
1396 STAM_PROFILE_ADV_STOP(&pThis->StatTransmit, a);
1397 /* Stop trying to fetch TX descriptors until we get more bandwidth. */
1398 break;
1399 }
1400
1401 STAM_PROFILE_STOP(&pThis->StatTransmitSend, a);
1402 STAM_REL_COUNTER_ADD(&pThis->StatTransmitBytes, uOffset);
1403 }
1404
1405 /* Remove this descriptor chain from the available ring */
1406 vqueueSkip(&pThis->VPCI, pQueue);
1407 vqueuePut(&pThis->VPCI, pQueue, &elem, sizeof(VNETHDR) + uOffset);
1408 vqueueSync(&pThis->VPCI, pQueue);
1409 STAM_PROFILE_ADV_STOP(&pThis->StatTransmit, a);
1410 }
1411 vpciSetWriteLed(&pThis->VPCI, false);
1412
1413 if (pDrv)
1414 pDrv->pfnEndXmit(pDrv);
1415 ASMAtomicWriteU32(&pThis->uIsTransmitting, 0);
1416}
1417
1418/**
1419 * @interface_method_impl{PDMINETWORKDOWN,pfnXmitPending}
1420 */
1421static DECLCALLBACK(void) vnetNetworkDown_XmitPending(PPDMINETWORKDOWN pInterface)
1422{
1423 PVNETSTATE pThis = RT_FROM_MEMBER(pInterface, VNETSTATE, INetworkDown);
1424#if defined(VBOX_WITH_STATISTICS)
1425 STAM_REL_COUNTER_INC(&pThis->StatTransmitByNetwork);
1426#endif /* VBOX_WITH_STATISTICS */
1427 vnetTransmitPendingPackets(pThis, pThis->pTxQueue, false /*fOnWorkerThread*/);
1428}
1429
1430#ifdef VNET_TX_DELAY
1431
1432static DECLCALLBACK(void) vnetQueueTransmit(void *pvState, PVQUEUE pQueue)
1433{
1434 PVNETSTATE pThis = (PVNETSTATE)pvState;
1435
1436 if (TMTimerIsActive(pThis->CTX_SUFF(pTxTimer)))
1437 {
1438 TMTimerStop(pThis->CTX_SUFF(pTxTimer));
1439 Log3(("%s vnetQueueTransmit: Got kicked with notification disabled, re-enable notification and flush TX queue\n", INSTANCE(pThis)));
1440 vnetTransmitPendingPackets(pThis, pQueue, false /*fOnWorkerThread*/);
1441 if (RT_FAILURE(vnetCsEnter(pThis, VERR_SEM_BUSY)))
1442 LogRel(("vnetQueueTransmit: Failed to enter critical section!/n"));
1443 else
1444 {
1445 vringSetNotification(&pThis->VPCI, &pThis->pTxQueue->VRing, true);
1446 vnetCsLeave(pThis);
1447 }
1448 }
1449 else
1450 {
1451 if (RT_FAILURE(vnetCsEnter(pThis, VERR_SEM_BUSY)))
1452 LogRel(("vnetQueueTransmit: Failed to enter critical section!/n"));
1453 else
1454 {
1455 vringSetNotification(&pThis->VPCI, &pThis->pTxQueue->VRing, false);
1456 TMTimerSetMicro(pThis->CTX_SUFF(pTxTimer), VNET_TX_DELAY);
1457 pThis->u64NanoTS = RTTimeNanoTS();
1458 vnetCsLeave(pThis);
1459 }
1460 }
1461}
1462
1463/**
1464 * @callback_method_impl{FNTMTIMERDEV, Transmit Delay Timer handler.}
1465 */
1466static DECLCALLBACK(void) vnetTxTimer(PPDMDEVINS pDevIns, PTMTIMER pTimer, void *pvUser)
1467{
1468 RT_NOREF(pDevIns, pTimer);
1469 PVNETSTATE pThis = (PVNETSTATE)pvUser;
1470
1471 uint32_t u32MicroDiff = (uint32_t)((RTTimeNanoTS() - pThis->u64NanoTS)/1000);
1472 if (u32MicroDiff < pThis->u32MinDiff)
1473 pThis->u32MinDiff = u32MicroDiff;
1474 if (u32MicroDiff > pThis->u32MaxDiff)
1475 pThis->u32MaxDiff = u32MicroDiff;
1476 pThis->u32AvgDiff = (pThis->u32AvgDiff * pThis->u32i + u32MicroDiff) / (pThis->u32i + 1);
1477 pThis->u32i++;
1478 Log3(("vnetTxTimer: Expired, diff %9d usec, avg %9d usec, min %9d usec, max %9d usec\n",
1479 u32MicroDiff, pThis->u32AvgDiff, pThis->u32MinDiff, pThis->u32MaxDiff));
1480
1481// Log3(("%s vnetTxTimer: Expired\n", INSTANCE(pThis)));
1482 vnetTransmitPendingPackets(pThis, pThis->pTxQueue, false /*fOnWorkerThread*/);
1483 if (RT_FAILURE(vnetCsEnter(pThis, VERR_SEM_BUSY)))
1484 {
1485 LogRel(("vnetTxTimer: Failed to enter critical section!/n"));
1486 return;
1487 }
1488 vringSetNotification(&pThis->VPCI, &pThis->pTxQueue->VRing, true);
1489 vnetCsLeave(pThis);
1490}
1491
1492inline int vnetCreateTxThreadAndEvent(PPDMDEVINS pDevIns, PVNETSTATE pThis)
1493{
1494 RT_NOREF(pDevIns, pThis);
1495 return VINF_SUCCESS;
1496}
1497
1498inline void vnetDestroyTxThreadAndEvent(PVNETSTATE pThis)
1499{
1500 RT_NOREF(pThis);
1501}
1502#else /* !VNET_TX_DELAY */
1503
1504static DECLCALLBACK(int) vnetTxThread(PPDMDEVINS pDevIns, PPDMTHREAD pThread)
1505{
1506 RT_NOREF(pDevIns);
1507 PVNETSTATE pThis = (PVNETSTATE)pThread->pvUser;
1508 int rc = VINF_SUCCESS;
1509
1510 if (pThread->enmState == PDMTHREADSTATE_INITIALIZING)
1511 return VINF_SUCCESS;
1512
1513 while (pThread->enmState == PDMTHREADSTATE_RUNNING)
1514 {
1515 rc = SUPSemEventWaitNoResume(pThis->pSupDrvSession, pThis->hTxEvent, RT_INDEFINITE_WAIT);
1516 if (RT_UNLIKELY(pThread->enmState != PDMTHREADSTATE_RUNNING))
1517 break;
1518#if defined(VBOX_WITH_STATISTICS)
1519 STAM_REL_COUNTER_INC(&pThis->StatTransmitByThread);
1520#endif /* VBOX_WITH_STATISTICS */
1521 while (true)
1522 {
1523 vnetTransmitPendingPackets(pThis, pThis->pTxQueue, false /*fOnWorkerThread*/); /// @todo shouldn't it be true instead?
1524 Log(("vnetTxThread: enable kicking and get to sleep\n"));
1525 vringSetNotification(&pThis->VPCI, &pThis->pTxQueue->VRing, true);
1526 if (vqueueIsEmpty(&pThis->VPCI, pThis->pTxQueue))
1527 break;
1528 vringSetNotification(&pThis->VPCI, &pThis->pTxQueue->VRing, false);
1529 }
1530 }
1531
1532 return rc;
1533}
1534
1535/**
1536 * Unblock TX thread so it can respond to a state change.
1537 *
1538 * @returns VBox status code.
1539 * @param pDevIns The device instance.
1540 * @param pThread The send thread.
1541 */
1542static DECLCALLBACK(int) vnetTxThreadWakeUp(PPDMDEVINS pDevIns, PPDMTHREAD pThread)
1543{
1544 RT_NOREF(pDevIns);
1545 PVNETSTATE pThis = (PVNETSTATE)pThread->pvUser;
1546 return SUPSemEventSignal(pThis->pSupDrvSession, pThis->hTxEvent);
1547}
1548
1549static int vnetCreateTxThreadAndEvent(PPDMDEVINS pDevIns, PVNETSTATE pThis)
1550{
1551 int rc = SUPSemEventCreate(pThis->pSupDrvSession, &pThis->hTxEvent);
1552 if (RT_FAILURE(rc))
1553 return PDMDevHlpVMSetError(pDevIns, rc, RT_SRC_POS,
1554 N_("VNET: Failed to create SUP event semaphore"));
1555 rc = PDMDevHlpThreadCreate(pDevIns, &pThis->pTxThread, pThis, vnetTxThread,
1556 vnetTxThreadWakeUp, 0, RTTHREADTYPE_IO, INSTANCE(pThis));
1557 if (RT_FAILURE(rc))
1558 return PDMDevHlpVMSetError(pDevIns, rc, RT_SRC_POS,
1559 N_("VNET: Failed to create worker thread %s"), INSTANCE(pThis));
1560 return VINF_SUCCESS;
1561}
1562
1563static void vnetDestroyTxThreadAndEvent(PVNETSTATE pThis)
1564{
1565 if (pThis->pTxThread)
1566 {
1567 int rcThread;
1568 /* Destroy the thread. */
1569 int rc = PDMR3ThreadDestroy(pThis->pTxThread, &rcThread);
1570 if (RT_FAILURE(rc) || RT_FAILURE(rcThread))
1571 AssertMsgFailed(("%s Failed to destroy async IO thread rc=%Rrc rcThread=%Rrc\n", __FUNCTION__, rc, rcThread));
1572 pThis->pTxThread = NULL;
1573 }
1574 if (pThis->hTxEvent != NIL_SUPSEMEVENT)
1575 {
1576 SUPSemEventClose(pThis->pSupDrvSession, pThis->hTxEvent);
1577 pThis->hTxEvent = NIL_SUPSEMEVENT;
1578 }
1579}
1580
1581static DECLCALLBACK(void) vnetQueueTransmit(void *pvState, PVQUEUE pQueue)
1582{
1583 PVNETSTATE pThis = (PVNETSTATE)pvState;
1584
1585 Log(("vnetQueueTransmit: disable kicking and wake up TX thread\n"));
1586 vringSetNotification(&pThis->VPCI, &pQueue->VRing, false);
1587 SUPSemEventSignal(pThis->pSupDrvSession, pThis->hTxEvent);
1588}
1589
1590#endif /* !VNET_TX_DELAY */
1591
1592static uint8_t vnetControlRx(PVNETSTATE pThis, PVNETCTLHDR pCtlHdr, PVQUEUEELEM pElem)
1593{
1594 uint8_t u8Ack = VNET_OK;
1595 uint8_t fOn, fDrvWasPromisc = pThis->fPromiscuous | pThis->fAllMulti;
1596 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1597 pElem->aSegsOut[1].addr,
1598 &fOn, sizeof(fOn));
1599 Log(("%s vnetControlRx: uCommand=%u fOn=%u\n", INSTANCE(pThis), pCtlHdr->u8Command, fOn));
1600 switch (pCtlHdr->u8Command)
1601 {
1602 case VNET_CTRL_CMD_RX_MODE_PROMISC:
1603 pThis->fPromiscuous = !!fOn;
1604 break;
1605 case VNET_CTRL_CMD_RX_MODE_ALLMULTI:
1606 pThis->fAllMulti = !!fOn;
1607 break;
1608 default:
1609 u8Ack = VNET_ERROR;
1610 }
1611 if (fDrvWasPromisc != (pThis->fPromiscuous | pThis->fAllMulti) && pThis->pDrv)
1612 pThis->pDrv->pfnSetPromiscuousMode(pThis->pDrv,
1613 (pThis->fPromiscuous | pThis->fAllMulti));
1614
1615 return u8Ack;
1616}
1617
1618static uint8_t vnetControlMac(PVNETSTATE pThis, PVNETCTLHDR pCtlHdr, PVQUEUEELEM pElem)
1619{
1620 uint32_t nMacs = 0;
1621
1622 if (pCtlHdr->u8Command != VNET_CTRL_CMD_MAC_TABLE_SET
1623 || pElem->nOut != 3
1624 || pElem->aSegsOut[1].cb < sizeof(nMacs)
1625 || pElem->aSegsOut[2].cb < sizeof(nMacs))
1626 {
1627 Log(("%s vnetControlMac: Segment layout is wrong (u8Command=%u nOut=%u cb1=%u cb2=%u)\n",
1628 INSTANCE(pThis), pCtlHdr->u8Command, pElem->nOut, pElem->aSegsOut[1].cb, pElem->aSegsOut[2].cb));
1629 return VNET_ERROR;
1630 }
1631
1632 /* Load unicast addresses */
1633 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1634 pElem->aSegsOut[1].addr,
1635 &nMacs, sizeof(nMacs));
1636
1637 if (pElem->aSegsOut[1].cb < nMacs * sizeof(RTMAC) + sizeof(nMacs))
1638 {
1639 Log(("%s vnetControlMac: The unicast mac segment is too small (nMacs=%u cb=%u)\n",
1640 INSTANCE(pThis), nMacs, pElem->aSegsOut[1].cb));
1641 return VNET_ERROR;
1642 }
1643
1644 if (nMacs > VNET_MAC_FILTER_LEN)
1645 {
1646 Log(("%s vnetControlMac: MAC table is too big, have to use promiscuous mode (nMacs=%u)\n", INSTANCE(pThis), nMacs));
1647 pThis->fPromiscuous = true;
1648 }
1649 else
1650 {
1651 if (nMacs)
1652 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1653 pElem->aSegsOut[1].addr + sizeof(nMacs),
1654 pThis->aMacFilter, nMacs * sizeof(RTMAC));
1655 pThis->nMacFilterEntries = nMacs;
1656#ifdef DEBUG
1657 Log(("%s vnetControlMac: unicast macs:\n", INSTANCE(pThis)));
1658 for(unsigned i = 0; i < nMacs; i++)
1659 Log((" %RTmac\n", &pThis->aMacFilter[i]));
1660#endif /* DEBUG */
1661 }
1662
1663 /* Load multicast addresses */
1664 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1665 pElem->aSegsOut[2].addr,
1666 &nMacs, sizeof(nMacs));
1667
1668 if (pElem->aSegsOut[2].cb < nMacs * sizeof(RTMAC) + sizeof(nMacs))
1669 {
1670 Log(("%s vnetControlMac: The multicast mac segment is too small (nMacs=%u cb=%u)\n",
1671 INSTANCE(pThis), nMacs, pElem->aSegsOut[2].cb));
1672 return VNET_ERROR;
1673 }
1674
1675 if (nMacs > VNET_MAC_FILTER_LEN - pThis->nMacFilterEntries)
1676 {
1677 Log(("%s vnetControlMac: MAC table is too big, have to use allmulti mode (nMacs=%u)\n", INSTANCE(pThis), nMacs));
1678 pThis->fAllMulti = true;
1679 }
1680 else
1681 {
1682 if (nMacs)
1683 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1684 pElem->aSegsOut[2].addr + sizeof(nMacs),
1685 &pThis->aMacFilter[pThis->nMacFilterEntries],
1686 nMacs * sizeof(RTMAC));
1687#ifdef DEBUG
1688 Log(("%s vnetControlMac: multicast macs:\n", INSTANCE(pThis)));
1689 for(unsigned i = 0; i < nMacs; i++)
1690 Log((" %RTmac\n",
1691 &pThis->aMacFilter[i+pThis->nMacFilterEntries]));
1692#endif /* DEBUG */
1693 pThis->nMacFilterEntries += nMacs;
1694 }
1695
1696 return VNET_OK;
1697}
1698
1699static uint8_t vnetControlVlan(PVNETSTATE pThis, PVNETCTLHDR pCtlHdr, PVQUEUEELEM pElem)
1700{
1701 uint8_t u8Ack = VNET_OK;
1702 uint16_t u16Vid;
1703
1704 if (pElem->nOut != 2 || pElem->aSegsOut[1].cb != sizeof(u16Vid))
1705 {
1706 Log(("%s vnetControlVlan: Segment layout is wrong (u8Command=%u nOut=%u cb=%u)\n",
1707 INSTANCE(pThis), pCtlHdr->u8Command, pElem->nOut, pElem->aSegsOut[1].cb));
1708 return VNET_ERROR;
1709 }
1710
1711 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1712 pElem->aSegsOut[1].addr,
1713 &u16Vid, sizeof(u16Vid));
1714
1715 if (u16Vid >= VNET_MAX_VID)
1716 {
1717 Log(("%s vnetControlVlan: VLAN ID is out of range (VID=%u)\n", INSTANCE(pThis), u16Vid));
1718 return VNET_ERROR;
1719 }
1720
1721 Log(("%s vnetControlVlan: uCommand=%u VID=%u\n", INSTANCE(pThis), pCtlHdr->u8Command, u16Vid));
1722
1723 switch (pCtlHdr->u8Command)
1724 {
1725 case VNET_CTRL_CMD_VLAN_ADD:
1726 ASMBitSet(pThis->aVlanFilter, u16Vid);
1727 break;
1728 case VNET_CTRL_CMD_VLAN_DEL:
1729 ASMBitClear(pThis->aVlanFilter, u16Vid);
1730 break;
1731 default:
1732 u8Ack = VNET_ERROR;
1733 }
1734
1735 return u8Ack;
1736}
1737
1738
1739static DECLCALLBACK(void) vnetQueueControl(void *pvState, PVQUEUE pQueue)
1740{
1741 PVNETSTATE pThis = (PVNETSTATE)pvState;
1742 uint8_t u8Ack;
1743 VQUEUEELEM elem;
1744 while (vqueueGet(&pThis->VPCI, pQueue, &elem))
1745 {
1746 if (elem.nOut < 1 || elem.aSegsOut[0].cb < sizeof(VNETCTLHDR))
1747 {
1748 Log(("%s vnetQueueControl: The first 'out' segment is not the header! (%u < 1 || %u < %u).\n",
1749 INSTANCE(pThis), elem.nOut, elem.aSegsOut[0].cb,sizeof(VNETCTLHDR)));
1750 break; /* Skip the element and hope the next one is good. */
1751 }
1752 else if ( elem.nIn < 1
1753 || elem.aSegsIn[elem.nIn - 1].cb < sizeof(VNETCTLACK))
1754 {
1755 Log(("%s vnetQueueControl: The last 'in' segment is too small to hold the acknowledge! (%u < 1 || %u < %u).\n",
1756 INSTANCE(pThis), elem.nIn, elem.aSegsIn[elem.nIn - 1].cb, sizeof(VNETCTLACK)));
1757 break; /* Skip the element and hope the next one is good. */
1758 }
1759 else
1760 {
1761 VNETCTLHDR CtlHdr;
1762 PDMDevHlpPhysRead(pThis->VPCI.CTX_SUFF(pDevIns),
1763 elem.aSegsOut[0].addr,
1764 &CtlHdr, sizeof(CtlHdr));
1765 switch (CtlHdr.u8Class)
1766 {
1767 case VNET_CTRL_CLS_RX_MODE:
1768 u8Ack = vnetControlRx(pThis, &CtlHdr, &elem);
1769 break;
1770 case VNET_CTRL_CLS_MAC:
1771 u8Ack = vnetControlMac(pThis, &CtlHdr, &elem);
1772 break;
1773 case VNET_CTRL_CLS_VLAN:
1774 u8Ack = vnetControlVlan(pThis, &CtlHdr, &elem);
1775 break;
1776 default:
1777 u8Ack = VNET_ERROR;
1778 }
1779 Log(("%s Processed control message %u, ack=%u.\n", INSTANCE(pThis), CtlHdr.u8Class, u8Ack));
1780 PDMDevHlpPCIPhysWrite(pThis->VPCI.CTX_SUFF(pDevIns),
1781 elem.aSegsIn[elem.nIn - 1].addr,
1782 &u8Ack, sizeof(u8Ack));
1783 }
1784 vqueuePut(&pThis->VPCI, pQueue, &elem, sizeof(u8Ack));
1785 vqueueSync(&pThis->VPCI, pQueue);
1786 }
1787}
1788
1789
1790/* -=-=-=-=- Saved state -=-=-=-=- */
1791
1792/**
1793 * Saves the configuration.
1794 *
1795 * @param pThis The VNET state.
1796 * @param pSSM The handle to the saved state.
1797 */
1798static void vnetSaveConfig(PVNETSTATE pThis, PSSMHANDLE pSSM)
1799{
1800 SSMR3PutMem(pSSM, &pThis->macConfigured, sizeof(pThis->macConfigured));
1801}
1802
1803
1804/**
1805 * @callback_method_impl{FNSSMDEVLIVEEXEC}
1806 */
1807static DECLCALLBACK(int) vnetLiveExec(PPDMDEVINS pDevIns, PSSMHANDLE pSSM, uint32_t uPass)
1808{
1809 RT_NOREF(uPass);
1810 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1811 vnetSaveConfig(pThis, pSSM);
1812 return VINF_SSM_DONT_CALL_AGAIN;
1813}
1814
1815
1816/**
1817 * @callback_method_impl{FNSSMDEVSAVEPREP}
1818 */
1819static DECLCALLBACK(int) vnetSavePrep(PPDMDEVINS pDevIns, PSSMHANDLE pSSM)
1820{
1821 RT_NOREF(pSSM);
1822 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1823
1824 int rc = vnetCsRxEnter(pThis, VERR_SEM_BUSY);
1825 if (RT_UNLIKELY(rc != VINF_SUCCESS))
1826 return rc;
1827 vnetCsRxLeave(pThis);
1828 return VINF_SUCCESS;
1829}
1830
1831
1832/**
1833 * @callback_method_impl{FNSSMDEVSAVEEXEC}
1834 */
1835static DECLCALLBACK(int) vnetSaveExec(PPDMDEVINS pDevIns, PSSMHANDLE pSSM)
1836{
1837 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1838
1839 /* Save config first */
1840 vnetSaveConfig(pThis, pSSM);
1841
1842 /* Save the common part */
1843 int rc = vpciSaveExec(&pThis->VPCI, pSSM);
1844 AssertRCReturn(rc, rc);
1845 /* Save device-specific part */
1846 rc = SSMR3PutMem( pSSM, pThis->config.mac.au8, sizeof(pThis->config.mac));
1847 AssertRCReturn(rc, rc);
1848 rc = SSMR3PutBool(pSSM, pThis->fPromiscuous);
1849 AssertRCReturn(rc, rc);
1850 rc = SSMR3PutBool(pSSM, pThis->fAllMulti);
1851 AssertRCReturn(rc, rc);
1852 rc = SSMR3PutU32( pSSM, pThis->nMacFilterEntries);
1853 AssertRCReturn(rc, rc);
1854 rc = SSMR3PutMem( pSSM, pThis->aMacFilter,
1855 pThis->nMacFilterEntries * sizeof(RTMAC));
1856 AssertRCReturn(rc, rc);
1857 rc = SSMR3PutMem( pSSM, pThis->aVlanFilter, sizeof(pThis->aVlanFilter));
1858 AssertRCReturn(rc, rc);
1859 Log(("%s State has been saved\n", INSTANCE(pThis)));
1860 return VINF_SUCCESS;
1861}
1862
1863
1864/**
1865 * @callback_method_impl{FNSSMDEVLOADPREP, Serializes the receive thread, it may
1866 * be working inside the critsect. }
1867 */
1868static DECLCALLBACK(int) vnetLoadPrep(PPDMDEVINS pDevIns, PSSMHANDLE pSSM)
1869{
1870 RT_NOREF(pSSM);
1871 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1872
1873 int rc = vnetCsRxEnter(pThis, VERR_SEM_BUSY);
1874 if (RT_UNLIKELY(rc != VINF_SUCCESS))
1875 return rc;
1876 vnetCsRxLeave(pThis);
1877 return VINF_SUCCESS;
1878}
1879
1880
1881/**
1882 * @callback_method_impl{FNSSMDEVLOADEXEC}
1883 */
1884static DECLCALLBACK(int) vnetLoadExec(PPDMDEVINS pDevIns, PSSMHANDLE pSSM, uint32_t uVersion, uint32_t uPass)
1885{
1886 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1887 int rc;
1888
1889 /* config checks */
1890 RTMAC macConfigured;
1891 rc = SSMR3GetMem(pSSM, &macConfigured, sizeof(macConfigured));
1892 AssertRCReturn(rc, rc);
1893 if (memcmp(&macConfigured, &pThis->macConfigured, sizeof(macConfigured))
1894 && (uPass == 0 || !PDMDevHlpVMTeleportedAndNotFullyResumedYet(pDevIns)))
1895 LogRel(("%s: The mac address differs: config=%RTmac saved=%RTmac\n", INSTANCE(pThis), &pThis->macConfigured, &macConfigured));
1896
1897 rc = vpciLoadExec(&pThis->VPCI, pSSM, uVersion, uPass, VNET_N_QUEUES);
1898 AssertRCReturn(rc, rc);
1899
1900 if (uPass == SSM_PASS_FINAL)
1901 {
1902 rc = SSMR3GetMem( pSSM, pThis->config.mac.au8,
1903 sizeof(pThis->config.mac));
1904 AssertRCReturn(rc, rc);
1905
1906 if (uVersion > VIRTIO_SAVEDSTATE_VERSION_3_1_BETA1)
1907 {
1908 rc = SSMR3GetBool(pSSM, &pThis->fPromiscuous);
1909 AssertRCReturn(rc, rc);
1910 rc = SSMR3GetBool(pSSM, &pThis->fAllMulti);
1911 AssertRCReturn(rc, rc);
1912 rc = SSMR3GetU32(pSSM, &pThis->nMacFilterEntries);
1913 AssertRCReturn(rc, rc);
1914 rc = SSMR3GetMem(pSSM, pThis->aMacFilter,
1915 pThis->nMacFilterEntries * sizeof(RTMAC));
1916 AssertRCReturn(rc, rc);
1917 /* Clear the rest. */
1918 if (pThis->nMacFilterEntries < VNET_MAC_FILTER_LEN)
1919 memset(&pThis->aMacFilter[pThis->nMacFilterEntries],
1920 0,
1921 (VNET_MAC_FILTER_LEN - pThis->nMacFilterEntries)
1922 * sizeof(RTMAC));
1923 rc = SSMR3GetMem(pSSM, pThis->aVlanFilter,
1924 sizeof(pThis->aVlanFilter));
1925 AssertRCReturn(rc, rc);
1926 }
1927 else
1928 {
1929 pThis->fPromiscuous = true;
1930 pThis->fAllMulti = false;
1931 pThis->nMacFilterEntries = 0;
1932 memset(pThis->aMacFilter, 0, VNET_MAC_FILTER_LEN * sizeof(RTMAC));
1933 memset(pThis->aVlanFilter, 0, sizeof(pThis->aVlanFilter));
1934 if (pThis->pDrv)
1935 pThis->pDrv->pfnSetPromiscuousMode(pThis->pDrv, true);
1936 }
1937 }
1938
1939 return rc;
1940}
1941
1942
1943/**
1944 * @callback_method_impl{FNSSMDEVLOADDONE, Link status adjustments after
1945 * loading.}
1946 */
1947static DECLCALLBACK(int) vnetLoadDone(PPDMDEVINS pDevIns, PSSMHANDLE pSSM)
1948{
1949 RT_NOREF(pSSM);
1950 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1951
1952 if (pThis->pDrv)
1953 pThis->pDrv->pfnSetPromiscuousMode(pThis->pDrv,
1954 (pThis->fPromiscuous | pThis->fAllMulti));
1955 /*
1956 * Indicate link down to the guest OS that all network connections have
1957 * been lost, unless we've been teleported here.
1958 */
1959 if (!PDMDevHlpVMTeleportedAndNotFullyResumedYet(pDevIns))
1960 vnetTempLinkDown(pThis);
1961
1962 return VINF_SUCCESS;
1963}
1964
1965
1966/* -=-=-=-=- PCI Device -=-=-=-=- */
1967
1968/**
1969 * @callback_method_impl{FNPCIIOREGIONMAP}
1970 */
1971static DECLCALLBACK(int) vnetMap(PPDMDEVINS pDevIns, PPDMPCIDEV pPciDev, uint32_t iRegion,
1972 RTGCPHYS GCPhysAddress, RTGCPHYS cb, PCIADDRESSSPACE enmType)
1973{
1974 RT_NOREF(pPciDev, iRegion);
1975 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
1976 int rc;
1977
1978 if (enmType != PCI_ADDRESS_SPACE_IO)
1979 {
1980 /* We should never get here */
1981 AssertMsgFailed(("Invalid PCI address space param in map callback"));
1982 return VERR_INTERNAL_ERROR;
1983 }
1984
1985 pThis->VPCI.IOPortBase = (RTIOPORT)GCPhysAddress;
1986 rc = PDMDevHlpIOPortRegister(pDevIns, pThis->VPCI.IOPortBase,
1987 cb, 0, vnetIOPortOut, vnetIOPortIn,
1988 NULL, NULL, "VirtioNet");
1989#ifdef VNET_GC_SUPPORT
1990 AssertRCReturn(rc, rc);
1991 rc = PDMDevHlpIOPortRegisterR0(pDevIns, pThis->VPCI.IOPortBase,
1992 cb, 0, "vnetIOPortOut", "vnetIOPortIn",
1993 NULL, NULL, "VirtioNet");
1994 AssertRCReturn(rc, rc);
1995 rc = PDMDevHlpIOPortRegisterRC(pDevIns, pThis->VPCI.IOPortBase,
1996 cb, 0, "vnetIOPortOut", "vnetIOPortIn",
1997 NULL, NULL, "VirtioNet");
1998#endif
1999 AssertRC(rc);
2000 return rc;
2001}
2002
2003
2004/* -=-=-=-=- PDMDEVREG -=-=-=-=- */
2005
2006/**
2007 * @interface_method_impl{PDMDEVREG,pfnDetach}
2008 */
2009static DECLCALLBACK(void) vnetDetach(PPDMDEVINS pDevIns, unsigned iLUN, uint32_t fFlags)
2010{
2011 RT_NOREF(fFlags);
2012 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
2013 Log(("%s vnetDetach:\n", INSTANCE(pThis)));
2014
2015 AssertLogRelReturnVoid(iLUN == 0);
2016
2017 int rc = vnetCsEnter(pThis, VERR_SEM_BUSY);
2018 if (RT_FAILURE(rc))
2019 {
2020 LogRel(("vnetDetach failed to enter critical section!\n"));
2021 return;
2022 }
2023
2024 vnetDestroyTxThreadAndEvent(pThis);
2025 /*
2026 * Zero some important members.
2027 */
2028 pThis->pDrvBase = NULL;
2029 pThis->pDrv = NULL;
2030
2031 vnetCsLeave(pThis);
2032}
2033
2034
2035/**
2036 * @interface_method_impl{PDMDEVREG,pfnAttach}
2037 */
2038static DECLCALLBACK(int) vnetAttach(PPDMDEVINS pDevIns, unsigned iLUN, uint32_t fFlags)
2039{
2040 RT_NOREF(fFlags);
2041 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
2042 LogFlow(("%s vnetAttach:\n", INSTANCE(pThis)));
2043
2044 AssertLogRelReturn(iLUN == 0, VERR_PDM_NO_SUCH_LUN);
2045
2046 int rc = vnetCsEnter(pThis, VERR_SEM_BUSY);
2047 if (RT_FAILURE(rc))
2048 {
2049 LogRel(("vnetAttach failed to enter critical section!\n"));
2050 return rc;
2051 }
2052
2053 /*
2054 * Attach the driver.
2055 */
2056 rc = PDMDevHlpDriverAttach(pDevIns, 0, &pThis->VPCI.IBase, &pThis->pDrvBase, "Network Port");
2057 if (RT_SUCCESS(rc))
2058 {
2059 if (rc == VINF_NAT_DNS)
2060 {
2061#ifdef RT_OS_LINUX
2062 PDMDevHlpVMSetRuntimeError(pDevIns, 0 /*fFlags*/, "NoDNSforNAT",
2063 N_("A Domain Name Server (DNS) for NAT networking could not be determined. Please check your /etc/resolv.conf for <tt>nameserver</tt> entries. Either add one manually (<i>man resolv.conf</i>) or ensure that your host is correctly connected to an ISP. If you ignore this warning the guest will not be able to perform nameserver lookups and it will probably observe delays if trying so"));
2064#else
2065 PDMDevHlpVMSetRuntimeError(pDevIns, 0 /*fFlags*/, "NoDNSforNAT",
2066 N_("A Domain Name Server (DNS) for NAT networking could not be determined. Ensure that your host is correctly connected to an ISP. If you ignore this warning the guest will not be able to perform nameserver lookups and it will probably observe delays if trying so"));
2067#endif
2068 }
2069 pThis->pDrv = PDMIBASE_QUERY_INTERFACE(pThis->pDrvBase, PDMINETWORKUP);
2070 AssertMsgStmt(pThis->pDrv, ("Failed to obtain the PDMINETWORKUP interface!\n"),
2071 rc = VERR_PDM_MISSING_INTERFACE_BELOW);
2072
2073 vnetCreateTxThreadAndEvent(pDevIns, pThis);
2074 }
2075 else if ( rc == VERR_PDM_NO_ATTACHED_DRIVER
2076 || rc == VERR_PDM_CFG_MISSING_DRIVER_NAME)
2077 {
2078 /* This should never happen because this function is not called
2079 * if there is no driver to attach! */
2080 Log(("%s No attached driver!\n", INSTANCE(pThis)));
2081 }
2082
2083 /*
2084 * Temporary set the link down if it was up so that the guest
2085 * will know that we have change the configuration of the
2086 * network card
2087 */
2088 if (RT_SUCCESS(rc))
2089 vnetTempLinkDown(pThis);
2090
2091 vnetCsLeave(pThis);
2092 return rc;
2093
2094}
2095
2096
2097/**
2098 * @interface_method_impl{PDMDEVREG,pfnSuspend}
2099 */
2100static DECLCALLBACK(void) vnetSuspend(PPDMDEVINS pDevIns)
2101{
2102 /* Poke thread waiting for buffer space. */
2103 vnetWakeupReceive(pDevIns);
2104}
2105
2106
2107/**
2108 * @interface_method_impl{PDMDEVREG,pfnPowerOff}
2109 */
2110static DECLCALLBACK(void) vnetPowerOff(PPDMDEVINS pDevIns)
2111{
2112 /* Poke thread waiting for buffer space. */
2113 vnetWakeupReceive(pDevIns);
2114}
2115
2116
2117/**
2118 * @interface_method_impl{PDMDEVREG,pfnRelocate}
2119 */
2120static DECLCALLBACK(void) vnetRelocate(PPDMDEVINS pDevIns, RTGCINTPTR offDelta)
2121{
2122 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
2123 vpciRelocate(pDevIns, offDelta);
2124 pThis->pCanRxQueueRC = PDMQueueRCPtr(pThis->pCanRxQueueR3);
2125#ifdef VNET_TX_DELAY
2126 pThis->pTxTimerRC = TMTimerRCPtr(pThis->pTxTimerR3);
2127#endif /* VNET_TX_DELAY */
2128 // TBD
2129}
2130
2131
2132/**
2133 * @interface_method_impl{PDMDEVREG,pfnDestruct}
2134 */
2135static DECLCALLBACK(int) vnetDestruct(PPDMDEVINS pDevIns)
2136{
2137 PDMDEV_CHECK_VERSIONS_RETURN_QUIET(pDevIns);
2138 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
2139
2140#ifdef VNET_TX_DELAY
2141 LogRel(("TxTimer stats (avg/min/max): %7d usec %7d usec %7d usec\n",
2142 pThis->u32AvgDiff, pThis->u32MinDiff, pThis->u32MaxDiff));
2143#endif /* VNET_TX_DELAY */
2144 Log(("%s Destroying instance\n", INSTANCE(pThis)));
2145 if (pThis->hEventMoreRxDescAvail != NIL_RTSEMEVENT)
2146 {
2147 RTSemEventSignal(pThis->hEventMoreRxDescAvail);
2148 RTSemEventDestroy(pThis->hEventMoreRxDescAvail);
2149 pThis->hEventMoreRxDescAvail = NIL_RTSEMEVENT;
2150 }
2151
2152 // if (PDMCritSectIsInitialized(&pThis->csRx))
2153 // PDMR3CritSectDelete(&pThis->csRx);
2154
2155 return vpciDestruct(&pThis->VPCI);
2156}
2157
2158
2159/**
2160 * @interface_method_impl{PDMDEVREG,pfnConstruct}
2161 */
2162static DECLCALLBACK(int) vnetConstruct(PPDMDEVINS pDevIns, int iInstance, PCFGMNODE pCfg)
2163{
2164 PDMDEV_CHECK_VERSIONS_RETURN(pDevIns);
2165 PVNETSTATE pThis = PDMINS_2_DATA(pDevIns, PVNETSTATE);
2166 int rc;
2167
2168 /* Initialize the instance data suffiencently for the destructor not to blow up. */
2169 pThis->hEventMoreRxDescAvail = NIL_RTSEMEVENT;
2170
2171 /* Do our own locking. */
2172 rc = PDMDevHlpSetDeviceCritSect(pDevIns, PDMDevHlpCritSectGetNop(pDevIns));
2173 AssertRCReturn(rc, rc);
2174
2175 /* Initialize PCI part. */
2176 pThis->VPCI.IBase.pfnQueryInterface = vnetQueryInterface;
2177 rc = vpciConstruct(pDevIns, &pThis->VPCI, iInstance,
2178 VNET_NAME_FMT, VIRTIO_NET_ID,
2179 VNET_PCI_CLASS, VNET_N_QUEUES);
2180 pThis->pRxQueue = vpciAddQueue(&pThis->VPCI, 256, vnetQueueReceive, "RX ");
2181 pThis->pTxQueue = vpciAddQueue(&pThis->VPCI, 256, vnetQueueTransmit, "TX ");
2182 pThis->pCtlQueue = vpciAddQueue(&pThis->VPCI, 16, vnetQueueControl, "CTL");
2183
2184 Log(("%s Constructing new instance\n", INSTANCE(pThis)));
2185
2186 /*
2187 * Validate configuration.
2188 */
2189 if (!CFGMR3AreValuesValid(pCfg, "MAC\0" "CableConnected\0" "LineSpeed\0" "LinkUpDelay\0"))
2190 return PDMDEV_SET_ERROR(pDevIns, VERR_PDM_DEVINS_UNKNOWN_CFG_VALUES, N_("Invalid configuration for VirtioNet device"));
2191
2192 /* Get config params */
2193 rc = CFGMR3QueryBytes(pCfg, "MAC", pThis->macConfigured.au8,
2194 sizeof(pThis->macConfigured));
2195 if (RT_FAILURE(rc))
2196 return PDMDEV_SET_ERROR(pDevIns, rc,
2197 N_("Configuration error: Failed to get MAC address"));
2198 rc = CFGMR3QueryBool(pCfg, "CableConnected", &pThis->fCableConnected);
2199 if (RT_FAILURE(rc))
2200 return PDMDEV_SET_ERROR(pDevIns, rc,
2201 N_("Configuration error: Failed to get the value of 'CableConnected'"));
2202 rc = CFGMR3QueryU32Def(pCfg, "LinkUpDelay", (uint32_t*)&pThis->cMsLinkUpDelay, 5000); /* ms */
2203 if (RT_FAILURE(rc))
2204 return PDMDEV_SET_ERROR(pDevIns, rc,
2205 N_("Configuration error: Failed to get the value of 'LinkUpDelay'"));
2206 Assert(pThis->cMsLinkUpDelay <= 300000); /* less than 5 minutes */
2207 if (pThis->cMsLinkUpDelay > 5000 || pThis->cMsLinkUpDelay < 100)
2208 {
2209 LogRel(("%s WARNING! Link up delay is set to %u seconds!\n",
2210 INSTANCE(pThis), pThis->cMsLinkUpDelay / 1000));
2211 }
2212 Log(("%s Link up delay is set to %u seconds\n",
2213 INSTANCE(pThis), pThis->cMsLinkUpDelay / 1000));
2214
2215
2216 vnetPrintFeatures(pThis, vnetIoCb_GetHostFeatures(pThis), "Device supports the following features");
2217
2218 /* Initialize PCI config space */
2219 memcpy(pThis->config.mac.au8, pThis->macConfigured.au8, sizeof(pThis->config.mac.au8));
2220 pThis->config.uStatus = 0;
2221
2222 /* Initialize state structure */
2223 pThis->u32PktNo = 1;
2224
2225 /* Interfaces */
2226 pThis->INetworkDown.pfnWaitReceiveAvail = vnetNetworkDown_WaitReceiveAvail;
2227 pThis->INetworkDown.pfnReceive = vnetNetworkDown_Receive;
2228 pThis->INetworkDown.pfnReceiveGso = vnetNetworkDown_ReceiveGso;
2229 pThis->INetworkDown.pfnXmitPending = vnetNetworkDown_XmitPending;
2230
2231 pThis->INetworkConfig.pfnGetMac = vnetGetMac;
2232 pThis->INetworkConfig.pfnGetLinkState = vnetGetLinkState;
2233 pThis->INetworkConfig.pfnSetLinkState = vnetSetLinkState;
2234
2235 /* Initialize critical section. */
2236 // char szTmp[sizeof(pThis->VPCI.szInstance) + 2];
2237 // RTStrPrintf(szTmp, sizeof(szTmp), "%sRX", pThis->VPCI.szInstance);
2238 // rc = PDMDevHlpCritSectInit(pDevIns, &pThis->csRx, szTmp);
2239 // if (RT_FAILURE(rc))
2240 // return rc;
2241
2242 /* Map our ports to IO space. */
2243 rc = PDMDevHlpPCIIORegionRegister(pDevIns, 0,
2244 VPCI_CONFIG + sizeof(VNetPCIConfig),
2245 PCI_ADDRESS_SPACE_IO, vnetMap);
2246 if (RT_FAILURE(rc))
2247 return rc;
2248
2249
2250 /* Register save/restore state handlers. */
2251 rc = PDMDevHlpSSMRegisterEx(pDevIns, VIRTIO_SAVEDSTATE_VERSION, sizeof(VNETSTATE), NULL,
2252 NULL, vnetLiveExec, NULL,
2253 vnetSavePrep, vnetSaveExec, NULL,
2254 vnetLoadPrep, vnetLoadExec, vnetLoadDone);
2255 if (RT_FAILURE(rc))
2256 return rc;
2257
2258 /* Create the RX notifier signaller. */
2259 rc = PDMDevHlpQueueCreate(pDevIns, sizeof(PDMQUEUEITEMCORE), 1, 0,
2260 vnetCanRxQueueConsumer, true, "VNet-Rcv", &pThis->pCanRxQueueR3);
2261 if (RT_FAILURE(rc))
2262 return rc;
2263 pThis->pCanRxQueueR0 = PDMQueueR0Ptr(pThis->pCanRxQueueR3);
2264 pThis->pCanRxQueueRC = PDMQueueRCPtr(pThis->pCanRxQueueR3);
2265
2266 /* Create Link Up Timer */
2267 rc = PDMDevHlpTMTimerCreate(pDevIns, TMCLOCK_VIRTUAL, vnetLinkUpTimer, pThis,
2268 TMTIMER_FLAGS_NO_CRIT_SECT,
2269 "VirtioNet Link Up Timer", &pThis->pLinkUpTimer);
2270 if (RT_FAILURE(rc))
2271 return rc;
2272
2273#ifndef VNET_TX_DELAY
2274 pThis->pSupDrvSession = PDMDevHlpGetSupDrvSession(pDevIns);
2275 pThis->hTxEvent = NIL_SUPSEMEVENT;
2276 pThis->pTxThread = NULL;
2277#else /* VNET_TX_DELAY */
2278 /* Create Transmit Delay Timer */
2279 rc = PDMDevHlpTMTimerCreate(pDevIns, TMCLOCK_VIRTUAL, vnetTxTimer, pThis,
2280 TMTIMER_FLAGS_NO_CRIT_SECT,
2281 "VirtioNet TX Delay Timer", &pThis->pTxTimerR3);
2282 if (RT_FAILURE(rc))
2283 return rc;
2284 pThis->pTxTimerR0 = TMTimerR0Ptr(pThis->pTxTimerR3);
2285 pThis->pTxTimerRC = TMTimerRCPtr(pThis->pTxTimerR3);
2286
2287 pThis->u32i = pThis->u32AvgDiff = pThis->u32MaxDiff = 0;
2288 pThis->u32MinDiff = UINT32_MAX;
2289#endif /* VNET_TX_DELAY */
2290
2291 rc = PDMDevHlpDriverAttach(pDevIns, 0, &pThis->VPCI.IBase, &pThis->pDrvBase, "Network Port");
2292 if (RT_SUCCESS(rc))
2293 {
2294 if (rc == VINF_NAT_DNS)
2295 {
2296 PDMDevHlpVMSetRuntimeError(pDevIns, 0 /*fFlags*/, "NoDNSforNAT",
2297 N_("A Domain Name Server (DNS) for NAT networking could not be determined. Ensure that your host is correctly connected to an ISP. If you ignore this warning the guest will not be able to perform nameserver lookups and it will probably observe delays if trying so"));
2298 }
2299 pThis->pDrv = PDMIBASE_QUERY_INTERFACE(pThis->pDrvBase, PDMINETWORKUP);
2300 AssertMsgReturn(pThis->pDrv, ("Failed to obtain the PDMINETWORKUP interface!\n"),
2301 VERR_PDM_MISSING_INTERFACE_BELOW);
2302
2303 vnetCreateTxThreadAndEvent(pDevIns, pThis);
2304 }
2305 else if ( rc == VERR_PDM_NO_ATTACHED_DRIVER
2306 || rc == VERR_PDM_CFG_MISSING_DRIVER_NAME )
2307 {
2308 /* No error! */
2309 Log(("%s This adapter is not attached to any network!\n", INSTANCE(pThis)));
2310 }
2311 else
2312 return PDMDEV_SET_ERROR(pDevIns, rc, N_("Failed to attach the network LUN"));
2313
2314 rc = RTSemEventCreate(&pThis->hEventMoreRxDescAvail);
2315 if (RT_FAILURE(rc))
2316 return rc;
2317
2318 rc = vnetIoCb_Reset(pThis);
2319 AssertRC(rc);
2320
2321 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatReceiveBytes, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_BYTES, "Amount of data received", "/Public/Net/VNet%u/BytesReceived", iInstance);
2322 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitBytes, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_BYTES, "Amount of data transmitted", "/Public/Net/VNet%u/BytesTransmitted", iInstance);
2323
2324 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatReceiveBytes, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_BYTES, "Amount of data received", "/Devices/VNet%d/ReceiveBytes", iInstance);
2325 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitBytes, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_BYTES, "Amount of data transmitted", "/Devices/VNet%d/TransmitBytes", iInstance);
2326 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatReceiveGSO, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Number of received GSO packets", "/Devices/VNet%d/Packets/ReceiveGSO", iInstance);
2327 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitPackets, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Number of sent packets", "/Devices/VNet%d/Packets/Transmit", iInstance);
2328 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitGSO, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Number of sent GSO packets", "/Devices/VNet%d/Packets/Transmit-Gso", iInstance);
2329 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitCSum, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Number of completed TX checksums", "/Devices/VNet%d/Packets/Transmit-Csum", iInstance);
2330#if defined(VBOX_WITH_STATISTICS)
2331 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatReceive, STAMTYPE_PROFILE, STAMVISIBILITY_ALWAYS, STAMUNIT_TICKS_PER_CALL, "Profiling receive", "/Devices/VNet%d/Receive/Total", iInstance);
2332 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatReceiveStore, STAMTYPE_PROFILE, STAMVISIBILITY_ALWAYS, STAMUNIT_TICKS_PER_CALL, "Profiling receive storing", "/Devices/VNet%d/Receive/Store", iInstance);
2333 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatRxOverflow, STAMTYPE_PROFILE, STAMVISIBILITY_ALWAYS, STAMUNIT_TICKS_PER_OCCURENCE, "Profiling RX overflows", "/Devices/VNet%d/RxOverflow", iInstance);
2334 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatRxOverflowWakeup, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_OCCURENCES, "Nr of RX overflow wakeups", "/Devices/VNet%d/RxOverflowWakeup", iInstance);
2335 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmit, STAMTYPE_PROFILE, STAMVISIBILITY_ALWAYS, STAMUNIT_TICKS_PER_CALL, "Profiling transmits in HC", "/Devices/VNet%d/Transmit/Total", iInstance);
2336 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitSend, STAMTYPE_PROFILE, STAMVISIBILITY_ALWAYS, STAMUNIT_TICKS_PER_CALL, "Profiling send transmit in HC", "/Devices/VNet%d/Transmit/Send", iInstance);
2337 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitByNetwork, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Network-initiated transmissions", "/Devices/VNet%d/Transmit/ByNetwork", iInstance);
2338 PDMDevHlpSTAMRegisterF(pDevIns, &pThis->StatTransmitByThread, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS, STAMUNIT_COUNT, "Thread-initiated transmissions", "/Devices/VNet%d/Transmit/ByThread", iInstance);
2339#endif /* VBOX_WITH_STATISTICS */
2340
2341 return VINF_SUCCESS;
2342}
2343
2344/**
2345 * The device registration structure.
2346 */
2347const PDMDEVREG g_DeviceVirtioNet =
2348{
2349 /* Structure version. PDM_DEVREG_VERSION defines the current version. */
2350 PDM_DEVREG_VERSION,
2351 /* Device name. */
2352 "virtio-net",
2353 /* Name of guest context module (no path).
2354 * Only evalutated if PDM_DEVREG_FLAGS_RC is set. */
2355 "VBoxDDRC.rc",
2356 /* Name of ring-0 module (no path).
2357 * Only evalutated if PDM_DEVREG_FLAGS_RC is set. */
2358 "VBoxDDR0.r0",
2359 /* The description of the device. The UTF-8 string pointed to shall, like this structure,
2360 * remain unchanged from registration till VM destruction. */
2361 "Virtio Ethernet.\n",
2362
2363 /* Flags, combination of the PDM_DEVREG_FLAGS_* \#defines. */
2364#ifdef VNET_GC_SUPPORT
2365 PDM_DEVREG_FLAGS_DEFAULT_BITS | PDM_DEVREG_FLAGS_RC | PDM_DEVREG_FLAGS_R0,
2366#else
2367 PDM_DEVREG_FLAGS_DEFAULT_BITS,
2368#endif
2369 /* Device class(es), combination of the PDM_DEVREG_CLASS_* \#defines. */
2370 PDM_DEVREG_CLASS_NETWORK,
2371 /* Maximum number of instances (per VM). */
2372 ~0U,
2373 /* Size of the instance data. */
2374 sizeof(VNETSTATE),
2375
2376 /* pfnConstruct */
2377 vnetConstruct,
2378 /* pfnDestruct */
2379 vnetDestruct,
2380 /* pfnRelocate */
2381 vnetRelocate,
2382 /* pfnMemSetup. */
2383 NULL,
2384 /* pfnPowerOn */
2385 NULL,
2386 /* pfnReset */
2387 NULL,
2388 /* pfnSuspend */
2389 vnetSuspend,
2390 /* pfnResume */
2391 NULL,
2392 /* pfnAttach */
2393 vnetAttach,
2394 /* pfnDetach */
2395 vnetDetach,
2396 /* pfnQueryInterface */
2397 NULL,
2398 /* pfnInitComplete */
2399 NULL,
2400 /* pfnPowerOff */
2401 vnetPowerOff,
2402 /* pfnSoftReset */
2403 NULL,
2404
2405 /* u32VersionEnd */
2406 PDM_DEVREG_VERSION
2407};
2408
2409#endif /* IN_RING3 */
2410#endif /* !VBOX_DEVICE_STRUCT_TESTCASE */
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette