VirtualBox

source: vbox/trunk/src/VBox/Storage/VD.cpp@ 49133

Last change on this file since 49133 was 48957, checked in by vboxsync, 11 years ago

Storage: Whitespace cleanups by scm.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 348.6 KB
Line 
1/* $Id: VD.cpp 48957 2013-10-07 22:04:36Z vboxsync $ */
2/** @file
3 * VBoxHDD - VBox HDD Container implementation.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18/*******************************************************************************
19* Header Files *
20*******************************************************************************/
21#define LOG_GROUP LOG_GROUP_VD
22#include <VBox/vd.h>
23#include <VBox/err.h>
24#include <VBox/sup.h>
25#include <VBox/log.h>
26
27#include <iprt/alloc.h>
28#include <iprt/assert.h>
29#include <iprt/uuid.h>
30#include <iprt/file.h>
31#include <iprt/string.h>
32#include <iprt/asm.h>
33#include <iprt/ldr.h>
34#include <iprt/dir.h>
35#include <iprt/path.h>
36#include <iprt/param.h>
37#include <iprt/memcache.h>
38#include <iprt/sg.h>
39#include <iprt/list.h>
40#include <iprt/avl.h>
41#include <iprt/semaphore.h>
42
43#include <VBox/vd-plugin.h>
44#include <VBox/vd-cache-plugin.h>
45
46/** Disable dynamic backends on non x86 architectures. This feature
47 * requires the SUPR3 library which is not available there.
48 */
49#if !defined(VBOX_HDD_NO_DYNAMIC_BACKENDS) && !defined(RT_ARCH_X86) && !defined(RT_ARCH_AMD64)
50# define VBOX_HDD_NO_DYNAMIC_BACKENDS
51#endif
52
53#define VBOXHDDDISK_SIGNATURE 0x6f0e2a7d
54
55/** Buffer size used for merging images. */
56#define VD_MERGE_BUFFER_SIZE (16 * _1M)
57
58/** Maximum number of segments in one I/O task. */
59#define VD_IO_TASK_SEGMENTS_MAX 64
60
61/** Threshold after not recently used blocks are removed from the list. */
62#define VD_DISCARD_REMOVE_THRESHOLD (10 * _1M) /** @todo: experiment */
63
64/**
65 * VD async I/O interface storage descriptor.
66 */
67typedef struct VDIIOFALLBACKSTORAGE
68{
69 /** File handle. */
70 RTFILE File;
71 /** Completion callback. */
72 PFNVDCOMPLETED pfnCompleted;
73 /** Thread for async access. */
74 RTTHREAD ThreadAsync;
75} VDIIOFALLBACKSTORAGE, *PVDIIOFALLBACKSTORAGE;
76
77/**
78 * Structure containing everything I/O related
79 * for the image and cache descriptors.
80 */
81typedef struct VDIO
82{
83 /** I/O interface to the upper layer. */
84 PVDINTERFACEIO pInterfaceIo;
85
86 /** Per image internal I/O interface. */
87 VDINTERFACEIOINT VDIfIoInt;
88
89 /** Fallback I/O interface, only used if the caller doesn't provide it. */
90 VDINTERFACEIO VDIfIo;
91
92 /** Opaque backend data. */
93 void *pBackendData;
94 /** Disk this image is part of */
95 PVBOXHDD pDisk;
96 /** Flag whether to ignore flush requests. */
97 bool fIgnoreFlush;
98} VDIO, *PVDIO;
99
100/** Forward declaration of an I/O task */
101typedef struct VDIOTASK *PVDIOTASK;
102
103/**
104 * VBox HDD Container image descriptor.
105 */
106typedef struct VDIMAGE
107{
108 /** Link to parent image descriptor, if any. */
109 struct VDIMAGE *pPrev;
110 /** Link to child image descriptor, if any. */
111 struct VDIMAGE *pNext;
112 /** Container base filename. (UTF-8) */
113 char *pszFilename;
114 /** Data managed by the backend which keeps the actual info. */
115 void *pBackendData;
116 /** Cached sanitized image flags. */
117 unsigned uImageFlags;
118 /** Image open flags (only those handled generically in this code and which
119 * the backends will never ever see). */
120 unsigned uOpenFlags;
121
122 /** Function pointers for the various backend methods. */
123 PCVBOXHDDBACKEND Backend;
124 /** Pointer to list of VD interfaces, per-image. */
125 PVDINTERFACE pVDIfsImage;
126 /** I/O related things. */
127 VDIO VDIo;
128} VDIMAGE, *PVDIMAGE;
129
130/**
131 * uModified bit flags.
132 */
133#define VD_IMAGE_MODIFIED_FLAG RT_BIT(0)
134#define VD_IMAGE_MODIFIED_FIRST RT_BIT(1)
135#define VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE RT_BIT(2)
136
137
138/**
139 * VBox HDD Cache image descriptor.
140 */
141typedef struct VDCACHE
142{
143 /** Cache base filename. (UTF-8) */
144 char *pszFilename;
145 /** Data managed by the backend which keeps the actual info. */
146 void *pBackendData;
147 /** Cached sanitized image flags. */
148 unsigned uImageFlags;
149 /** Image open flags (only those handled generically in this code and which
150 * the backends will never ever see). */
151 unsigned uOpenFlags;
152
153 /** Function pointers for the various backend methods. */
154 PCVDCACHEBACKEND Backend;
155
156 /** Pointer to list of VD interfaces, per-cache. */
157 PVDINTERFACE pVDIfsCache;
158 /** I/O related things. */
159 VDIO VDIo;
160} VDCACHE, *PVDCACHE;
161
162/**
163 * A block waiting for a discard.
164 */
165typedef struct VDDISCARDBLOCK
166{
167 /** AVL core. */
168 AVLRU64NODECORE Core;
169 /** LRU list node. */
170 RTLISTNODE NodeLru;
171 /** Number of bytes to discard. */
172 size_t cbDiscard;
173 /** Bitmap of allocated sectors. */
174 void *pbmAllocated;
175} VDDISCARDBLOCK, *PVDDISCARDBLOCK;
176
177/**
178 * VD discard state.
179 */
180typedef struct VDDISCARDSTATE
181{
182 /** Number of bytes waiting for a discard. */
183 size_t cbDiscarding;
184 /** AVL tree with blocks waiting for a discard.
185 * The uOffset + cbDiscard range is the search key. */
186 PAVLRU64TREE pTreeBlocks;
187 /** LRU list of the least frequently discarded blocks.
188 * If there are to many blocks waiting the least frequently used
189 * will be removed and the range will be set to 0.
190 */
191 RTLISTNODE ListLru;
192} VDDISCARDSTATE, *PVDDISCARDSTATE;
193
194/**
195 * VBox HDD Container main structure, private part.
196 */
197struct VBOXHDD
198{
199 /** Structure signature (VBOXHDDDISK_SIGNATURE). */
200 uint32_t u32Signature;
201
202 /** Image type. */
203 VDTYPE enmType;
204
205 /** Number of opened images. */
206 unsigned cImages;
207
208 /** Base image. */
209 PVDIMAGE pBase;
210
211 /** Last opened image in the chain.
212 * The same as pBase if only one image is used. */
213 PVDIMAGE pLast;
214
215 /** If a merge to one of the parents is running this may be non-NULL
216 * to indicate to what image the writes should be additionally relayed. */
217 PVDIMAGE pImageRelay;
218
219 /** Flags representing the modification state. */
220 unsigned uModified;
221
222 /** Cached size of this disk. */
223 uint64_t cbSize;
224 /** Cached PCHS geometry for this disk. */
225 VDGEOMETRY PCHSGeometry;
226 /** Cached LCHS geometry for this disk. */
227 VDGEOMETRY LCHSGeometry;
228
229 /** Pointer to list of VD interfaces, per-disk. */
230 PVDINTERFACE pVDIfsDisk;
231 /** Pointer to the common interface structure for error reporting. */
232 PVDINTERFACEERROR pInterfaceError;
233 /** Pointer to the optional thread synchronization callbacks. */
234 PVDINTERFACETHREADSYNC pInterfaceThreadSync;
235
236 /** Memory cache for I/O contexts */
237 RTMEMCACHE hMemCacheIoCtx;
238 /** Memory cache for I/O tasks. */
239 RTMEMCACHE hMemCacheIoTask;
240 /** An I/O context is currently using the disk structures
241 * Every I/O context must be placed on one of the lists below. */
242 volatile bool fLocked;
243 /** Head of pending I/O tasks waiting for completion - LIFO order. */
244 volatile PVDIOTASK pIoTasksPendingHead;
245 /** Head of newly queued I/O contexts - LIFO order. */
246 volatile PVDIOCTX pIoCtxHead;
247 /** Head of halted I/O contexts which are given back to generic
248 * disk framework by the backend. - LIFO order. */
249 volatile PVDIOCTX pIoCtxHaltedHead;
250
251 /** Head of blocked I/O contexts, processed only
252 * after pIoCtxLockOwner was freed - LIFO order. */
253 volatile PVDIOCTX pIoCtxBlockedHead;
254 /** I/O context which locked the disk for a growing write or flush request.
255 * Other flush or growing write requests need to wait until
256 * the current one completes. - NIL_VDIOCTX if unlocked. */
257 volatile PVDIOCTX pIoCtxLockOwner;
258
259 /** Pointer to the L2 disk cache if any. */
260 PVDCACHE pCache;
261 /** Pointer to the discard state if any. */
262 PVDDISCARDSTATE pDiscard;
263
264 /** Event semaphore for synchronous I/O. */
265 RTSEMEVENT hEventSemSyncIo;
266 /** Status code of the last synchronous I/O request. */
267 int rcSync;
268};
269
270# define VD_IS_LOCKED(a_pDisk) \
271 do \
272 { \
273 AssertMsg(a_pDisk->fLocked, \
274 ("Lock not held\n"));\
275 } while(0)
276
277/**
278 * VBox parent read descriptor, used internally for compaction.
279 */
280typedef struct VDPARENTSTATEDESC
281{
282 /** Pointer to disk descriptor. */
283 PVBOXHDD pDisk;
284 /** Pointer to image descriptor. */
285 PVDIMAGE pImage;
286} VDPARENTSTATEDESC, *PVDPARENTSTATEDESC;
287
288/**
289 * Transfer direction.
290 */
291typedef enum VDIOCTXTXDIR
292{
293 /** Read */
294 VDIOCTXTXDIR_READ = 0,
295 /** Write */
296 VDIOCTXTXDIR_WRITE,
297 /** Flush */
298 VDIOCTXTXDIR_FLUSH,
299 /** Discard */
300 VDIOCTXTXDIR_DISCARD,
301 /** 32bit hack */
302 VDIOCTXTXDIR_32BIT_HACK = 0x7fffffff
303} VDIOCTXTXDIR, *PVDIOCTXTXDIR;
304
305/** Transfer function */
306typedef DECLCALLBACK(int) FNVDIOCTXTRANSFER (PVDIOCTX pIoCtx);
307/** Pointer to a transfer function. */
308typedef FNVDIOCTXTRANSFER *PFNVDIOCTXTRANSFER;
309
310/**
311 * I/O context
312 */
313typedef struct VDIOCTX
314{
315 /** Pointer to the next I/O context. */
316 struct VDIOCTX * volatile pIoCtxNext;
317 /** Disk this is request is for. */
318 PVBOXHDD pDisk;
319 /** Return code. */
320 int rcReq;
321 /** Various flags for the I/O context. */
322 uint32_t fFlags;
323 /** Number of data transfers currently pending. */
324 volatile uint32_t cDataTransfersPending;
325 /** How many meta data transfers are pending. */
326 volatile uint32_t cMetaTransfersPending;
327 /** Flag whether the request finished */
328 volatile bool fComplete;
329 /** Temporary allocated memory which is freed
330 * when the context completes. */
331 void *pvAllocation;
332 /** Transfer function. */
333 PFNVDIOCTXTRANSFER pfnIoCtxTransfer;
334 /** Next transfer part after the current one completed. */
335 PFNVDIOCTXTRANSFER pfnIoCtxTransferNext;
336 /** Transfer direction */
337 VDIOCTXTXDIR enmTxDir;
338 /** Request type dependent data. */
339 union
340 {
341 /** I/O request (read/write). */
342 struct
343 {
344 /** Number of bytes left until this context completes. */
345 volatile uint32_t cbTransferLeft;
346 /** Current offset */
347 volatile uint64_t uOffset;
348 /** Number of bytes to transfer */
349 volatile size_t cbTransfer;
350 /** Current image in the chain. */
351 PVDIMAGE pImageCur;
352 /** Start image to read from. pImageCur is reset to this
353 * value after it reached the first image in the chain. */
354 PVDIMAGE pImageStart;
355 /** S/G buffer */
356 RTSGBUF SgBuf;
357 /** Number of bytes to clear in the buffer before the current read. */
358 size_t cbBufClear;
359 /** Number of images to read. */
360 unsigned cImagesRead;
361 /** Override for the parent image to start reading from. */
362 PVDIMAGE pImageParentOverride;
363 } Io;
364 /** Discard requests. */
365 struct
366 {
367 /** Pointer to the range descriptor array. */
368 PCRTRANGE paRanges;
369 /** Number of ranges in the array. */
370 unsigned cRanges;
371 /** Range descriptor index which is processed. */
372 unsigned idxRange;
373 /** Start offset to discard currently. */
374 uint64_t offCur;
375 /** How many bytes left to discard in the current range. */
376 size_t cbDiscardLeft;
377 /** How many bytes to discard in the current block (<= cbDiscardLeft). */
378 size_t cbThisDiscard;
379 /** Discard block handled currently. */
380 PVDDISCARDBLOCK pBlock;
381 } Discard;
382 } Req;
383 /** Parent I/O context if any. Sets the type of the context (root/child) */
384 PVDIOCTX pIoCtxParent;
385 /** Type dependent data (root/child) */
386 union
387 {
388 /** Root data */
389 struct
390 {
391 /** Completion callback */
392 PFNVDASYNCTRANSFERCOMPLETE pfnComplete;
393 /** User argument 1 passed on completion. */
394 void *pvUser1;
395 /** User argument 2 passed on completion. */
396 void *pvUser2;
397 } Root;
398 /** Child data */
399 struct
400 {
401 /** Saved start offset */
402 uint64_t uOffsetSaved;
403 /** Saved transfer size */
404 size_t cbTransferLeftSaved;
405 /** Number of bytes transferred from the parent if this context completes. */
406 size_t cbTransferParent;
407 /** Number of bytes to pre read */
408 size_t cbPreRead;
409 /** Number of bytes to post read. */
410 size_t cbPostRead;
411 /** Number of bytes to write left in the parent. */
412 size_t cbWriteParent;
413 /** Write type dependent data. */
414 union
415 {
416 /** Optimized */
417 struct
418 {
419 /** Bytes to fill to satisfy the block size. Not part of the virtual disk. */
420 size_t cbFill;
421 /** Bytes to copy instead of reading from the parent */
422 size_t cbWriteCopy;
423 /** Bytes to read from the image. */
424 size_t cbReadImage;
425 } Optimized;
426 } Write;
427 } Child;
428 } Type;
429} VDIOCTX;
430
431/** Default flags for an I/O context, i.e. unblocked and async. */
432#define VDIOCTX_FLAGS_DEFAULT (0)
433/** Flag whether the context is blocked. */
434#define VDIOCTX_FLAGS_BLOCKED RT_BIT_32(0)
435/** Flag whether the I/O context is using synchronous I/O. */
436#define VDIOCTX_FLAGS_SYNC RT_BIT_32(1)
437/** Flag whether the read should update the cache. */
438#define VDIOCTX_FLAGS_READ_UPDATE_CACHE RT_BIT_32(2)
439/** Flag whether free blocks should be zeroed.
440 * If false and no image has data for sepcified
441 * range VERR_VD_BLOCK_FREE is returned for the I/O context.
442 * Note that unallocated blocks are still zeroed
443 * if at least one image has valid data for a part
444 * of the range.
445 */
446#define VDIOCTX_FLAGS_ZERO_FREE_BLOCKS RT_BIT_32(3)
447/** Don't free the I/O context when complete because
448 * it was alloacted elsewhere (stack, ...). */
449#define VDIOCTX_FLAGS_DONT_FREE RT_BIT_32(4)
450/* Don't set the modified flag for this I/O context when writing. */
451#define VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG RT_BIT_32(5)
452
453/** NIL I/O context pointer value. */
454#define NIL_VDIOCTX ((PVDIOCTX)0)
455
456/**
457 * List node for deferred I/O contexts.
458 */
459typedef struct VDIOCTXDEFERRED
460{
461 /** Node in the list of deferred requests.
462 * A request can be deferred if the image is growing
463 * and the request accesses the same range or if
464 * the backend needs to read or write metadata from the disk
465 * before it can continue. */
466 RTLISTNODE NodeDeferred;
467 /** I/O context this entry points to. */
468 PVDIOCTX pIoCtx;
469} VDIOCTXDEFERRED, *PVDIOCTXDEFERRED;
470
471/**
472 * I/O task.
473 */
474typedef struct VDIOTASK
475{
476 /** Next I/O task waiting in the list. */
477 struct VDIOTASK * volatile pNext;
478 /** Storage this task belongs to. */
479 PVDIOSTORAGE pIoStorage;
480 /** Optional completion callback. */
481 PFNVDXFERCOMPLETED pfnComplete;
482 /** Opaque user data. */
483 void *pvUser;
484 /** Completion status code for the task. */
485 int rcReq;
486 /** Flag whether this is a meta data transfer. */
487 bool fMeta;
488 /** Type dependent data. */
489 union
490 {
491 /** User data transfer. */
492 struct
493 {
494 /** Number of bytes this task transferred. */
495 uint32_t cbTransfer;
496 /** Pointer to the I/O context the task belongs. */
497 PVDIOCTX pIoCtx;
498 } User;
499 /** Meta data transfer. */
500 struct
501 {
502 /** Meta transfer this task is for. */
503 PVDMETAXFER pMetaXfer;
504 } Meta;
505 } Type;
506} VDIOTASK;
507
508/**
509 * Storage handle.
510 */
511typedef struct VDIOSTORAGE
512{
513 /** Image I/O state this storage handle belongs to. */
514 PVDIO pVDIo;
515 /** AVL tree for pending async metadata transfers. */
516 PAVLRFOFFTREE pTreeMetaXfers;
517 /** Storage handle */
518 void *pStorage;
519} VDIOSTORAGE;
520
521/**
522 * Metadata transfer.
523 *
524 * @note This entry can't be freed if either the list is not empty or
525 * the reference counter is not 0.
526 * The assumption is that the backends don't need to read huge amounts of
527 * metadata to complete a transfer so the additional memory overhead should
528 * be relatively small.
529 */
530typedef struct VDMETAXFER
531{
532 /** AVL core for fast search (the file offset is the key) */
533 AVLRFOFFNODECORE Core;
534 /** I/O storage for this transfer. */
535 PVDIOSTORAGE pIoStorage;
536 /** Flags. */
537 uint32_t fFlags;
538 /** List of I/O contexts waiting for this metadata transfer to complete. */
539 RTLISTNODE ListIoCtxWaiting;
540 /** Number of references to this entry. */
541 unsigned cRefs;
542 /** Size of the data stored with this entry. */
543 size_t cbMeta;
544 /** Data stored - variable size. */
545 uint8_t abData[1];
546} VDMETAXFER;
547
548/**
549 * The transfer direction for the metadata.
550 */
551#define VDMETAXFER_TXDIR_MASK 0x3
552#define VDMETAXFER_TXDIR_NONE 0x0
553#define VDMETAXFER_TXDIR_WRITE 0x1
554#define VDMETAXFER_TXDIR_READ 0x2
555#define VDMETAXFER_TXDIR_FLUSH 0x3
556#define VDMETAXFER_TXDIR_GET(flags) ((flags) & VDMETAXFER_TXDIR_MASK)
557#define VDMETAXFER_TXDIR_SET(flags, dir) ((flags) = (flags & ~VDMETAXFER_TXDIR_MASK) | (dir))
558
559extern VBOXHDDBACKEND g_RawBackend;
560extern VBOXHDDBACKEND g_VmdkBackend;
561extern VBOXHDDBACKEND g_VDIBackend;
562extern VBOXHDDBACKEND g_VhdBackend;
563extern VBOXHDDBACKEND g_ParallelsBackend;
564extern VBOXHDDBACKEND g_DmgBackend;
565extern VBOXHDDBACKEND g_ISCSIBackend;
566extern VBOXHDDBACKEND g_QedBackend;
567extern VBOXHDDBACKEND g_QCowBackend;
568extern VBOXHDDBACKEND g_VhdxBackend;
569
570static unsigned g_cBackends = 0;
571static PVBOXHDDBACKEND *g_apBackends = NULL;
572static PVBOXHDDBACKEND aStaticBackends[] =
573{
574 &g_VmdkBackend,
575 &g_VDIBackend,
576 &g_VhdBackend,
577 &g_ParallelsBackend,
578 &g_DmgBackend,
579 &g_QedBackend,
580 &g_QCowBackend,
581 &g_VhdxBackend,
582 &g_RawBackend,
583 &g_ISCSIBackend
584};
585
586/**
587 * Supported backends for the disk cache.
588 */
589extern VDCACHEBACKEND g_VciCacheBackend;
590
591static unsigned g_cCacheBackends = 0;
592static PVDCACHEBACKEND *g_apCacheBackends = NULL;
593static PVDCACHEBACKEND aStaticCacheBackends[] =
594{
595 &g_VciCacheBackend
596};
597
598/** Forward declaration of the async discard helper. */
599static int vdDiscardHelperAsync(PVDIOCTX pIoCtx);
600static int vdWriteHelperAsync(PVDIOCTX pIoCtx);
601static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk);
602static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc);
603static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq);
604
605/**
606 * internal: add several backends.
607 */
608static int vdAddBackends(PVBOXHDDBACKEND *ppBackends, unsigned cBackends)
609{
610 PVBOXHDDBACKEND *pTmp = (PVBOXHDDBACKEND*)RTMemRealloc(g_apBackends,
611 (g_cBackends + cBackends) * sizeof(PVBOXHDDBACKEND));
612 if (RT_UNLIKELY(!pTmp))
613 return VERR_NO_MEMORY;
614 g_apBackends = pTmp;
615 memcpy(&g_apBackends[g_cBackends], ppBackends, cBackends * sizeof(PVBOXHDDBACKEND));
616 g_cBackends += cBackends;
617 return VINF_SUCCESS;
618}
619
620/**
621 * internal: add single backend.
622 */
623DECLINLINE(int) vdAddBackend(PVBOXHDDBACKEND pBackend)
624{
625 return vdAddBackends(&pBackend, 1);
626}
627
628/**
629 * internal: add several cache backends.
630 */
631static int vdAddCacheBackends(PVDCACHEBACKEND *ppBackends, unsigned cBackends)
632{
633 PVDCACHEBACKEND *pTmp = (PVDCACHEBACKEND*)RTMemRealloc(g_apCacheBackends,
634 (g_cCacheBackends + cBackends) * sizeof(PVDCACHEBACKEND));
635 if (RT_UNLIKELY(!pTmp))
636 return VERR_NO_MEMORY;
637 g_apCacheBackends = pTmp;
638 memcpy(&g_apCacheBackends[g_cCacheBackends], ppBackends, cBackends * sizeof(PVDCACHEBACKEND));
639 g_cCacheBackends += cBackends;
640 return VINF_SUCCESS;
641}
642
643/**
644 * internal: add single cache backend.
645 */
646DECLINLINE(int) vdAddCacheBackend(PVDCACHEBACKEND pBackend)
647{
648 return vdAddCacheBackends(&pBackend, 1);
649}
650
651/**
652 * internal: issue error message.
653 */
654static int vdError(PVBOXHDD pDisk, int rc, RT_SRC_POS_DECL,
655 const char *pszFormat, ...)
656{
657 va_list va;
658 va_start(va, pszFormat);
659 if (pDisk->pInterfaceError)
660 pDisk->pInterfaceError->pfnError(pDisk->pInterfaceError->Core.pvUser, rc, RT_SRC_POS_ARGS, pszFormat, va);
661 va_end(va);
662 return rc;
663}
664
665/**
666 * internal: thread synchronization, start read.
667 */
668DECLINLINE(int) vdThreadStartRead(PVBOXHDD pDisk)
669{
670 int rc = VINF_SUCCESS;
671 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
672 rc = pDisk->pInterfaceThreadSync->pfnStartRead(pDisk->pInterfaceThreadSync->Core.pvUser);
673 return rc;
674}
675
676/**
677 * internal: thread synchronization, finish read.
678 */
679DECLINLINE(int) vdThreadFinishRead(PVBOXHDD pDisk)
680{
681 int rc = VINF_SUCCESS;
682 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
683 rc = pDisk->pInterfaceThreadSync->pfnFinishRead(pDisk->pInterfaceThreadSync->Core.pvUser);
684 return rc;
685}
686
687/**
688 * internal: thread synchronization, start write.
689 */
690DECLINLINE(int) vdThreadStartWrite(PVBOXHDD pDisk)
691{
692 int rc = VINF_SUCCESS;
693 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
694 rc = pDisk->pInterfaceThreadSync->pfnStartWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
695 return rc;
696}
697
698/**
699 * internal: thread synchronization, finish write.
700 */
701DECLINLINE(int) vdThreadFinishWrite(PVBOXHDD pDisk)
702{
703 int rc = VINF_SUCCESS;
704 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
705 rc = pDisk->pInterfaceThreadSync->pfnFinishWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
706 return rc;
707}
708
709/**
710 * internal: find image format backend.
711 */
712static int vdFindBackend(const char *pszBackend, PCVBOXHDDBACKEND *ppBackend)
713{
714 int rc = VINF_SUCCESS;
715 PCVBOXHDDBACKEND pBackend = NULL;
716
717 if (!g_apBackends)
718 VDInit();
719
720 for (unsigned i = 0; i < g_cBackends; i++)
721 {
722 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
723 {
724 pBackend = g_apBackends[i];
725 break;
726 }
727 }
728 *ppBackend = pBackend;
729 return rc;
730}
731
732/**
733 * internal: find cache format backend.
734 */
735static int vdFindCacheBackend(const char *pszBackend, PCVDCACHEBACKEND *ppBackend)
736{
737 int rc = VINF_SUCCESS;
738 PCVDCACHEBACKEND pBackend = NULL;
739
740 if (!g_apCacheBackends)
741 VDInit();
742
743 for (unsigned i = 0; i < g_cCacheBackends; i++)
744 {
745 if (!RTStrICmp(pszBackend, g_apCacheBackends[i]->pszBackendName))
746 {
747 pBackend = g_apCacheBackends[i];
748 break;
749 }
750 }
751 *ppBackend = pBackend;
752 return rc;
753}
754
755/**
756 * internal: add image structure to the end of images list.
757 */
758static void vdAddImageToList(PVBOXHDD pDisk, PVDIMAGE pImage)
759{
760 pImage->pPrev = NULL;
761 pImage->pNext = NULL;
762
763 if (pDisk->pBase)
764 {
765 Assert(pDisk->cImages > 0);
766 pImage->pPrev = pDisk->pLast;
767 pDisk->pLast->pNext = pImage;
768 pDisk->pLast = pImage;
769 }
770 else
771 {
772 Assert(pDisk->cImages == 0);
773 pDisk->pBase = pImage;
774 pDisk->pLast = pImage;
775 }
776
777 pDisk->cImages++;
778}
779
780/**
781 * internal: remove image structure from the images list.
782 */
783static void vdRemoveImageFromList(PVBOXHDD pDisk, PVDIMAGE pImage)
784{
785 Assert(pDisk->cImages > 0);
786
787 if (pImage->pPrev)
788 pImage->pPrev->pNext = pImage->pNext;
789 else
790 pDisk->pBase = pImage->pNext;
791
792 if (pImage->pNext)
793 pImage->pNext->pPrev = pImage->pPrev;
794 else
795 pDisk->pLast = pImage->pPrev;
796
797 pImage->pPrev = NULL;
798 pImage->pNext = NULL;
799
800 pDisk->cImages--;
801}
802
803/**
804 * internal: find image by index into the images list.
805 */
806static PVDIMAGE vdGetImageByNumber(PVBOXHDD pDisk, unsigned nImage)
807{
808 PVDIMAGE pImage = pDisk->pBase;
809 if (nImage == VD_LAST_IMAGE)
810 return pDisk->pLast;
811 while (pImage && nImage)
812 {
813 pImage = pImage->pNext;
814 nImage--;
815 }
816 return pImage;
817}
818
819/**
820 * Initialize the structure members of a given I/O context.
821 */
822DECLINLINE(void) vdIoCtxInit(PVDIOCTX pIoCtx, PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
823 uint64_t uOffset, size_t cbTransfer, PVDIMAGE pImageStart,
824 PCRTSGBUF pcSgBuf, void *pvAllocation,
825 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
826{
827 pIoCtx->pDisk = pDisk;
828 pIoCtx->enmTxDir = enmTxDir;
829 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTransfer; Assert((uint32_t)cbTransfer == cbTransfer);
830 pIoCtx->Req.Io.uOffset = uOffset;
831 pIoCtx->Req.Io.cbTransfer = cbTransfer;
832 pIoCtx->Req.Io.pImageStart = pImageStart;
833 pIoCtx->Req.Io.pImageCur = pImageStart;
834 pIoCtx->Req.Io.cbBufClear = 0;
835 pIoCtx->Req.Io.pImageParentOverride = NULL;
836 pIoCtx->cDataTransfersPending = 0;
837 pIoCtx->cMetaTransfersPending = 0;
838 pIoCtx->fComplete = false;
839 pIoCtx->fFlags = fFlags;
840 pIoCtx->pvAllocation = pvAllocation;
841 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
842 pIoCtx->pfnIoCtxTransferNext = NULL;
843 pIoCtx->rcReq = VINF_SUCCESS;
844 pIoCtx->pIoCtxParent = NULL;
845
846 /* There is no S/G list for a flush request. */
847 if ( enmTxDir != VDIOCTXTXDIR_FLUSH
848 && enmTxDir != VDIOCTXTXDIR_DISCARD)
849 RTSgBufClone(&pIoCtx->Req.Io.SgBuf, pcSgBuf);
850 else
851 memset(&pIoCtx->Req.Io.SgBuf, 0, sizeof(RTSGBUF));
852}
853
854/**
855 * Internal: Tries to read the desired range from the given cache.
856 *
857 * @returns VBox status code.
858 * @retval VERR_VD_BLOCK_FREE if the block is not in the cache.
859 * pcbRead will be set to the number of bytes not in the cache.
860 * Everything thereafter might be in the cache.
861 * @param pCache The cache to read from.
862 * @param uOffset Offset of the virtual disk to read.
863 * @param cbRead How much to read.
864 * @param pIoCtx The I/O context to read into.
865 * @param pcbRead Where to store the number of bytes actually read.
866 * On success this indicates the number of bytes read from the cache.
867 * If VERR_VD_BLOCK_FREE is returned this gives the number of bytes
868 * which are not in the cache.
869 * In both cases everything beyond this value
870 * might or might not be in the cache.
871 */
872static int vdCacheReadHelper(PVDCACHE pCache, uint64_t uOffset,
873 size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbRead)
874{
875 int rc = VINF_SUCCESS;
876
877 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbRead=%zu pcbRead=%#p\n",
878 pCache, uOffset, pIoCtx, cbRead, pcbRead));
879
880 AssertPtr(pCache);
881 AssertPtr(pcbRead);
882
883 rc = pCache->Backend->pfnRead(pCache->pBackendData, uOffset, cbRead,
884 pIoCtx, pcbRead);
885
886 LogFlowFunc(("returns rc=%Rrc pcbRead=%zu\n", rc, *pcbRead));
887 return rc;
888}
889
890/**
891 * Internal: Writes data for the given block into the cache.
892 *
893 * @returns VBox status code.
894 * @param pCache The cache to write to.
895 * @param uOffset Offset of the virtual disk to write to the cache.
896 * @param cbWrite How much to write.
897 * @param pIoCtx The I/O context to ẃrite from.
898 * @param pcbWritten How much data could be written, optional.
899 */
900static int vdCacheWriteHelper(PVDCACHE pCache, uint64_t uOffset, size_t cbWrite,
901 PVDIOCTX pIoCtx, size_t *pcbWritten)
902{
903 int rc = VINF_SUCCESS;
904
905 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbWrite=%zu pcbWritten=%#p\n",
906 pCache, uOffset, pIoCtx, cbWrite, pcbWritten));
907
908 AssertPtr(pCache);
909 AssertPtr(pIoCtx);
910 Assert(cbWrite > 0);
911
912 if (pcbWritten)
913 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
914 pIoCtx, pcbWritten);
915 else
916 {
917 size_t cbWritten = 0;
918
919 do
920 {
921 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
922 pIoCtx, &cbWritten);
923 uOffset += cbWritten;
924 cbWrite -= cbWritten;
925 } while ( cbWrite
926 && ( RT_SUCCESS(rc)
927 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
928 }
929
930 LogFlowFunc(("returns rc=%Rrc pcbWritten=%zu\n",
931 rc, pcbWritten ? *pcbWritten : cbWrite));
932 return rc;
933}
934
935/**
936 * Creates a new empty discard state.
937 *
938 * @returns Pointer to the new discard state or NULL if out of memory.
939 */
940static PVDDISCARDSTATE vdDiscardStateCreate(void)
941{
942 PVDDISCARDSTATE pDiscard = (PVDDISCARDSTATE)RTMemAllocZ(sizeof(VDDISCARDSTATE));
943
944 if (pDiscard)
945 {
946 RTListInit(&pDiscard->ListLru);
947 pDiscard->pTreeBlocks = (PAVLRU64TREE)RTMemAllocZ(sizeof(AVLRU64TREE));
948 if (!pDiscard->pTreeBlocks)
949 {
950 RTMemFree(pDiscard);
951 pDiscard = NULL;
952 }
953 }
954
955 return pDiscard;
956}
957
958/**
959 * Removes the least recently used blocks from the waiting list until
960 * the new value is reached.
961 *
962 * @returns VBox status code.
963 * @param pDisk VD disk container.
964 * @param pDiscard The discard state.
965 * @param cbDiscardingNew How many bytes should be waiting on success.
966 * The number of bytes waiting can be less.
967 */
968static int vdDiscardRemoveBlocks(PVBOXHDD pDisk, PVDDISCARDSTATE pDiscard, size_t cbDiscardingNew)
969{
970 int rc = VINF_SUCCESS;
971
972 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
973 pDisk, pDiscard, cbDiscardingNew));
974
975 while (pDiscard->cbDiscarding > cbDiscardingNew)
976 {
977 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
978
979 Assert(!RTListIsEmpty(&pDiscard->ListLru));
980
981 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
982 uint64_t offStart = pBlock->Core.Key;
983 uint32_t idxStart = 0;
984 size_t cbLeft = pBlock->cbDiscard;
985 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
986 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
987
988 while (cbLeft > 0)
989 {
990 int32_t idxEnd;
991 size_t cbThis = cbLeft;
992
993 if (fAllocated)
994 {
995 /* Check for the first unallocated bit. */
996 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
997 if (idxEnd != -1)
998 {
999 cbThis = (idxEnd - idxStart) * 512;
1000 fAllocated = false;
1001 }
1002 }
1003 else
1004 {
1005 /* Mark as unused and check for the first set bit. */
1006 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
1007 if (idxEnd != -1)
1008 cbThis = (idxEnd - idxStart) * 512;
1009
1010
1011 VDIOCTX IoCtx;
1012 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_DISCARD, 0, 0, NULL,
1013 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
1014 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData,
1015 &IoCtx, offStart, cbThis, NULL,
1016 NULL, &cbThis, NULL,
1017 VD_DISCARD_MARK_UNUSED);
1018 if (RT_FAILURE(rc))
1019 break;
1020
1021 fAllocated = true;
1022 }
1023
1024 idxStart = idxEnd;
1025 offStart += cbThis;
1026 cbLeft -= cbThis;
1027 }
1028
1029 if (RT_FAILURE(rc))
1030 break;
1031
1032 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
1033 Assert(pBlockRemove == pBlock);
1034 RTListNodeRemove(&pBlock->NodeLru);
1035
1036 pDiscard->cbDiscarding -= pBlock->cbDiscard;
1037 RTMemFree(pBlock->pbmAllocated);
1038 RTMemFree(pBlock);
1039 }
1040
1041 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
1042
1043 LogFlowFunc(("returns rc=%Rrc\n", rc));
1044 return rc;
1045}
1046
1047/**
1048 * Destroys the current discard state, writing any waiting blocks to the image.
1049 *
1050 * @returns VBox status code.
1051 * @param pDisk VD disk container.
1052 */
1053static int vdDiscardStateDestroy(PVBOXHDD pDisk)
1054{
1055 int rc = VINF_SUCCESS;
1056
1057 if (pDisk->pDiscard)
1058 {
1059 rc = vdDiscardRemoveBlocks(pDisk, pDisk->pDiscard, 0 /* Remove all blocks. */);
1060 AssertRC(rc);
1061 RTMemFree(pDisk->pDiscard->pTreeBlocks);
1062 RTMemFree(pDisk->pDiscard);
1063 pDisk->pDiscard = NULL;
1064 }
1065
1066 return rc;
1067}
1068
1069/**
1070 * Marks the given range as allocated in the image.
1071 * Required if there are discards in progress and a write to a block which can get discarded
1072 * is written to.
1073 *
1074 * @returns VBox status code.
1075 * @param pDisk VD container data.
1076 * @param uOffset First byte to mark as allocated.
1077 * @param cbRange Number of bytes to mark as allocated.
1078 */
1079static int vdDiscardSetRangeAllocated(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRange)
1080{
1081 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
1082 int rc = VINF_SUCCESS;
1083
1084 if (pDiscard)
1085 {
1086 do
1087 {
1088 size_t cbThisRange = cbRange;
1089 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64RangeGet(pDiscard->pTreeBlocks, uOffset);
1090
1091 if (pBlock)
1092 {
1093 int32_t idxStart, idxEnd;
1094
1095 Assert(!(cbThisRange % 512));
1096 Assert(!((uOffset - pBlock->Core.Key) % 512));
1097
1098 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.KeyLast - uOffset + 1);
1099
1100 idxStart = (uOffset - pBlock->Core.Key) / 512;
1101 idxEnd = idxStart + (int32_t)(cbThisRange / 512);
1102 ASMBitSetRange(pBlock->pbmAllocated, idxStart, idxEnd);
1103 }
1104 else
1105 {
1106 pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, uOffset, true);
1107 if (pBlock)
1108 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.Key - uOffset);
1109 }
1110
1111 Assert(cbRange >= cbThisRange);
1112
1113 uOffset += cbThisRange;
1114 cbRange -= cbThisRange;
1115 } while (cbRange != 0);
1116 }
1117
1118 return rc;
1119}
1120
1121DECLINLINE(PVDIOCTX) vdIoCtxAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1122 uint64_t uOffset, size_t cbTransfer,
1123 PVDIMAGE pImageStart,PCRTSGBUF pcSgBuf,
1124 void *pvAllocation, PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1125 uint32_t fFlags)
1126{
1127 PVDIOCTX pIoCtx = NULL;
1128
1129 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1130 if (RT_LIKELY(pIoCtx))
1131 {
1132 vdIoCtxInit(pIoCtx, pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1133 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1134 }
1135
1136 return pIoCtx;
1137}
1138
1139DECLINLINE(PVDIOCTX) vdIoCtxRootAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1140 uint64_t uOffset, size_t cbTransfer,
1141 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1142 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1143 void *pvUser1, void *pvUser2,
1144 void *pvAllocation,
1145 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1146 uint32_t fFlags)
1147{
1148 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1149 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1150
1151 if (RT_LIKELY(pIoCtx))
1152 {
1153 pIoCtx->pIoCtxParent = NULL;
1154 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1155 pIoCtx->Type.Root.pvUser1 = pvUser1;
1156 pIoCtx->Type.Root.pvUser2 = pvUser2;
1157 }
1158
1159 LogFlow(("Allocated root I/O context %#p\n", pIoCtx));
1160 return pIoCtx;
1161}
1162
1163DECLINLINE(PVDIOCTX) vdIoCtxDiscardAlloc(PVBOXHDD pDisk, PCRTRANGE paRanges,
1164 unsigned cRanges,
1165 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1166 void *pvUser1, void *pvUser2,
1167 void *pvAllocation,
1168 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1169 uint32_t fFlags)
1170{
1171 PVDIOCTX pIoCtx = NULL;
1172
1173 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1174 if (RT_LIKELY(pIoCtx))
1175 {
1176 pIoCtx->pIoCtxNext = NULL;
1177 pIoCtx->pDisk = pDisk;
1178 pIoCtx->enmTxDir = VDIOCTXTXDIR_DISCARD;
1179 pIoCtx->cDataTransfersPending = 0;
1180 pIoCtx->cMetaTransfersPending = 0;
1181 pIoCtx->fComplete = false;
1182 pIoCtx->fFlags = fFlags;
1183 pIoCtx->pvAllocation = pvAllocation;
1184 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1185 pIoCtx->pfnIoCtxTransferNext = NULL;
1186 pIoCtx->rcReq = VINF_SUCCESS;
1187 pIoCtx->Req.Discard.paRanges = paRanges;
1188 pIoCtx->Req.Discard.cRanges = cRanges;
1189 pIoCtx->Req.Discard.idxRange = 0;
1190 pIoCtx->Req.Discard.cbDiscardLeft = 0;
1191 pIoCtx->Req.Discard.offCur = 0;
1192 pIoCtx->Req.Discard.cbThisDiscard = 0;
1193
1194 pIoCtx->pIoCtxParent = NULL;
1195 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1196 pIoCtx->Type.Root.pvUser1 = pvUser1;
1197 pIoCtx->Type.Root.pvUser2 = pvUser2;
1198 }
1199
1200 LogFlow(("Allocated discard I/O context %#p\n", pIoCtx));
1201 return pIoCtx;
1202}
1203
1204DECLINLINE(PVDIOCTX) vdIoCtxChildAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1205 uint64_t uOffset, size_t cbTransfer,
1206 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1207 PVDIOCTX pIoCtxParent, size_t cbTransferParent,
1208 size_t cbWriteParent, void *pvAllocation,
1209 PFNVDIOCTXTRANSFER pfnIoCtxTransfer)
1210{
1211 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1212 pcSgBuf, pvAllocation, pfnIoCtxTransfer, pIoCtxParent->fFlags & ~VDIOCTX_FLAGS_DONT_FREE);
1213
1214 AssertPtr(pIoCtxParent);
1215 Assert(!pIoCtxParent->pIoCtxParent);
1216
1217 if (RT_LIKELY(pIoCtx))
1218 {
1219 pIoCtx->pIoCtxParent = pIoCtxParent;
1220 pIoCtx->Type.Child.uOffsetSaved = uOffset;
1221 pIoCtx->Type.Child.cbTransferLeftSaved = cbTransfer;
1222 pIoCtx->Type.Child.cbTransferParent = cbTransferParent;
1223 pIoCtx->Type.Child.cbWriteParent = cbWriteParent;
1224 }
1225
1226 LogFlow(("Allocated child I/O context %#p\n", pIoCtx));
1227 return pIoCtx;
1228}
1229
1230DECLINLINE(PVDIOTASK) vdIoTaskUserAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDIOCTX pIoCtx, uint32_t cbTransfer)
1231{
1232 PVDIOTASK pIoTask = NULL;
1233
1234 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1235 if (pIoTask)
1236 {
1237 pIoTask->pIoStorage = pIoStorage;
1238 pIoTask->pfnComplete = pfnComplete;
1239 pIoTask->pvUser = pvUser;
1240 pIoTask->fMeta = false;
1241 pIoTask->Type.User.cbTransfer = cbTransfer;
1242 pIoTask->Type.User.pIoCtx = pIoCtx;
1243 }
1244
1245 return pIoTask;
1246}
1247
1248DECLINLINE(PVDIOTASK) vdIoTaskMetaAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDMETAXFER pMetaXfer)
1249{
1250 PVDIOTASK pIoTask = NULL;
1251
1252 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1253 if (pIoTask)
1254 {
1255 pIoTask->pIoStorage = pIoStorage;
1256 pIoTask->pfnComplete = pfnComplete;
1257 pIoTask->pvUser = pvUser;
1258 pIoTask->fMeta = true;
1259 pIoTask->Type.Meta.pMetaXfer = pMetaXfer;
1260 }
1261
1262 return pIoTask;
1263}
1264
1265DECLINLINE(void) vdIoCtxFree(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1266{
1267 Log(("Freeing I/O context %#p\n", pIoCtx));
1268
1269 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_FREE))
1270 {
1271 if (pIoCtx->pvAllocation)
1272 RTMemFree(pIoCtx->pvAllocation);
1273#ifdef DEBUG
1274 memset(&pIoCtx->pDisk, 0xff, sizeof(void *));
1275#endif
1276 RTMemCacheFree(pDisk->hMemCacheIoCtx, pIoCtx);
1277 }
1278}
1279
1280DECLINLINE(void) vdIoTaskFree(PVBOXHDD pDisk, PVDIOTASK pIoTask)
1281{
1282//#ifdef DEBUG
1283 memset(pIoTask, 0xff, sizeof(VDIOTASK));
1284//#endif
1285 RTMemCacheFree(pDisk->hMemCacheIoTask, pIoTask);
1286}
1287
1288DECLINLINE(void) vdIoCtxChildReset(PVDIOCTX pIoCtx)
1289{
1290 AssertPtr(pIoCtx->pIoCtxParent);
1291
1292 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1293 pIoCtx->Req.Io.uOffset = pIoCtx->Type.Child.uOffsetSaved;
1294 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved;
1295 Assert((uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved == pIoCtx->Type.Child.cbTransferLeftSaved);
1296}
1297
1298DECLINLINE(PVDMETAXFER) vdMetaXferAlloc(PVDIOSTORAGE pIoStorage, uint64_t uOffset, size_t cb)
1299{
1300 PVDMETAXFER pMetaXfer = (PVDMETAXFER)RTMemAlloc(RT_OFFSETOF(VDMETAXFER, abData[cb]));
1301
1302 if (RT_LIKELY(pMetaXfer))
1303 {
1304 pMetaXfer->Core.Key = uOffset;
1305 pMetaXfer->Core.KeyLast = uOffset + cb - 1;
1306 pMetaXfer->fFlags = VDMETAXFER_TXDIR_NONE;
1307 pMetaXfer->cbMeta = cb;
1308 pMetaXfer->pIoStorage = pIoStorage;
1309 pMetaXfer->cRefs = 0;
1310 RTListInit(&pMetaXfer->ListIoCtxWaiting);
1311 }
1312 return pMetaXfer;
1313}
1314
1315DECLINLINE(void) vdIoCtxAddToWaitingList(volatile PVDIOCTX *ppList, PVDIOCTX pIoCtx)
1316{
1317 /* Put it on the waiting list. */
1318 PVDIOCTX pNext = ASMAtomicUoReadPtrT(ppList, PVDIOCTX);
1319 PVDIOCTX pHeadOld;
1320 pIoCtx->pIoCtxNext = pNext;
1321 while (!ASMAtomicCmpXchgExPtr(ppList, pIoCtx, pNext, &pHeadOld))
1322 {
1323 pNext = pHeadOld;
1324 Assert(pNext != pIoCtx);
1325 pIoCtx->pIoCtxNext = pNext;
1326 ASMNopPause();
1327 }
1328}
1329
1330DECLINLINE(void) vdIoCtxDefer(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1331{
1332 LogFlowFunc(("Deferring write pIoCtx=%#p\n", pIoCtx));
1333
1334 Assert(!pIoCtx->pIoCtxParent && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED));
1335 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1336 vdIoCtxAddToWaitingList(&pDisk->pIoCtxBlockedHead, pIoCtx);
1337}
1338
1339static size_t vdIoCtxCopy(PVDIOCTX pIoCtxDst, PVDIOCTX pIoCtxSrc, size_t cbData)
1340{
1341 return RTSgBufCopy(&pIoCtxDst->Req.Io.SgBuf, &pIoCtxSrc->Req.Io.SgBuf, cbData);
1342}
1343
1344static int vdIoCtxCmp(PVDIOCTX pIoCtx1, PVDIOCTX pIoCtx2, size_t cbData)
1345{
1346 return RTSgBufCmp(&pIoCtx1->Req.Io.SgBuf, &pIoCtx2->Req.Io.SgBuf, cbData);
1347}
1348
1349static size_t vdIoCtxCopyTo(PVDIOCTX pIoCtx, const uint8_t *pbData, size_t cbData)
1350{
1351 return RTSgBufCopyFromBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1352}
1353
1354static size_t vdIoCtxCopyFrom(PVDIOCTX pIoCtx, uint8_t *pbData, size_t cbData)
1355{
1356 return RTSgBufCopyToBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1357}
1358
1359static size_t vdIoCtxSet(PVDIOCTX pIoCtx, uint8_t ch, size_t cbData)
1360{
1361 return RTSgBufSet(&pIoCtx->Req.Io.SgBuf, ch, cbData);
1362}
1363
1364/**
1365 * Process the I/O context, core method which assumes that the I/O context
1366 * acquired the lock.
1367 *
1368 * @returns VBox status code.
1369 * @param pIoCtx I/O context to process.
1370 */
1371static int vdIoCtxProcessLocked(PVDIOCTX pIoCtx)
1372{
1373 int rc = VINF_SUCCESS;
1374
1375 VD_IS_LOCKED(pIoCtx->pDisk);
1376
1377 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
1378
1379 if ( !pIoCtx->cMetaTransfersPending
1380 && !pIoCtx->cDataTransfersPending
1381 && !pIoCtx->pfnIoCtxTransfer)
1382 {
1383 rc = VINF_VD_ASYNC_IO_FINISHED;
1384 goto out;
1385 }
1386
1387 /*
1388 * We complete the I/O context in case of an error
1389 * if there is no I/O task pending.
1390 */
1391 if ( RT_FAILURE(pIoCtx->rcReq)
1392 && !pIoCtx->cMetaTransfersPending
1393 && !pIoCtx->cDataTransfersPending)
1394 {
1395 rc = VINF_VD_ASYNC_IO_FINISHED;
1396 goto out;
1397 }
1398
1399 /* Don't change anything if there is a metadata transfer pending or we are blocked. */
1400 if ( pIoCtx->cMetaTransfersPending
1401 || (pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1402 {
1403 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1404 goto out;
1405 }
1406
1407 if (pIoCtx->pfnIoCtxTransfer)
1408 {
1409 /* Call the transfer function advancing to the next while there is no error. */
1410 while ( pIoCtx->pfnIoCtxTransfer
1411 && !pIoCtx->cMetaTransfersPending
1412 && RT_SUCCESS(rc))
1413 {
1414 LogFlowFunc(("calling transfer function %#p\n", pIoCtx->pfnIoCtxTransfer));
1415 rc = pIoCtx->pfnIoCtxTransfer(pIoCtx);
1416
1417 /* Advance to the next part of the transfer if the current one succeeded. */
1418 if (RT_SUCCESS(rc))
1419 {
1420 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
1421 pIoCtx->pfnIoCtxTransferNext = NULL;
1422 }
1423 }
1424 }
1425
1426 if ( RT_SUCCESS(rc)
1427 && !pIoCtx->cMetaTransfersPending
1428 && !pIoCtx->cDataTransfersPending)
1429 rc = VINF_VD_ASYNC_IO_FINISHED;
1430 else if ( RT_SUCCESS(rc)
1431 || rc == VERR_VD_NOT_ENOUGH_METADATA
1432 || rc == VERR_VD_IOCTX_HALT)
1433 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1434 else if ( RT_FAILURE(rc)
1435 && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
1436 && (rc != VERR_DISK_FULL))
1437 {
1438 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rc, VINF_SUCCESS);
1439 /*
1440 * The I/O context completed if we have an error and there is no data
1441 * or meta data transfer pending.
1442 */
1443 if ( !pIoCtx->cMetaTransfersPending
1444 && !pIoCtx->cDataTransfersPending)
1445 rc = VINF_VD_ASYNC_IO_FINISHED;
1446 else
1447 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1448 }
1449
1450out:
1451 LogFlowFunc(("pIoCtx=%#p rc=%Rrc cDataTransfersPending=%u cMetaTransfersPending=%u fComplete=%RTbool\n",
1452 pIoCtx, rc, pIoCtx->cDataTransfersPending, pIoCtx->cMetaTransfersPending,
1453 pIoCtx->fComplete));
1454
1455 return rc;
1456}
1457
1458/**
1459 * Processes the list of waiting I/O contexts.
1460 *
1461 * @returns VBox status code.
1462 * @param pDisk The disk structure.
1463 * @param pIoCtxRc An I/O context handle which waits on the list. When processed
1464 * The status code is returned. NULL if there is no I/O context
1465 * to return the status code for.
1466 */
1467static int vdDiskProcessWaitingIoCtx(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
1468{
1469 int rc = VINF_SUCCESS;
1470
1471 LogFlowFunc(("pDisk=%#p pIoCtxRc=%#p\n", pDisk, pIoCtxRc));
1472
1473 VD_IS_LOCKED(pDisk);
1474
1475 /* Get the waiting list and process it in FIFO order. */
1476 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHead, NULL, PVDIOCTX);
1477
1478 /* Reverse it. */
1479 PVDIOCTX pCur = pIoCtxHead;
1480 pIoCtxHead = NULL;
1481 while (pCur)
1482 {
1483 PVDIOCTX pInsert = pCur;
1484 pCur = pCur->pIoCtxNext;
1485 pInsert->pIoCtxNext = pIoCtxHead;
1486 pIoCtxHead = pInsert;
1487 }
1488
1489 /* Process now. */
1490 pCur = pIoCtxHead;
1491 while (pCur)
1492 {
1493 int rcTmp;
1494 PVDIOCTX pTmp = pCur;
1495
1496 pCur = pCur->pIoCtxNext;
1497 pTmp->pIoCtxNext = NULL;
1498
1499 /*
1500 * Need to clear the sync flag here if there is a new I/O context
1501 * with it set and the context is not given in pIoCtxRc.
1502 * This happens most likely on a different thread and that one shouldn't
1503 * process the context synchronously.
1504 *
1505 * The thread who issued the context will wait on the event semaphore
1506 * anyway which is signalled when the completion handler is called.
1507 */
1508 if ( pTmp->fFlags & VDIOCTX_FLAGS_SYNC
1509 && pTmp != pIoCtxRc)
1510 pTmp->fFlags &= ~VDIOCTX_FLAGS_SYNC;
1511
1512 rcTmp = vdIoCtxProcessLocked(pTmp);
1513 if (pTmp == pIoCtxRc)
1514 {
1515 /* The given I/O context was processed, pass the return code to the caller. */
1516 rc = rcTmp;
1517 }
1518 else if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1519 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1520 {
1521 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1522 vdThreadFinishWrite(pDisk);
1523 pTmp->Type.Root.pfnComplete(pTmp->Type.Root.pvUser1,
1524 pTmp->Type.Root.pvUser2,
1525 pTmp->rcReq);
1526 vdIoCtxFree(pDisk, pTmp);
1527 }
1528 }
1529
1530 /*
1531 * vdIoCtxProcessLocked() never returns VINF_SUCCESS.
1532 * If the status code is still set and a valid I/O context was given
1533 * it was not found on the list (another thread cleared it already).
1534 * Return I/O in progress status code in that case.
1535 */
1536 if (rc == VINF_SUCCESS && pIoCtxRc)
1537 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1538
1539 LogFlowFunc(("returns rc=%Rrc\n", rc));
1540 return rc;
1541}
1542
1543/**
1544 * Processes the list of blocked I/O contexts.
1545 *
1546 * @returns nothing.
1547 * @param pDisk The disk structure.
1548 */
1549static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk)
1550{
1551 LogFlowFunc(("pDisk=%#p\n", pDisk));
1552
1553 VD_IS_LOCKED(pDisk);
1554
1555 /* Get the waiting list and process it in FIFO order. */
1556 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxBlockedHead, NULL, PVDIOCTX);
1557
1558 /* Reverse it. */
1559 PVDIOCTX pCur = pIoCtxHead;
1560 pIoCtxHead = NULL;
1561 while (pCur)
1562 {
1563 PVDIOCTX pInsert = pCur;
1564 pCur = pCur->pIoCtxNext;
1565 pInsert->pIoCtxNext = pIoCtxHead;
1566 pIoCtxHead = pInsert;
1567 }
1568
1569 /* Process now. */
1570 pCur = pIoCtxHead;
1571 while (pCur)
1572 {
1573 int rc;
1574 PVDIOCTX pTmp = pCur;
1575
1576 pCur = pCur->pIoCtxNext;
1577 pTmp->pIoCtxNext = NULL;
1578
1579 Assert(!pTmp->pIoCtxParent);
1580 Assert(pTmp->fFlags & VDIOCTX_FLAGS_BLOCKED);
1581 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
1582
1583 rc = vdIoCtxProcessLocked(pTmp);
1584 if ( rc == VINF_VD_ASYNC_IO_FINISHED
1585 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1586 {
1587 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1588 vdThreadFinishWrite(pDisk);
1589 pTmp->Type.Root.pfnComplete(pTmp->Type.Root.pvUser1,
1590 pTmp->Type.Root.pvUser2,
1591 pTmp->rcReq);
1592 vdIoCtxFree(pDisk, pTmp);
1593 }
1594 }
1595
1596 LogFlowFunc(("returns\n"));
1597}
1598
1599/**
1600 * Processes the I/O context trying to lock the criticial section.
1601 * The context is deferred if the critical section is busy.
1602 *
1603 * @returns VBox status code.
1604 * @param pIoCtx The I/O context to process.
1605 */
1606static int vdIoCtxProcessTryLockDefer(PVDIOCTX pIoCtx)
1607{
1608 int rc = VINF_SUCCESS;
1609 PVBOXHDD pDisk = pIoCtx->pDisk;
1610
1611 Log(("Defer pIoCtx=%#p\n", pIoCtx));
1612
1613 /* Put it on the waiting list first. */
1614 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHead, pIoCtx);
1615
1616 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
1617 {
1618 /* Leave it again, the context will be processed just before leaving the lock. */
1619 LogFlowFunc(("Successfully acquired the lock\n"));
1620 rc = vdDiskUnlock(pDisk, pIoCtx);
1621 }
1622 else
1623 {
1624 LogFlowFunc(("Lock is held\n"));
1625 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1626 }
1627
1628 return rc;
1629}
1630
1631/**
1632 * Process the I/O context in a synchronous manner, waiting
1633 * for it to complete.
1634 *
1635 * @returns VBox status code of the completed request.
1636 * @param pIoCtx The sync I/O context.
1637 */
1638static int vdIoCtxProcessSync(PVDIOCTX pIoCtx)
1639{
1640 int rc = VINF_SUCCESS;
1641 PVBOXHDD pDisk = pIoCtx->pDisk;
1642
1643 LogFlowFunc(("pIoCtx=%p\n", pIoCtx));
1644
1645 AssertMsg(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC,
1646 ("I/O context is not marked as synchronous\n"));
1647
1648 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
1649 if (rc == VINF_VD_ASYNC_IO_FINISHED)
1650 rc = VINF_SUCCESS;
1651
1652 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1653 {
1654 rc = RTSemEventWait(pDisk->hEventSemSyncIo, RT_INDEFINITE_WAIT);
1655 AssertRC(rc);
1656
1657 rc = pDisk->rcSync;
1658 }
1659 else /* Success or error. */
1660 {
1661 rc = pIoCtx->rcReq;
1662 vdIoCtxFree(pDisk, pIoCtx);
1663 }
1664
1665 return rc;
1666}
1667
1668DECLINLINE(bool) vdIoCtxIsDiskLockOwner(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1669{
1670 return pDisk->pIoCtxLockOwner == pIoCtx;
1671}
1672
1673static int vdIoCtxLockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1674{
1675 int rc = VINF_SUCCESS;
1676
1677 VD_IS_LOCKED(pDisk);
1678
1679 LogFlowFunc(("pDisk=%#p pIoCtx=%#p\n", pDisk, pIoCtx));
1680
1681 if (!ASMAtomicCmpXchgPtr(&pDisk->pIoCtxLockOwner, pIoCtx, NIL_VDIOCTX))
1682 {
1683 Assert(pDisk->pIoCtxLockOwner != pIoCtx); /* No nesting allowed. */
1684 vdIoCtxDefer(pDisk, pIoCtx);
1685 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1686 }
1687
1688 LogFlowFunc(("returns -> %Rrc\n", rc));
1689 return rc;
1690}
1691
1692static void vdIoCtxUnlockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx, bool fProcessBlockedReqs)
1693{
1694 LogFlowFunc(("pDisk=%#p pIoCtx=%#p fProcessBlockedReqs=%RTbool\n",
1695 pDisk, pIoCtx, fProcessBlockedReqs));
1696
1697 VD_IS_LOCKED(pDisk);
1698
1699 LogFlow(("Unlocking disk lock owner is %#p\n", pDisk->pIoCtxLockOwner));
1700 Assert(pDisk->pIoCtxLockOwner == pIoCtx);
1701 ASMAtomicXchgPtrT(&pDisk->pIoCtxLockOwner, NIL_VDIOCTX, PVDIOCTX);
1702
1703 if (fProcessBlockedReqs)
1704 {
1705 /* Process any blocked writes if the current request didn't caused another growing. */
1706 vdDiskProcessBlockedIoCtx(pDisk);
1707 }
1708
1709 LogFlowFunc(("returns\n"));
1710}
1711
1712/**
1713 * Internal: Reads a given amount of data from the image chain of the disk.
1714 **/
1715static int vdDiskReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1716 uint64_t uOffset, size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbThisRead)
1717{
1718 int rc = VINF_SUCCESS;
1719 size_t cbThisRead = cbRead;
1720
1721 AssertPtr(pcbThisRead);
1722
1723 *pcbThisRead = 0;
1724
1725 /*
1726 * Try to read from the given image.
1727 * If the block is not allocated read from override chain if present.
1728 */
1729 rc = pImage->Backend->pfnRead(pImage->pBackendData,
1730 uOffset, cbThisRead, pIoCtx,
1731 &cbThisRead);
1732
1733 if (rc == VERR_VD_BLOCK_FREE)
1734 {
1735 for (PVDIMAGE pCurrImage = pImageParentOverride ? pImageParentOverride : pImage->pPrev;
1736 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
1737 pCurrImage = pCurrImage->pPrev)
1738 {
1739 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1740 uOffset, cbThisRead, pIoCtx,
1741 &cbThisRead);
1742 }
1743 }
1744
1745 if (RT_SUCCESS(rc) || rc == VERR_VD_BLOCK_FREE)
1746 *pcbThisRead = cbThisRead;
1747
1748 return rc;
1749}
1750
1751/**
1752 * internal: read the specified amount of data in whatever blocks the backend
1753 * will give us - async version.
1754 */
1755static int vdReadHelperAsync(PVDIOCTX pIoCtx)
1756{
1757 int rc;
1758 PVBOXHDD pDisk = pIoCtx->pDisk;
1759 size_t cbToRead = pIoCtx->Req.Io.cbTransfer;
1760 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
1761 PVDIMAGE pCurrImage = pIoCtx->Req.Io.pImageCur;
1762 PVDIMAGE pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
1763 unsigned cImagesRead = pIoCtx->Req.Io.cImagesRead;
1764 size_t cbThisRead;
1765
1766 /* Loop until all reads started or we have a backend which needs to read metadata. */
1767 do
1768 {
1769 /* Search for image with allocated block. Do not attempt to read more
1770 * than the previous reads marked as valid. Otherwise this would return
1771 * stale data when different block sizes are used for the images. */
1772 cbThisRead = cbToRead;
1773
1774 if ( pDisk->pCache
1775 && !pImageParentOverride)
1776 {
1777 rc = vdCacheReadHelper(pDisk->pCache, uOffset, cbThisRead,
1778 pIoCtx, &cbThisRead);
1779 if (rc == VERR_VD_BLOCK_FREE)
1780 {
1781 rc = vdDiskReadHelper(pDisk, pCurrImage, NULL, uOffset, cbThisRead,
1782 pIoCtx, &cbThisRead);
1783
1784 /* If the read was successful, write the data back into the cache. */
1785 if ( RT_SUCCESS(rc)
1786 && pIoCtx->fFlags & VDIOCTX_FLAGS_READ_UPDATE_CACHE)
1787 {
1788 rc = vdCacheWriteHelper(pDisk->pCache, uOffset, cbThisRead,
1789 pIoCtx, NULL);
1790 }
1791 }
1792 }
1793 else
1794 {
1795
1796 /*
1797 * Try to read from the given image.
1798 * If the block is not allocated read from override chain if present.
1799 */
1800 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1801 uOffset, cbThisRead, pIoCtx,
1802 &cbThisRead);
1803
1804 if ( rc == VERR_VD_BLOCK_FREE
1805 && cImagesRead != 1)
1806 {
1807 unsigned cImagesToProcess = cImagesRead;
1808
1809 pCurrImage = pImageParentOverride ? pImageParentOverride : pCurrImage->pPrev;
1810 pIoCtx->Req.Io.pImageParentOverride = NULL;
1811
1812 while (pCurrImage && rc == VERR_VD_BLOCK_FREE)
1813 {
1814 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1815 uOffset, cbThisRead,
1816 pIoCtx, &cbThisRead);
1817 if (cImagesToProcess == 1)
1818 break;
1819 else if (cImagesToProcess > 0)
1820 cImagesToProcess--;
1821
1822 if (rc == VERR_VD_BLOCK_FREE)
1823 pCurrImage = pCurrImage->pPrev;
1824 }
1825 }
1826 }
1827
1828 /* The task state will be updated on success already, don't do it here!. */
1829 if (rc == VERR_VD_BLOCK_FREE)
1830 {
1831 /* No image in the chain contains the data for the block. */
1832 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisRead); Assert(cbThisRead == (uint32_t)cbThisRead);
1833
1834 /* Fill the free space with 0 if we are told to do so
1835 * or a previous read returned valid data. */
1836 if (pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS)
1837 vdIoCtxSet(pIoCtx, '\0', cbThisRead);
1838 else
1839 pIoCtx->Req.Io.cbBufClear += cbThisRead;
1840
1841 if (pIoCtx->Req.Io.pImageCur->uOpenFlags & VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS)
1842 rc = VINF_VD_NEW_ZEROED_BLOCK;
1843 else
1844 rc = VINF_SUCCESS;
1845 }
1846 else if (rc == VERR_VD_IOCTX_HALT)
1847 {
1848 uOffset += cbThisRead;
1849 cbToRead -= cbThisRead;
1850 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1851 }
1852 else if ( RT_SUCCESS(rc)
1853 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1854 {
1855 /* First not free block, fill the space before with 0. */
1856 if ( pIoCtx->Req.Io.cbBufClear
1857 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
1858 {
1859 RTSGBUF SgBuf;
1860 RTSgBufClone(&SgBuf, &pIoCtx->Req.Io.SgBuf);
1861 RTSgBufReset(&SgBuf);
1862 RTSgBufSet(&SgBuf, 0, pIoCtx->Req.Io.cbBufClear);
1863 pIoCtx->Req.Io.cbBufClear = 0;
1864 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
1865 }
1866 rc = VINF_SUCCESS;
1867 }
1868
1869 if (RT_FAILURE(rc))
1870 break;
1871
1872 cbToRead -= cbThisRead;
1873 uOffset += cbThisRead;
1874 pCurrImage = pIoCtx->Req.Io.pImageStart; /* Start with the highest image in the chain. */
1875 } while (cbToRead != 0 && RT_SUCCESS(rc));
1876
1877 if ( rc == VERR_VD_NOT_ENOUGH_METADATA
1878 || rc == VERR_VD_IOCTX_HALT)
1879 {
1880 /* Save the current state. */
1881 pIoCtx->Req.Io.uOffset = uOffset;
1882 pIoCtx->Req.Io.cbTransfer = cbToRead;
1883 pIoCtx->Req.Io.pImageCur = pCurrImage ? pCurrImage : pIoCtx->Req.Io.pImageStart;
1884 }
1885
1886 return (!(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
1887 ? VERR_VD_BLOCK_FREE
1888 : rc;
1889}
1890
1891/**
1892 * internal: parent image read wrapper for compacting.
1893 */
1894static int vdParentRead(void *pvUser, uint64_t uOffset, void *pvBuf,
1895 size_t cbRead)
1896{
1897 PVDPARENTSTATEDESC pParentState = (PVDPARENTSTATEDESC)pvUser;
1898
1899 /** @todo
1900 * Only used for compaction so far which is not possible to mix with async I/O.
1901 * Needs to be changed if we want to support online compaction of images.
1902 */
1903 bool fLocked = ASMAtomicXchgBool(&pParentState->pDisk->fLocked, true);
1904 AssertMsgReturn(!fLocked,
1905 ("Calling synchronous parent read while another thread holds the disk lock\n"),
1906 VERR_VD_INVALID_STATE);
1907
1908 /* Fake an I/O context. */
1909 RTSGSEG Segment;
1910 RTSGBUF SgBuf;
1911 VDIOCTX IoCtx;
1912
1913 Segment.pvSeg = pvBuf;
1914 Segment.cbSeg = cbRead;
1915 RTSgBufInit(&SgBuf, &Segment, 1);
1916 vdIoCtxInit(&IoCtx, pParentState->pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pParentState->pImage,
1917 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
1918 int rc = vdReadHelperAsync(&IoCtx);
1919 ASMAtomicXchgBool(&pParentState->pDisk->fLocked, false);
1920 return rc;
1921}
1922
1923/**
1924 * Extended version of vdReadHelper(), implementing certain optimizations
1925 * for image cloning.
1926 *
1927 * @returns VBox status code.
1928 * @param pDisk The disk to read from.
1929 * @param pImage The image to start reading from.
1930 * @param pImageParentOverride The parent image to read from
1931 * if the starting image returns a free block.
1932 * If NULL is passed the real parent of the image
1933 * in the chain is used.
1934 * @param uOffset Offset in the disk to start reading from.
1935 * @param pvBuf Where to store the read data.
1936 * @param cbRead How much to read.
1937 * @param fZeroFreeBlocks Flag whether free blocks should be zeroed.
1938 * If false and no image has data for sepcified
1939 * range VERR_VD_BLOCK_FREE is returned.
1940 * Note that unallocated blocks are still zeroed
1941 * if at least one image has valid data for a part
1942 * of the range.
1943 * @param fUpdateCache Flag whether to update the attached cache if
1944 * available.
1945 * @param cImagesRead Number of images in the chain to read until
1946 * the read is cut off. A value of 0 disables the cut off.
1947 */
1948static int vdReadHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1949 uint64_t uOffset, void *pvBuf, size_t cbRead,
1950 bool fZeroFreeBlocks, bool fUpdateCache, unsigned cImagesRead)
1951{
1952 uint32_t fFlags = VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
1953 RTSGSEG Segment;
1954 RTSGBUF SgBuf;
1955 VDIOCTX IoCtx;
1956
1957 if (fZeroFreeBlocks)
1958 fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
1959 if (fUpdateCache)
1960 fFlags |= VDIOCTX_FLAGS_READ_UPDATE_CACHE;
1961
1962 Segment.pvSeg = pvBuf;
1963 Segment.cbSeg = cbRead;
1964 RTSgBufInit(&SgBuf, &Segment, 1);
1965 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pImage, &SgBuf,
1966 NULL, vdReadHelperAsync, fFlags);
1967
1968 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
1969 IoCtx.Req.Io.cImagesRead = cImagesRead;
1970 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
1971 IoCtx.Type.Root.pvUser1 = pDisk;
1972 IoCtx.Type.Root.pvUser2 = NULL;
1973 return vdIoCtxProcessSync(&IoCtx);
1974}
1975
1976/**
1977 * internal: read the specified amount of data in whatever blocks the backend
1978 * will give us.
1979 */
1980static int vdReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
1981 void *pvBuf, size_t cbRead, bool fUpdateCache)
1982{
1983 return vdReadHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbRead,
1984 true /* fZeroFreeBlocks */, fUpdateCache, 0);
1985}
1986
1987/**
1988 * internal: mark the disk as not modified.
1989 */
1990static void vdResetModifiedFlag(PVBOXHDD pDisk)
1991{
1992 if (pDisk->uModified & VD_IMAGE_MODIFIED_FLAG)
1993 {
1994 /* generate new last-modified uuid */
1995 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
1996 {
1997 RTUUID Uuid;
1998
1999 RTUuidCreate(&Uuid);
2000 pDisk->pLast->Backend->pfnSetModificationUuid(pDisk->pLast->pBackendData,
2001 &Uuid);
2002
2003 if (pDisk->pCache)
2004 pDisk->pCache->Backend->pfnSetModificationUuid(pDisk->pCache->pBackendData,
2005 &Uuid);
2006 }
2007
2008 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FLAG;
2009 }
2010}
2011
2012/**
2013 * internal: mark the disk as modified.
2014 */
2015static void vdSetModifiedFlag(PVBOXHDD pDisk)
2016{
2017 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2018 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2019 {
2020 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2021
2022 /* First modify, so create a UUID and ensure it's written to disk. */
2023 vdResetModifiedFlag(pDisk);
2024
2025 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2026 {
2027 VDIOCTX IoCtx;
2028 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, NULL,
2029 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2030 pDisk->pLast->Backend->pfnFlush(pDisk->pLast->pBackendData, &IoCtx);
2031 }
2032 }
2033}
2034
2035/**
2036 * internal: write buffer to the image, taking care of block boundaries and
2037 * write optimizations.
2038 */
2039static int vdWriteHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage,
2040 PVDIMAGE pImageParentOverride, uint64_t uOffset,
2041 const void *pvBuf, size_t cbWrite,
2042 uint32_t fFlags, unsigned cImagesRead)
2043{
2044 RTSGSEG Segment;
2045 RTSGBUF SgBuf;
2046 VDIOCTX IoCtx;
2047
2048 fFlags |= VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2049
2050 Segment.pvSeg = (void *)pvBuf;
2051 Segment.cbSeg = cbWrite;
2052 RTSgBufInit(&SgBuf, &Segment, 1);
2053 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_WRITE, uOffset, cbWrite, pImage, &SgBuf,
2054 NULL, vdWriteHelperAsync, fFlags);
2055
2056 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2057 IoCtx.Req.Io.cImagesRead = cImagesRead;
2058 IoCtx.pIoCtxParent = NULL;
2059 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2060 IoCtx.Type.Root.pvUser1 = pDisk;
2061 IoCtx.Type.Root.pvUser2 = NULL;
2062 return vdIoCtxProcessSync(&IoCtx);
2063}
2064
2065/**
2066 * internal: write buffer to the image, taking care of block boundaries and
2067 * write optimizations.
2068 */
2069static int vdWriteHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
2070 const void *pvBuf, size_t cbWrite, uint32_t fFlags)
2071{
2072 return vdWriteHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbWrite,
2073 fFlags, 0);
2074}
2075
2076/**
2077 * Internal: Copies the content of one disk to another one applying optimizations
2078 * to speed up the copy process if possible.
2079 */
2080static int vdCopyHelper(PVBOXHDD pDiskFrom, PVDIMAGE pImageFrom, PVBOXHDD pDiskTo,
2081 uint64_t cbSize, unsigned cImagesFromRead, unsigned cImagesToRead,
2082 bool fSuppressRedundantIo, PVDINTERFACEPROGRESS pIfProgress,
2083 PVDINTERFACEPROGRESS pDstIfProgress)
2084{
2085 int rc = VINF_SUCCESS;
2086 int rc2;
2087 uint64_t uOffset = 0;
2088 uint64_t cbRemaining = cbSize;
2089 void *pvBuf = NULL;
2090 bool fLockReadFrom = false;
2091 bool fLockWriteTo = false;
2092 bool fBlockwiseCopy = fSuppressRedundantIo || (cImagesFromRead > 0);
2093 unsigned uProgressOld = 0;
2094
2095 LogFlowFunc(("pDiskFrom=%#p pImageFrom=%#p pDiskTo=%#p cbSize=%llu cImagesFromRead=%u cImagesToRead=%u fSuppressRedundantIo=%RTbool pIfProgress=%#p pDstIfProgress=%#p\n",
2096 pDiskFrom, pImageFrom, pDiskTo, cbSize, cImagesFromRead, cImagesToRead, fSuppressRedundantIo, pDstIfProgress, pDstIfProgress));
2097
2098 /* Allocate tmp buffer. */
2099 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
2100 if (!pvBuf)
2101 return rc;
2102
2103 do
2104 {
2105 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
2106
2107 /* Note that we don't attempt to synchronize cross-disk accesses.
2108 * It wouldn't be very difficult to do, just the lock order would
2109 * need to be defined somehow to prevent deadlocks. Postpone such
2110 * magic as there is no use case for this. */
2111
2112 rc2 = vdThreadStartRead(pDiskFrom);
2113 AssertRC(rc2);
2114 fLockReadFrom = true;
2115
2116 if (fBlockwiseCopy)
2117 {
2118 RTSGSEG SegmentBuf;
2119 RTSGBUF SgBuf;
2120 VDIOCTX IoCtx;
2121
2122 SegmentBuf.pvSeg = pvBuf;
2123 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
2124 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
2125 vdIoCtxInit(&IoCtx, pDiskFrom, VDIOCTXTXDIR_READ, 0, 0, NULL,
2126 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2127
2128 /* Read the source data. */
2129 rc = pImageFrom->Backend->pfnRead(pImageFrom->pBackendData,
2130 uOffset, cbThisRead, &IoCtx,
2131 &cbThisRead);
2132
2133 if ( rc == VERR_VD_BLOCK_FREE
2134 && cImagesFromRead != 1)
2135 {
2136 unsigned cImagesToProcess = cImagesFromRead;
2137
2138 for (PVDIMAGE pCurrImage = pImageFrom->pPrev;
2139 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
2140 pCurrImage = pCurrImage->pPrev)
2141 {
2142 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2143 uOffset, cbThisRead,
2144 &IoCtx, &cbThisRead);
2145 if (cImagesToProcess == 1)
2146 break;
2147 else if (cImagesToProcess > 0)
2148 cImagesToProcess--;
2149 }
2150 }
2151 }
2152 else
2153 rc = vdReadHelper(pDiskFrom, pImageFrom, uOffset, pvBuf, cbThisRead,
2154 false /* fUpdateCache */);
2155
2156 if (RT_FAILURE(rc) && rc != VERR_VD_BLOCK_FREE)
2157 break;
2158
2159 rc2 = vdThreadFinishRead(pDiskFrom);
2160 AssertRC(rc2);
2161 fLockReadFrom = false;
2162
2163 if (rc != VERR_VD_BLOCK_FREE)
2164 {
2165 rc2 = vdThreadStartWrite(pDiskTo);
2166 AssertRC(rc2);
2167 fLockWriteTo = true;
2168
2169 /* Only do collapsed I/O if we are copying the data blockwise. */
2170 rc = vdWriteHelperEx(pDiskTo, pDiskTo->pLast, NULL, uOffset, pvBuf,
2171 cbThisRead, VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG /* fFlags */,
2172 fBlockwiseCopy ? cImagesToRead : 0);
2173 if (RT_FAILURE(rc))
2174 break;
2175
2176 rc2 = vdThreadFinishWrite(pDiskTo);
2177 AssertRC(rc2);
2178 fLockWriteTo = false;
2179 }
2180 else /* Don't propagate the error to the outside */
2181 rc = VINF_SUCCESS;
2182
2183 uOffset += cbThisRead;
2184 cbRemaining -= cbThisRead;
2185
2186 unsigned uProgressNew = uOffset * 99 / cbSize;
2187 if (uProgressNew != uProgressOld)
2188 {
2189 uProgressOld = uProgressNew;
2190
2191 if (pIfProgress && pIfProgress->pfnProgress)
2192 {
2193 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
2194 uProgressOld);
2195 if (RT_FAILURE(rc))
2196 break;
2197 }
2198 if (pDstIfProgress && pDstIfProgress->pfnProgress)
2199 {
2200 rc = pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser,
2201 uProgressOld);
2202 if (RT_FAILURE(rc))
2203 break;
2204 }
2205 }
2206 } while (uOffset < cbSize);
2207
2208 RTMemFree(pvBuf);
2209
2210 if (fLockReadFrom)
2211 {
2212 rc2 = vdThreadFinishRead(pDiskFrom);
2213 AssertRC(rc2);
2214 }
2215
2216 if (fLockWriteTo)
2217 {
2218 rc2 = vdThreadFinishWrite(pDiskTo);
2219 AssertRC(rc2);
2220 }
2221
2222 LogFlowFunc(("returns rc=%Rrc\n", rc));
2223 return rc;
2224}
2225
2226/**
2227 * Flush helper async version.
2228 */
2229static int vdSetModifiedHelperAsync(PVDIOCTX pIoCtx)
2230{
2231 int rc = VINF_SUCCESS;
2232 PVBOXHDD pDisk = pIoCtx->pDisk;
2233 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2234
2235 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2236 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2237 rc = VINF_SUCCESS;
2238
2239 return rc;
2240}
2241
2242/**
2243 * internal: mark the disk as modified - async version.
2244 */
2245static int vdSetModifiedFlagAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
2246{
2247 int rc = VINF_SUCCESS;
2248
2249 VD_IS_LOCKED(pDisk);
2250
2251 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2252 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2253 {
2254 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2255 if (RT_SUCCESS(rc))
2256 {
2257 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2258
2259 /* First modify, so create a UUID and ensure it's written to disk. */
2260 vdResetModifiedFlag(pDisk);
2261
2262 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2263 {
2264 PVDIOCTX pIoCtxFlush = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_FLUSH,
2265 0, 0, pDisk->pLast,
2266 NULL, pIoCtx, 0, 0, NULL,
2267 vdSetModifiedHelperAsync);
2268
2269 if (pIoCtxFlush)
2270 {
2271 rc = vdIoCtxProcessLocked(pIoCtxFlush);
2272 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2273 {
2274 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs */);
2275 vdIoCtxFree(pDisk, pIoCtxFlush);
2276 }
2277 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2278 {
2279 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2280 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2281 }
2282 else /* Another error */
2283 vdIoCtxFree(pDisk, pIoCtxFlush);
2284 }
2285 else
2286 rc = VERR_NO_MEMORY;
2287 }
2288 }
2289 }
2290
2291 return rc;
2292}
2293
2294static int vdWriteHelperCommitAsync(PVDIOCTX pIoCtx)
2295{
2296 int rc = VINF_SUCCESS;
2297 PVDIMAGE pImage = pIoCtx->Req.Io.pImageStart;
2298 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2299 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2300 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2301
2302 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2303 rc = pImage->Backend->pfnWrite(pImage->pBackendData,
2304 pIoCtx->Req.Io.uOffset - cbPreRead,
2305 cbPreRead + cbThisWrite + cbPostRead,
2306 pIoCtx, NULL, &cbPreRead, &cbPostRead, 0);
2307 Assert(rc != VERR_VD_BLOCK_FREE);
2308 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPreRead == 0);
2309 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPostRead == 0);
2310 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2311 rc = VINF_SUCCESS;
2312 else if (rc == VERR_VD_IOCTX_HALT)
2313 {
2314 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2315 rc = VINF_SUCCESS;
2316 }
2317
2318 LogFlowFunc(("returns rc=%Rrc\n", rc));
2319 return rc;
2320}
2321
2322static int vdWriteHelperOptimizedCmpAndWriteAsync(PVDIOCTX pIoCtx)
2323{
2324 int rc = VINF_SUCCESS;
2325 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2326 size_t cbThisWrite = 0;
2327 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2328 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2329 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2330 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2331 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2332 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2333
2334 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2335
2336 AssertPtr(pIoCtxParent);
2337 Assert(!pIoCtxParent->pIoCtxParent);
2338 Assert(!pIoCtx->Req.Io.cbTransferLeft && !pIoCtx->cMetaTransfersPending);
2339
2340 vdIoCtxChildReset(pIoCtx);
2341 cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2342 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2343
2344 /* Check if the write would modify anything in this block. */
2345 if (!RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &pIoCtxParent->Req.Io.SgBuf, cbThisWrite))
2346 {
2347 RTSGBUF SgBufSrcTmp;
2348
2349 RTSgBufClone(&SgBufSrcTmp, &pIoCtxParent->Req.Io.SgBuf);
2350 RTSgBufAdvance(&SgBufSrcTmp, cbThisWrite);
2351 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbThisWrite);
2352
2353 if (!cbWriteCopy || !RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &SgBufSrcTmp, cbWriteCopy))
2354 {
2355 /* Block is completely unchanged, so no need to write anything. */
2356 LogFlowFunc(("Block didn't changed\n"));
2357 ASMAtomicWriteU32(&pIoCtx->Req.Io.cbTransferLeft, 0);
2358 RTSgBufAdvance(&pIoCtxParent->Req.Io.SgBuf, cbThisWrite);
2359 return VINF_VD_ASYNC_IO_FINISHED;
2360 }
2361 }
2362
2363 /* Copy the data to the right place in the buffer. */
2364 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2365 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2366 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2367
2368 /* Handle the data that goes after the write to fill the block. */
2369 if (cbPostRead)
2370 {
2371 /* Now assemble the remaining data. */
2372 if (cbWriteCopy)
2373 {
2374 /*
2375 * The S/G buffer of the parent needs to be cloned because
2376 * it is not allowed to modify the state.
2377 */
2378 RTSGBUF SgBufParentTmp;
2379
2380 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2381 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2382 }
2383
2384 /* Zero out the remainder of this block. Will never be visible, as this
2385 * is beyond the limit of the image. */
2386 if (cbFill)
2387 {
2388 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbReadImage);
2389 vdIoCtxSet(pIoCtx, '\0', cbFill);
2390 }
2391 }
2392
2393 /* Write the full block to the virtual disk. */
2394 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2395 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2396
2397 return rc;
2398}
2399
2400static int vdWriteHelperOptimizedPreReadAsync(PVDIOCTX pIoCtx)
2401{
2402 int rc = VINF_SUCCESS;
2403
2404 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2405
2406 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2407
2408 if (pIoCtx->Req.Io.cbTransferLeft)
2409 rc = vdReadHelperAsync(pIoCtx);
2410
2411 if ( RT_SUCCESS(rc)
2412 && ( pIoCtx->Req.Io.cbTransferLeft
2413 || pIoCtx->cMetaTransfersPending))
2414 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2415 else
2416 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedCmpAndWriteAsync;
2417
2418 return rc;
2419}
2420
2421/**
2422 * internal: write a complete block (only used for diff images), taking the
2423 * remaining data from parent images. This implementation optimizes out writes
2424 * that do not change the data relative to the state as of the parent images.
2425 * All backends which support differential/growing images support this - async version.
2426 */
2427static int vdWriteHelperOptimizedAsync(PVDIOCTX pIoCtx)
2428{
2429 PVBOXHDD pDisk = pIoCtx->pDisk;
2430 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2431 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2432 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2433 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2434 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2435 size_t cbFill = 0;
2436 size_t cbWriteCopy = 0;
2437 size_t cbReadImage = 0;
2438
2439 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2440
2441 AssertPtr(pIoCtx->pIoCtxParent);
2442 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2443
2444 if (cbPostRead)
2445 {
2446 /* Figure out how much we cannot read from the image, because
2447 * the last block to write might exceed the nominal size of the
2448 * image for technical reasons. */
2449 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2450 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2451
2452 /* If we have data to be written, use that instead of reading
2453 * data from the image. */
2454 if (cbWrite > cbThisWrite)
2455 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2456
2457 /* The rest must be read from the image. */
2458 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2459 }
2460
2461 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2462 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2463 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2464
2465 /* Read the entire data of the block so that we can compare whether it will
2466 * be modified by the write or not. */
2467 size_t cbTmp = cbPreRead + cbThisWrite + cbPostRead - cbFill; Assert(cbTmp == (uint32_t)cbTmp);
2468 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTmp;
2469 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2470 pIoCtx->Req.Io.uOffset -= cbPreRead;
2471
2472 /* Next step */
2473 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedPreReadAsync;
2474 return VINF_SUCCESS;
2475}
2476
2477static int vdWriteHelperStandardAssemble(PVDIOCTX pIoCtx)
2478{
2479 int rc = VINF_SUCCESS;
2480 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2481 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2482 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2483
2484 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2485
2486 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2487 if (cbPostRead)
2488 {
2489 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2490 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2491 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2492
2493 /* Now assemble the remaining data. */
2494 if (cbWriteCopy)
2495 {
2496 /*
2497 * The S/G buffer of the parent needs to be cloned because
2498 * it is not allowed to modify the state.
2499 */
2500 RTSGBUF SgBufParentTmp;
2501
2502 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2503 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2504 }
2505
2506 /* Zero out the remainder of this block. Will never be visible, as this
2507 * is beyond the limit of the image. */
2508 if (cbFill)
2509 {
2510 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbReadImage);
2511 vdIoCtxSet(pIoCtx, '\0', cbFill);
2512 }
2513
2514 if (cbReadImage)
2515 {
2516 /* Read remaining data. */
2517 }
2518 else
2519 {
2520 /* Write the full block to the virtual disk. */
2521 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2522 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2523 }
2524 }
2525 else
2526 {
2527 /* Write the full block to the virtual disk. */
2528 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2529 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2530 }
2531
2532 return rc;
2533}
2534
2535static int vdWriteHelperStandardPreReadAsync(PVDIOCTX pIoCtx)
2536{
2537 int rc = VINF_SUCCESS;
2538
2539 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2540
2541 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2542
2543 if (pIoCtx->Req.Io.cbTransferLeft)
2544 rc = vdReadHelperAsync(pIoCtx);
2545
2546 if ( RT_SUCCESS(rc)
2547 && ( pIoCtx->Req.Io.cbTransferLeft
2548 || pIoCtx->cMetaTransfersPending))
2549 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2550 else
2551 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2552
2553 return rc;
2554}
2555
2556static int vdWriteHelperStandardAsync(PVDIOCTX pIoCtx)
2557{
2558 PVBOXHDD pDisk = pIoCtx->pDisk;
2559 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2560 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2561 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2562 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2563 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2564 size_t cbFill = 0;
2565 size_t cbWriteCopy = 0;
2566 size_t cbReadImage = 0;
2567
2568 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2569
2570 AssertPtr(pIoCtx->pIoCtxParent);
2571 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2572
2573 /* Calculate the amount of data to read that goes after the write to fill the block. */
2574 if (cbPostRead)
2575 {
2576 /* If we have data to be written, use that instead of reading
2577 * data from the image. */
2578 cbWriteCopy;
2579 if (cbWrite > cbThisWrite)
2580 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2581
2582 /* Figure out how much we cannot read from the image, because
2583 * the last block to write might exceed the nominal size of the
2584 * image for technical reasons. */
2585 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2586 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2587
2588 /* The rest must be read from the image. */
2589 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2590 }
2591
2592 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2593 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2594 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2595
2596 /* Next step */
2597 if (cbPreRead)
2598 {
2599 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardPreReadAsync;
2600
2601 /* Read the data that goes before the write to fill the block. */
2602 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbPreRead; Assert(cbPreRead == (uint32_t)cbPreRead);
2603 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2604 pIoCtx->Req.Io.uOffset -= cbPreRead;
2605 }
2606 else
2607 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2608
2609 return VINF_SUCCESS;
2610}
2611
2612/**
2613 * internal: write buffer to the image, taking care of block boundaries and
2614 * write optimizations - async version.
2615 */
2616static int vdWriteHelperAsync(PVDIOCTX pIoCtx)
2617{
2618 int rc;
2619 size_t cbWrite = pIoCtx->Req.Io.cbTransfer;
2620 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
2621 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2622 PVBOXHDD pDisk = pIoCtx->pDisk;
2623 unsigned fWrite;
2624 size_t cbThisWrite;
2625 size_t cbPreRead, cbPostRead;
2626
2627 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG))
2628 {
2629 rc = vdSetModifiedFlagAsync(pDisk, pIoCtx);
2630 if (RT_FAILURE(rc)) /* Includes I/O in progress. */
2631 return rc;
2632 }
2633
2634 rc = vdDiscardSetRangeAllocated(pDisk, uOffset, cbWrite);
2635 if (RT_FAILURE(rc))
2636 return rc;
2637
2638 /* Loop until all written. */
2639 do
2640 {
2641 /* Try to write the possibly partial block to the last opened image.
2642 * This works when the block is already allocated in this image or
2643 * if it is a full-block write (and allocation isn't suppressed below).
2644 * For image formats which don't support zero blocks, it's beneficial
2645 * to avoid unnecessarily allocating unchanged blocks. This prevents
2646 * unwanted expanding of images. VMDK is an example. */
2647 cbThisWrite = cbWrite;
2648 fWrite = (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2649 ? 0 : VD_WRITE_NO_ALLOC;
2650 rc = pImage->Backend->pfnWrite(pImage->pBackendData, uOffset,
2651 cbThisWrite, pIoCtx,
2652 &cbThisWrite, &cbPreRead,
2653 &cbPostRead, fWrite);
2654 if (rc == VERR_VD_BLOCK_FREE)
2655 {
2656 /* Lock the disk .*/
2657 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2658 if (RT_SUCCESS(rc))
2659 {
2660 /*
2661 * Allocate segment and buffer in one go.
2662 * A bit hackish but avoids the need to allocate memory twice.
2663 */
2664 PRTSGBUF pTmp = (PRTSGBUF)RTMemAlloc(cbPreRead + cbThisWrite + cbPostRead + sizeof(RTSGSEG) + sizeof(RTSGBUF));
2665 AssertBreakStmt(VALID_PTR(pTmp), rc = VERR_NO_MEMORY);
2666 PRTSGSEG pSeg = (PRTSGSEG)(pTmp + 1);
2667
2668 pSeg->pvSeg = pSeg + 1;
2669 pSeg->cbSeg = cbPreRead + cbThisWrite + cbPostRead;
2670 RTSgBufInit(pTmp, pSeg, 1);
2671
2672 PVDIOCTX pIoCtxWrite = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_WRITE,
2673 uOffset, pSeg->cbSeg, pImage,
2674 pTmp,
2675 pIoCtx, cbThisWrite,
2676 cbWrite,
2677 pTmp,
2678 (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2679 ? vdWriteHelperStandardAsync
2680 : vdWriteHelperOptimizedAsync);
2681 if (!VALID_PTR(pIoCtxWrite))
2682 {
2683 RTMemTmpFree(pTmp);
2684 rc = VERR_NO_MEMORY;
2685 break;
2686 }
2687
2688 LogFlowFunc(("Disk is growing because of pIoCtx=%#p pIoCtxWrite=%#p\n",
2689 pIoCtx, pIoCtxWrite));
2690
2691 pIoCtxWrite->Type.Child.cbPreRead = cbPreRead;
2692 pIoCtxWrite->Type.Child.cbPostRead = cbPostRead;
2693 pIoCtxWrite->Req.Io.pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
2694
2695 /* Process the write request */
2696 rc = vdIoCtxProcessLocked(pIoCtxWrite);
2697
2698 if (RT_FAILURE(rc) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
2699 {
2700 vdIoCtxFree(pDisk, pIoCtxWrite);
2701 break;
2702 }
2703 else if ( rc == VINF_VD_ASYNC_IO_FINISHED
2704 && ASMAtomicCmpXchgBool(&pIoCtxWrite->fComplete, true, false))
2705 {
2706 LogFlow(("Child write request completed\n"));
2707 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbThisWrite);
2708 Assert(cbThisWrite == (uint32_t)cbThisWrite);
2709 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisWrite);
2710 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs*/ );
2711 vdIoCtxFree(pDisk, pIoCtxWrite);
2712
2713 rc = VINF_SUCCESS;
2714 }
2715 else
2716 {
2717 LogFlow(("Child write pending\n"));
2718 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2719 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2720 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2721 cbWrite -= cbThisWrite;
2722 uOffset += cbThisWrite;
2723 break;
2724 }
2725 }
2726 else
2727 {
2728 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2729 break;
2730 }
2731 }
2732
2733 if (rc == VERR_VD_IOCTX_HALT)
2734 {
2735 cbWrite -= cbThisWrite;
2736 uOffset += cbThisWrite;
2737 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2738 break;
2739 }
2740 else if (rc == VERR_VD_NOT_ENOUGH_METADATA)
2741 break;
2742
2743 cbWrite -= cbThisWrite;
2744 uOffset += cbThisWrite;
2745 } while (cbWrite != 0 && (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
2746
2747 if ( rc == VERR_VD_ASYNC_IO_IN_PROGRESS
2748 || rc == VERR_VD_NOT_ENOUGH_METADATA
2749 || rc == VERR_VD_IOCTX_HALT)
2750 {
2751 /*
2752 * Tell the caller that we don't need to go back here because all
2753 * writes are initiated.
2754 */
2755 if ( !cbWrite
2756 && rc != VERR_VD_IOCTX_HALT)
2757 rc = VINF_SUCCESS;
2758
2759 pIoCtx->Req.Io.uOffset = uOffset;
2760 pIoCtx->Req.Io.cbTransfer = cbWrite;
2761 }
2762
2763 return rc;
2764}
2765
2766/**
2767 * Flush helper async version.
2768 */
2769static int vdFlushHelperAsync(PVDIOCTX pIoCtx)
2770{
2771 int rc = VINF_SUCCESS;
2772 PVBOXHDD pDisk = pIoCtx->pDisk;
2773 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2774
2775 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2776 if (RT_SUCCESS(rc))
2777 {
2778 vdResetModifiedFlag(pDisk);
2779 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2780 if ( ( RT_SUCCESS(rc)
2781 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS
2782 || rc == VERR_VD_IOCTX_HALT)
2783 && pDisk->pCache)
2784 {
2785 rc = pDisk->pCache->Backend->pfnFlush(pDisk->pCache->pBackendData, pIoCtx);
2786 if ( RT_SUCCESS(rc)
2787 || ( rc != VERR_VD_ASYNC_IO_IN_PROGRESS
2788 && rc != VERR_VD_IOCTX_HALT))
2789 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
2790 else if (rc != VERR_VD_IOCTX_HALT)
2791 rc = VINF_SUCCESS;
2792 }
2793 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2794 rc = VINF_SUCCESS;
2795 else if (rc != VERR_VD_IOCTX_HALT)/* Some other error. */
2796 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
2797 }
2798
2799 return rc;
2800}
2801
2802/**
2803 * Async discard helper - discards a whole block which is recorded in the block
2804 * tree.
2805 *
2806 * @returns VBox status code.
2807 * @param pIoCtx The I/O context to operate on.
2808 */
2809static int vdDiscardWholeBlockAsync(PVDIOCTX pIoCtx)
2810{
2811 int rc = VINF_SUCCESS;
2812 PVBOXHDD pDisk = pIoCtx->pDisk;
2813 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2814 PVDDISCARDBLOCK pBlock = pIoCtx->Req.Discard.pBlock;
2815 size_t cbPreAllocated, cbPostAllocated, cbActuallyDiscarded;
2816
2817 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2818
2819 AssertPtr(pBlock);
2820
2821 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2822 pBlock->Core.Key, pBlock->cbDiscard,
2823 &cbPreAllocated, &cbPostAllocated,
2824 &cbActuallyDiscarded, NULL, 0);
2825 Assert(rc != VERR_VD_DISCARD_ALIGNMENT_NOT_MET);
2826 Assert(!cbPreAllocated);
2827 Assert(!cbPostAllocated);
2828 Assert(cbActuallyDiscarded == pBlock->cbDiscard || RT_FAILURE(rc));
2829
2830 /* Remove the block on success. */
2831 if ( RT_SUCCESS(rc)
2832 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2833 {
2834 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
2835 Assert(pBlockRemove == pBlock);
2836
2837 pDiscard->cbDiscarding -= pBlock->cbDiscard;
2838 RTListNodeRemove(&pBlock->NodeLru);
2839 RTMemFree(pBlock->pbmAllocated);
2840 RTMemFree(pBlock);
2841 pIoCtx->Req.Discard.pBlock = NULL;/* Safety precaution. */
2842 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
2843 rc = VINF_SUCCESS;
2844 }
2845
2846 LogFlowFunc(("returns rc=%Rrc\n", rc));
2847 return rc;
2848}
2849
2850/**
2851 * Removes the least recently used blocks from the waiting list until
2852 * the new value is reached - version for async I/O.
2853 *
2854 * @returns VBox status code.
2855 * @param pDisk VD disk container.
2856 * @param pDiscard The discard state.
2857 * @param cbDiscardingNew How many bytes should be waiting on success.
2858 * The number of bytes waiting can be less.
2859 */
2860static int vdDiscardRemoveBlocksAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx, size_t cbDiscardingNew)
2861{
2862 int rc = VINF_SUCCESS;
2863 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2864
2865 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
2866 pDisk, pDiscard, cbDiscardingNew));
2867
2868 while (pDiscard->cbDiscarding > cbDiscardingNew)
2869 {
2870 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
2871
2872 Assert(!RTListIsEmpty(&pDiscard->ListLru));
2873
2874 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
2875 uint64_t offStart = pBlock->Core.Key;
2876 uint32_t idxStart = 0;
2877 size_t cbLeft = pBlock->cbDiscard;
2878 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
2879 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
2880
2881 while (cbLeft > 0)
2882 {
2883 int32_t idxEnd;
2884 size_t cbThis = cbLeft;
2885
2886 if (fAllocated)
2887 {
2888 /* Check for the first unallocated bit. */
2889 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
2890 if (idxEnd != -1)
2891 {
2892 cbThis = (idxEnd - idxStart) * 512;
2893 fAllocated = false;
2894 }
2895 }
2896 else
2897 {
2898 /* Mark as unused and check for the first set bit. */
2899 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
2900 if (idxEnd != -1)
2901 cbThis = (idxEnd - idxStart) * 512;
2902
2903 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2904 offStart, cbThis, NULL, NULL, &cbThis,
2905 NULL, VD_DISCARD_MARK_UNUSED);
2906 if ( RT_FAILURE(rc)
2907 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2908 break;
2909
2910 fAllocated = true;
2911 }
2912
2913 idxStart = idxEnd;
2914 offStart += cbThis;
2915 cbLeft -= cbThis;
2916 }
2917
2918 if ( RT_FAILURE(rc)
2919 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2920 break;
2921
2922 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
2923 Assert(pBlockRemove == pBlock);
2924 RTListNodeRemove(&pBlock->NodeLru);
2925
2926 pDiscard->cbDiscarding -= pBlock->cbDiscard;
2927 RTMemFree(pBlock->pbmAllocated);
2928 RTMemFree(pBlock);
2929 }
2930
2931 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2932 rc = VINF_SUCCESS;
2933
2934 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
2935
2936 LogFlowFunc(("returns rc=%Rrc\n", rc));
2937 return rc;
2938}
2939
2940/**
2941 * Async discard helper - discards the current range if there is no matching
2942 * block in the tree.
2943 *
2944 * @returns VBox status code.
2945 * @param pIoCtx The I/O context to operate on.
2946 */
2947static int vdDiscardCurrentRangeAsync(PVDIOCTX pIoCtx)
2948{
2949 PVBOXHDD pDisk = pIoCtx->pDisk;
2950 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2951 uint64_t offStart = pIoCtx->Req.Discard.offCur;
2952 size_t cbThisDiscard = pIoCtx->Req.Discard.cbThisDiscard;
2953 void *pbmAllocated = NULL;
2954 size_t cbPreAllocated, cbPostAllocated;
2955 int rc = VINF_SUCCESS;
2956
2957 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2958
2959 /* No block found, try to discard using the backend first. */
2960 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2961 offStart, cbThisDiscard, &cbPreAllocated,
2962 &cbPostAllocated, &cbThisDiscard,
2963 &pbmAllocated, 0);
2964 if (rc == VERR_VD_DISCARD_ALIGNMENT_NOT_MET)
2965 {
2966 /* Create new discard block. */
2967 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTMemAllocZ(sizeof(VDDISCARDBLOCK));
2968 if (pBlock)
2969 {
2970 pBlock->Core.Key = offStart - cbPreAllocated;
2971 pBlock->Core.KeyLast = offStart + cbThisDiscard + cbPostAllocated - 1;
2972 pBlock->cbDiscard = cbPreAllocated + cbThisDiscard + cbPostAllocated;
2973 pBlock->pbmAllocated = pbmAllocated;
2974 bool fInserted = RTAvlrU64Insert(pDiscard->pTreeBlocks, &pBlock->Core);
2975 Assert(fInserted);
2976
2977 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
2978 pDiscard->cbDiscarding += pBlock->cbDiscard;
2979
2980 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
2981 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
2982 pIoCtx->Req.Discard.offCur += cbThisDiscard;
2983 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
2984
2985 if (pDiscard->cbDiscarding > VD_DISCARD_REMOVE_THRESHOLD)
2986 rc = vdDiscardRemoveBlocksAsync(pDisk, pIoCtx, VD_DISCARD_REMOVE_THRESHOLD);
2987 else
2988 rc = VINF_SUCCESS;
2989
2990 if (RT_SUCCESS(rc))
2991 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
2992 }
2993 else
2994 {
2995 RTMemFree(pbmAllocated);
2996 rc = VERR_NO_MEMORY;
2997 }
2998 }
2999 else if ( RT_SUCCESS(rc)
3000 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS) /* Save state and andvance to next range. */
3001 {
3002 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3003 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3004 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3005 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3006 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3007 rc = VINF_SUCCESS;
3008 }
3009
3010 LogFlowFunc(("returns rc=%Rrc\n", rc));
3011 return rc;
3012}
3013
3014/**
3015 * Async discard helper - entry point.
3016 *
3017 * @returns VBox status code.
3018 * @param pIoCtx The I/O context to operate on.
3019 */
3020static int vdDiscardHelperAsync(PVDIOCTX pIoCtx)
3021{
3022 int rc = VINF_SUCCESS;
3023 PVBOXHDD pDisk = pIoCtx->pDisk;
3024 PCRTRANGE paRanges = pIoCtx->Req.Discard.paRanges;
3025 unsigned cRanges = pIoCtx->Req.Discard.cRanges;
3026 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3027
3028 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3029
3030 /* Check if the I/O context processed all ranges. */
3031 if ( pIoCtx->Req.Discard.idxRange == cRanges
3032 && !pIoCtx->Req.Discard.cbDiscardLeft)
3033 {
3034 LogFlowFunc(("All ranges discarded, completing\n"));
3035 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDeferredReqs*/);
3036 return VINF_SUCCESS;
3037 }
3038
3039 if (pDisk->pIoCtxLockOwner != pIoCtx)
3040 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3041
3042 if (RT_SUCCESS(rc))
3043 {
3044 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3045 size_t cbDiscardLeft = pIoCtx->Req.Discard.cbDiscardLeft;
3046 size_t cbThisDiscard;
3047
3048 if (RT_UNLIKELY(!pDiscard))
3049 {
3050 pDiscard = vdDiscardStateCreate();
3051 if (!pDiscard)
3052 return VERR_NO_MEMORY;
3053
3054 pDisk->pDiscard = pDiscard;
3055 }
3056
3057 if (!pIoCtx->Req.Discard.cbDiscardLeft)
3058 {
3059 offStart = paRanges[pIoCtx->Req.Discard.idxRange].offStart;
3060 cbDiscardLeft = paRanges[pIoCtx->Req.Discard.idxRange].cbRange;
3061 LogFlowFunc(("New range descriptor loaded (%u) offStart=%llu cbDiscard=%zu\n",
3062 pIoCtx->Req.Discard.idxRange, offStart, cbDiscardLeft));
3063 pIoCtx->Req.Discard.idxRange++;
3064 }
3065
3066 /* Look for a matching block in the AVL tree first. */
3067 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, false);
3068 if (!pBlock || pBlock->Core.KeyLast < offStart)
3069 {
3070 PVDDISCARDBLOCK pBlockAbove = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, true);
3071
3072 /* Clip range to remain in the current block. */
3073 if (pBlockAbove)
3074 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlockAbove->Core.KeyLast - offStart + 1);
3075 else
3076 cbThisDiscard = cbDiscardLeft;
3077
3078 Assert(!(cbThisDiscard % 512));
3079 pIoCtx->Req.Discard.pBlock = NULL;
3080 pIoCtx->pfnIoCtxTransferNext = vdDiscardCurrentRangeAsync;
3081 }
3082 else
3083 {
3084 /* Range lies partly in the block, update allocation bitmap. */
3085 int32_t idxStart, idxEnd;
3086
3087 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlock->Core.KeyLast - offStart + 1);
3088
3089 AssertPtr(pBlock);
3090
3091 Assert(!(cbThisDiscard % 512));
3092 Assert(!((offStart - pBlock->Core.Key) % 512));
3093
3094 idxStart = (offStart - pBlock->Core.Key) / 512;
3095 idxEnd = idxStart + (int32_t)(cbThisDiscard / 512);
3096
3097 ASMBitClearRange(pBlock->pbmAllocated, idxStart, idxEnd);
3098
3099 cbDiscardLeft -= cbThisDiscard;
3100 offStart += cbThisDiscard;
3101
3102 /* Call the backend to discard the block if it is completely unallocated now. */
3103 if (ASMBitFirstSet((volatile void *)pBlock->pbmAllocated, (uint32_t)(pBlock->cbDiscard / 512)) == -1)
3104 {
3105 pIoCtx->Req.Discard.pBlock = pBlock;
3106 pIoCtx->pfnIoCtxTransferNext = vdDiscardWholeBlockAsync;
3107 rc = VINF_SUCCESS;
3108 }
3109 else
3110 {
3111 RTListNodeRemove(&pBlock->NodeLru);
3112 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3113
3114 /* Start with next range. */
3115 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3116 rc = VINF_SUCCESS;
3117 }
3118 }
3119
3120 /* Save state in the context. */
3121 pIoCtx->Req.Discard.offCur = offStart;
3122 pIoCtx->Req.Discard.cbDiscardLeft = cbDiscardLeft;
3123 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3124 }
3125
3126 LogFlowFunc(("returns rc=%Rrc\n", rc));
3127 return rc;
3128}
3129
3130/**
3131 * internal: scans plugin directory and loads the backends have been found.
3132 */
3133static int vdLoadDynamicBackends()
3134{
3135#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3136 int rc = VINF_SUCCESS;
3137 PRTDIR pPluginDir = NULL;
3138
3139 /* Enumerate plugin backends. */
3140 char szPath[RTPATH_MAX];
3141 rc = RTPathAppPrivateArch(szPath, sizeof(szPath));
3142 if (RT_FAILURE(rc))
3143 return rc;
3144
3145 /* To get all entries with VBoxHDD as prefix. */
3146 char *pszPluginFilter = RTPathJoinA(szPath, VBOX_HDDFORMAT_PLUGIN_PREFIX "*");
3147 if (!pszPluginFilter)
3148 return VERR_NO_STR_MEMORY;
3149
3150 PRTDIRENTRYEX pPluginDirEntry = NULL;
3151 size_t cbPluginDirEntry = sizeof(RTDIRENTRYEX);
3152 /* The plugins are in the same directory as the other shared libs. */
3153 rc = RTDirOpenFiltered(&pPluginDir, pszPluginFilter, RTDIRFILTER_WINNT, 0);
3154 if (RT_FAILURE(rc))
3155 {
3156 /* On Windows the above immediately signals that there are no
3157 * files matching, while on other platforms enumerating the
3158 * files below fails. Either way: no plugins. */
3159 goto out;
3160 }
3161
3162 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(sizeof(RTDIRENTRYEX));
3163 if (!pPluginDirEntry)
3164 {
3165 rc = VERR_NO_MEMORY;
3166 goto out;
3167 }
3168
3169 while ((rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK)) != VERR_NO_MORE_FILES)
3170 {
3171 RTLDRMOD hPlugin = NIL_RTLDRMOD;
3172 PFNVBOXHDDFORMATLOAD pfnHDDFormatLoad = NULL;
3173 PVBOXHDDBACKEND pBackend = NULL;
3174 char *pszPluginPath = NULL;
3175
3176 if (rc == VERR_BUFFER_OVERFLOW)
3177 {
3178 /* allocate new buffer. */
3179 RTMemFree(pPluginDirEntry);
3180 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(cbPluginDirEntry);
3181 if (!pPluginDirEntry)
3182 {
3183 rc = VERR_NO_MEMORY;
3184 break;
3185 }
3186 /* Retry. */
3187 rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK);
3188 if (RT_FAILURE(rc))
3189 break;
3190 }
3191 else if (RT_FAILURE(rc))
3192 break;
3193
3194 /* We got the new entry. */
3195 if (!RTFS_IS_FILE(pPluginDirEntry->Info.Attr.fMode))
3196 continue;
3197
3198 /* Prepend the path to the libraries. */
3199 pszPluginPath = RTPathJoinA(szPath, pPluginDirEntry->szName);
3200 if (!pszPluginPath)
3201 {
3202 rc = VERR_NO_STR_MEMORY;
3203 break;
3204 }
3205
3206 rc = SUPR3HardenedLdrLoadPlugIn(pszPluginPath, &hPlugin, NULL);
3207 if (RT_SUCCESS(rc))
3208 {
3209 rc = RTLdrGetSymbol(hPlugin, VBOX_HDDFORMAT_LOAD_NAME, (void**)&pfnHDDFormatLoad);
3210 if (RT_FAILURE(rc) || !pfnHDDFormatLoad)
3211 {
3212 LogFunc(("error resolving the entry point %s in plugin %s, rc=%Rrc, pfnHDDFormat=%#p\n", VBOX_HDDFORMAT_LOAD_NAME, pPluginDirEntry->szName, rc, pfnHDDFormatLoad));
3213 if (RT_SUCCESS(rc))
3214 rc = VERR_SYMBOL_NOT_FOUND;
3215 }
3216
3217 if (RT_SUCCESS(rc))
3218 {
3219 /* Get the function table. */
3220 rc = pfnHDDFormatLoad(&pBackend);
3221 if (RT_SUCCESS(rc) && pBackend->cbSize == sizeof(VBOXHDDBACKEND))
3222 {
3223 pBackend->hPlugin = hPlugin;
3224 vdAddBackend(pBackend);
3225 }
3226 else
3227 LogFunc(("ignored plugin '%s': pBackend->cbSize=%d rc=%Rrc\n", pszPluginPath, pBackend->cbSize, rc));
3228 }
3229 else
3230 LogFunc(("ignored plugin '%s': rc=%Rrc\n", pszPluginPath, rc));
3231
3232 if (RT_FAILURE(rc))
3233 RTLdrClose(hPlugin);
3234 }
3235 RTStrFree(pszPluginPath);
3236 }
3237out:
3238 if (rc == VERR_NO_MORE_FILES)
3239 rc = VINF_SUCCESS;
3240 RTStrFree(pszPluginFilter);
3241 if (pPluginDirEntry)
3242 RTMemFree(pPluginDirEntry);
3243 if (pPluginDir)
3244 RTDirClose(pPluginDir);
3245 return rc;
3246#else
3247 return VINF_SUCCESS;
3248#endif
3249}
3250
3251/**
3252 * internal: scans plugin directory and loads the cache backends have been found.
3253 */
3254static int vdLoadDynamicCacheBackends()
3255{
3256#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3257 int rc = VINF_SUCCESS;
3258 PRTDIR pPluginDir = NULL;
3259
3260 /* Enumerate plugin backends. */
3261 char szPath[RTPATH_MAX];
3262 rc = RTPathAppPrivateArch(szPath, sizeof(szPath));
3263 if (RT_FAILURE(rc))
3264 return rc;
3265
3266 /* To get all entries with VBoxHDD as prefix. */
3267 char *pszPluginFilter = RTPathJoinA(szPath, VD_CACHEFORMAT_PLUGIN_PREFIX "*");
3268 if (!pszPluginFilter)
3269 {
3270 rc = VERR_NO_STR_MEMORY;
3271 return rc;
3272 }
3273
3274 PRTDIRENTRYEX pPluginDirEntry = NULL;
3275 size_t cbPluginDirEntry = sizeof(RTDIRENTRYEX);
3276 /* The plugins are in the same directory as the other shared libs. */
3277 rc = RTDirOpenFiltered(&pPluginDir, pszPluginFilter, RTDIRFILTER_WINNT, 0);
3278 if (RT_FAILURE(rc))
3279 {
3280 /* On Windows the above immediately signals that there are no
3281 * files matching, while on other platforms enumerating the
3282 * files below fails. Either way: no plugins. */
3283 goto out;
3284 }
3285
3286 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(sizeof(RTDIRENTRYEX));
3287 if (!pPluginDirEntry)
3288 {
3289 rc = VERR_NO_MEMORY;
3290 goto out;
3291 }
3292
3293 while ((rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK)) != VERR_NO_MORE_FILES)
3294 {
3295 RTLDRMOD hPlugin = NIL_RTLDRMOD;
3296 PFNVDCACHEFORMATLOAD pfnVDCacheLoad = NULL;
3297 PVDCACHEBACKEND pBackend = NULL;
3298 char *pszPluginPath = NULL;
3299
3300 if (rc == VERR_BUFFER_OVERFLOW)
3301 {
3302 /* allocate new buffer. */
3303 RTMemFree(pPluginDirEntry);
3304 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(cbPluginDirEntry);
3305 if (!pPluginDirEntry)
3306 {
3307 rc = VERR_NO_MEMORY;
3308 break;
3309 }
3310 /* Retry. */
3311 rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK);
3312 if (RT_FAILURE(rc))
3313 break;
3314 }
3315 else if (RT_FAILURE(rc))
3316 break;
3317
3318 /* We got the new entry. */
3319 if (!RTFS_IS_FILE(pPluginDirEntry->Info.Attr.fMode))
3320 continue;
3321
3322 /* Prepend the path to the libraries. */
3323 pszPluginPath = RTPathJoinA(szPath, pPluginDirEntry->szName);
3324 if (!pszPluginPath)
3325 {
3326 rc = VERR_NO_STR_MEMORY;
3327 break;
3328 }
3329
3330 rc = SUPR3HardenedLdrLoadPlugIn(pszPluginPath, &hPlugin, NULL);
3331 if (RT_SUCCESS(rc))
3332 {
3333 rc = RTLdrGetSymbol(hPlugin, VD_CACHEFORMAT_LOAD_NAME, (void**)&pfnVDCacheLoad);
3334 if (RT_FAILURE(rc) || !pfnVDCacheLoad)
3335 {
3336 LogFunc(("error resolving the entry point %s in plugin %s, rc=%Rrc, pfnVDCacheLoad=%#p\n",
3337 VD_CACHEFORMAT_LOAD_NAME, pPluginDirEntry->szName, rc, pfnVDCacheLoad));
3338 if (RT_SUCCESS(rc))
3339 rc = VERR_SYMBOL_NOT_FOUND;
3340 }
3341
3342 if (RT_SUCCESS(rc))
3343 {
3344 /* Get the function table. */
3345 rc = pfnVDCacheLoad(&pBackend);
3346 if (RT_SUCCESS(rc) && pBackend->cbSize == sizeof(VDCACHEBACKEND))
3347 {
3348 pBackend->hPlugin = hPlugin;
3349 vdAddCacheBackend(pBackend);
3350 }
3351 else
3352 LogFunc(("ignored plugin '%s': pBackend->cbSize=%d rc=%Rrc\n", pszPluginPath, pBackend->cbSize, rc));
3353 }
3354 else
3355 LogFunc(("ignored plugin '%s': rc=%Rrc\n", pszPluginPath, rc));
3356
3357 if (RT_FAILURE(rc))
3358 RTLdrClose(hPlugin);
3359 }
3360 RTStrFree(pszPluginPath);
3361 }
3362out:
3363 if (rc == VERR_NO_MORE_FILES)
3364 rc = VINF_SUCCESS;
3365 RTStrFree(pszPluginFilter);
3366 if (pPluginDirEntry)
3367 RTMemFree(pPluginDirEntry);
3368 if (pPluginDir)
3369 RTDirClose(pPluginDir);
3370 return rc;
3371#else
3372 return VINF_SUCCESS;
3373#endif
3374}
3375
3376/**
3377 * VD async I/O interface open callback.
3378 */
3379static int vdIOOpenFallback(void *pvUser, const char *pszLocation,
3380 uint32_t fOpen, PFNVDCOMPLETED pfnCompleted,
3381 void **ppStorage)
3382{
3383 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)RTMemAllocZ(sizeof(VDIIOFALLBACKSTORAGE));
3384
3385 if (!pStorage)
3386 return VERR_NO_MEMORY;
3387
3388 pStorage->pfnCompleted = pfnCompleted;
3389
3390 /* Open the file. */
3391 int rc = RTFileOpen(&pStorage->File, pszLocation, fOpen);
3392 if (RT_SUCCESS(rc))
3393 {
3394 *ppStorage = pStorage;
3395 return VINF_SUCCESS;
3396 }
3397
3398 RTMemFree(pStorage);
3399 return rc;
3400}
3401
3402/**
3403 * VD async I/O interface close callback.
3404 */
3405static int vdIOCloseFallback(void *pvUser, void *pvStorage)
3406{
3407 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3408
3409 RTFileClose(pStorage->File);
3410 RTMemFree(pStorage);
3411 return VINF_SUCCESS;
3412}
3413
3414static int vdIODeleteFallback(void *pvUser, const char *pcszFilename)
3415{
3416 return RTFileDelete(pcszFilename);
3417}
3418
3419static int vdIOMoveFallback(void *pvUser, const char *pcszSrc, const char *pcszDst, unsigned fMove)
3420{
3421 return RTFileMove(pcszSrc, pcszDst, fMove);
3422}
3423
3424static int vdIOGetFreeSpaceFallback(void *pvUser, const char *pcszFilename, int64_t *pcbFreeSpace)
3425{
3426 return RTFsQuerySizes(pcszFilename, NULL, pcbFreeSpace, NULL, NULL);
3427}
3428
3429static int vdIOGetModificationTimeFallback(void *pvUser, const char *pcszFilename, PRTTIMESPEC pModificationTime)
3430{
3431 RTFSOBJINFO info;
3432 int rc = RTPathQueryInfo(pcszFilename, &info, RTFSOBJATTRADD_NOTHING);
3433 if (RT_SUCCESS(rc))
3434 *pModificationTime = info.ModificationTime;
3435 return rc;
3436}
3437
3438/**
3439 * VD async I/O interface callback for retrieving the file size.
3440 */
3441static int vdIOGetSizeFallback(void *pvUser, void *pvStorage, uint64_t *pcbSize)
3442{
3443 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3444
3445 return RTFileGetSize(pStorage->File, pcbSize);
3446}
3447
3448/**
3449 * VD async I/O interface callback for setting the file size.
3450 */
3451static int vdIOSetSizeFallback(void *pvUser, void *pvStorage, uint64_t cbSize)
3452{
3453 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3454
3455 return RTFileSetSize(pStorage->File, cbSize);
3456}
3457
3458/**
3459 * VD async I/O interface callback for a synchronous write to the file.
3460 */
3461static int vdIOWriteSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3462 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
3463{
3464 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3465
3466 return RTFileWriteAt(pStorage->File, uOffset, pvBuf, cbWrite, pcbWritten);
3467}
3468
3469/**
3470 * VD async I/O interface callback for a synchronous read from the file.
3471 */
3472static int vdIOReadSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3473 void *pvBuf, size_t cbRead, size_t *pcbRead)
3474{
3475 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3476
3477 return RTFileReadAt(pStorage->File, uOffset, pvBuf, cbRead, pcbRead);
3478}
3479
3480/**
3481 * VD async I/O interface callback for a synchronous flush of the file data.
3482 */
3483static int vdIOFlushSyncFallback(void *pvUser, void *pvStorage)
3484{
3485 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3486
3487 return RTFileFlush(pStorage->File);
3488}
3489
3490/**
3491 * VD async I/O interface callback for a asynchronous read from the file.
3492 */
3493static int vdIOReadAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3494 PCRTSGSEG paSegments, size_t cSegments,
3495 size_t cbRead, void *pvCompletion,
3496 void **ppTask)
3497{
3498 return VERR_NOT_IMPLEMENTED;
3499}
3500
3501/**
3502 * VD async I/O interface callback for a asynchronous write to the file.
3503 */
3504static int vdIOWriteAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3505 PCRTSGSEG paSegments, size_t cSegments,
3506 size_t cbWrite, void *pvCompletion,
3507 void **ppTask)
3508{
3509 return VERR_NOT_IMPLEMENTED;
3510}
3511
3512/**
3513 * VD async I/O interface callback for a asynchronous flush of the file data.
3514 */
3515static int vdIOFlushAsyncFallback(void *pvUser, void *pStorage,
3516 void *pvCompletion, void **ppTask)
3517{
3518 return VERR_NOT_IMPLEMENTED;
3519}
3520
3521/**
3522 * Internal - Continues an I/O context after
3523 * it was halted because of an active transfer.
3524 */
3525static int vdIoCtxContinue(PVDIOCTX pIoCtx, int rcReq)
3526{
3527 PVBOXHDD pDisk = pIoCtx->pDisk;
3528 int rc = VINF_SUCCESS;
3529
3530 VD_IS_LOCKED(pDisk);
3531
3532 if (RT_FAILURE(rcReq))
3533 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
3534
3535 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
3536 {
3537 /* Continue the transfer */
3538 rc = vdIoCtxProcessLocked(pIoCtx);
3539
3540 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3541 && ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
3542 {
3543 LogFlowFunc(("I/O context completed pIoCtx=%#p\n", pIoCtx));
3544 if (pIoCtx->pIoCtxParent)
3545 {
3546 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
3547
3548 Assert(!pIoCtxParent->pIoCtxParent);
3549 if (RT_FAILURE(pIoCtx->rcReq))
3550 ASMAtomicCmpXchgS32(&pIoCtxParent->rcReq, pIoCtx->rcReq, VINF_SUCCESS);
3551
3552 ASMAtomicDecU32(&pIoCtxParent->cDataTransfersPending);
3553
3554 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE)
3555 {
3556 LogFlowFunc(("I/O context transferred %u bytes for the parent pIoCtxParent=%p\n",
3557 pIoCtx->Type.Child.cbTransferParent, pIoCtxParent));
3558
3559 /* Update the parent state. */
3560 Assert(pIoCtxParent->Req.Io.cbTransferLeft >= pIoCtx->Type.Child.cbTransferParent);
3561 ASMAtomicSubU32(&pIoCtxParent->Req.Io.cbTransferLeft, (uint32_t)pIoCtx->Type.Child.cbTransferParent);
3562 }
3563 else
3564 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH);
3565
3566 /*
3567 * A completed child write means that we finished growing the image.
3568 * We have to process any pending writes now.
3569 */
3570 vdIoCtxUnlockDisk(pDisk, pIoCtxParent, false /* fProcessDeferredReqs */);
3571
3572 /* Unblock the parent */
3573 pIoCtxParent->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3574
3575 rc = vdIoCtxProcessLocked(pIoCtxParent);
3576
3577 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3578 && ASMAtomicCmpXchgBool(&pIoCtxParent->fComplete, true, false))
3579 {
3580 LogFlowFunc(("Parent I/O context completed pIoCtxParent=%#p rcReq=%Rrc\n", pIoCtxParent, pIoCtxParent->rcReq));
3581 pIoCtxParent->Type.Root.pfnComplete(pIoCtxParent->Type.Root.pvUser1,
3582 pIoCtxParent->Type.Root.pvUser2,
3583 pIoCtxParent->rcReq);
3584 vdThreadFinishWrite(pDisk);
3585 vdIoCtxFree(pDisk, pIoCtxParent);
3586 vdDiskProcessBlockedIoCtx(pDisk);
3587 }
3588 else if (!vdIoCtxIsDiskLockOwner(pDisk, pIoCtx))
3589 {
3590 /* Process any pending writes if the current request didn't caused another growing. */
3591 vdDiskProcessBlockedIoCtx(pDisk);
3592 }
3593 }
3594 else
3595 {
3596 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH)
3597 {
3598 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDerredReqs */);
3599 vdThreadFinishWrite(pDisk);
3600 }
3601 else if ( pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE
3602 || pIoCtx->enmTxDir == VDIOCTXTXDIR_DISCARD)
3603 vdThreadFinishWrite(pDisk);
3604 else
3605 {
3606 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_READ);
3607 vdThreadFinishRead(pDisk);
3608 }
3609
3610 LogFlowFunc(("I/O context completed pIoCtx=%#p rcReq=%Rrc\n", pIoCtx, pIoCtx->rcReq));
3611 pIoCtx->Type.Root.pfnComplete(pIoCtx->Type.Root.pvUser1,
3612 pIoCtx->Type.Root.pvUser2,
3613 pIoCtx->rcReq);
3614 }
3615
3616 vdIoCtxFree(pDisk, pIoCtx);
3617 }
3618 }
3619
3620 return VINF_SUCCESS;
3621}
3622
3623/**
3624 * Internal - Called when user transfer completed.
3625 */
3626static int vdUserXferCompleted(PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
3627 PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3628 size_t cbTransfer, int rcReq)
3629{
3630 int rc = VINF_SUCCESS;
3631 bool fIoCtxContinue = true;
3632 PVBOXHDD pDisk = pIoCtx->pDisk;
3633
3634 LogFlowFunc(("pIoStorage=%#p pIoCtx=%#p pfnComplete=%#p pvUser=%#p cbTransfer=%zu rcReq=%Rrc\n",
3635 pIoStorage, pIoCtx, pfnComplete, pvUser, cbTransfer, rcReq));
3636
3637 VD_IS_LOCKED(pDisk);
3638
3639 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbTransfer);
3640 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTransfer); Assert(cbTransfer == (uint32_t)cbTransfer);
3641 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
3642
3643 if (pfnComplete)
3644 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3645
3646 if (RT_SUCCESS(rc))
3647 rc = vdIoCtxContinue(pIoCtx, rcReq);
3648 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3649 rc = VINF_SUCCESS;
3650
3651 return rc;
3652}
3653
3654/**
3655 * Internal - Called when a meta transfer completed.
3656 */
3657static int vdMetaXferCompleted(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3658 PVDMETAXFER pMetaXfer, int rcReq)
3659{
3660 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
3661 RTLISTNODE ListIoCtxWaiting;
3662 bool fFlush;
3663
3664 LogFlowFunc(("pIoStorage=%#p pfnComplete=%#p pvUser=%#p pMetaXfer=%#p rcReq=%Rrc\n",
3665 pIoStorage, pfnComplete, pvUser, pMetaXfer, rcReq));
3666
3667 VD_IS_LOCKED(pDisk);
3668
3669 fFlush = VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_FLUSH;
3670 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
3671
3672 if (!fFlush)
3673 {
3674 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3675
3676 if (RT_FAILURE(rcReq))
3677 {
3678 /* Remove from the AVL tree. */
3679 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3680 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3681 Assert(fRemoved);
3682 RTMemFree(pMetaXfer);
3683 }
3684 else
3685 {
3686 /* Increase the reference counter to make sure it doesn't go away before the last context is processed. */
3687 pMetaXfer->cRefs++;
3688 }
3689 }
3690 else
3691 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3692
3693 /* Go through the waiting list and continue the I/O contexts. */
3694 while (!RTListIsEmpty(&ListIoCtxWaiting))
3695 {
3696 int rc = VINF_SUCCESS;
3697 bool fContinue = true;
3698 PVDIOCTXDEFERRED pDeferred = RTListGetFirst(&ListIoCtxWaiting, VDIOCTXDEFERRED, NodeDeferred);
3699 PVDIOCTX pIoCtx = pDeferred->pIoCtx;
3700 RTListNodeRemove(&pDeferred->NodeDeferred);
3701
3702 RTMemFree(pDeferred);
3703 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
3704
3705 if (pfnComplete)
3706 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3707
3708 LogFlow(("Completion callback for I/O context %#p returned %Rrc\n", pIoCtx, rc));
3709
3710 if (RT_SUCCESS(rc))
3711 {
3712 rc = vdIoCtxContinue(pIoCtx, rcReq);
3713 AssertRC(rc);
3714 }
3715 else
3716 Assert(rc == VERR_VD_ASYNC_IO_IN_PROGRESS);
3717 }
3718
3719 /* Remove if not used anymore. */
3720 if (RT_SUCCESS(rcReq) && !fFlush)
3721 {
3722 pMetaXfer->cRefs--;
3723 if (!pMetaXfer->cRefs && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting))
3724 {
3725 /* Remove from the AVL tree. */
3726 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3727 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3728 Assert(fRemoved);
3729 RTMemFree(pMetaXfer);
3730 }
3731 }
3732 else if (fFlush)
3733 RTMemFree(pMetaXfer);
3734
3735 return VINF_SUCCESS;
3736}
3737
3738/**
3739 * Processes a list of waiting I/O tasks. The disk lock must be held by caller.
3740 *
3741 * @returns nothing.
3742 * @param pDisk The disk to process the list for.
3743 */
3744static void vdIoTaskProcessWaitingList(PVBOXHDD pDisk)
3745{
3746 LogFlowFunc(("pDisk=%#p\n", pDisk));
3747
3748 VD_IS_LOCKED(pDisk);
3749
3750 PVDIOTASK pHead = ASMAtomicXchgPtrT(&pDisk->pIoTasksPendingHead, NULL, PVDIOTASK);
3751
3752 Log(("I/O task list cleared\n"));
3753
3754 /* Reverse order. */
3755 PVDIOTASK pCur = pHead;
3756 pHead = NULL;
3757 while (pCur)
3758 {
3759 PVDIOTASK pInsert = pCur;
3760 pCur = pCur->pNext;
3761 pInsert->pNext = pHead;
3762 pHead = pInsert;
3763 }
3764
3765 while (pHead)
3766 {
3767 PVDIOSTORAGE pIoStorage = pHead->pIoStorage;
3768
3769 if (!pHead->fMeta)
3770 vdUserXferCompleted(pIoStorage, pHead->Type.User.pIoCtx,
3771 pHead->pfnComplete, pHead->pvUser,
3772 pHead->Type.User.cbTransfer, pHead->rcReq);
3773 else
3774 vdMetaXferCompleted(pIoStorage, pHead->pfnComplete, pHead->pvUser,
3775 pHead->Type.Meta.pMetaXfer, pHead->rcReq);
3776
3777 pCur = pHead;
3778 pHead = pHead->pNext;
3779 vdIoTaskFree(pDisk, pCur);
3780 }
3781}
3782
3783/**
3784 * Process any I/O context on the halted list.
3785 *
3786 * @returns nothing.
3787 * @param pDisk The disk.
3788 */
3789static void vdIoCtxProcessHaltedList(PVBOXHDD pDisk)
3790{
3791 LogFlowFunc(("pDisk=%#p\n", pDisk));
3792
3793 VD_IS_LOCKED(pDisk);
3794
3795 /* Get the waiting list and process it in FIFO order. */
3796 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHaltedHead, NULL, PVDIOCTX);
3797
3798 /* Reverse it. */
3799 PVDIOCTX pCur = pIoCtxHead;
3800 pIoCtxHead = NULL;
3801 while (pCur)
3802 {
3803 PVDIOCTX pInsert = pCur;
3804 pCur = pCur->pIoCtxNext;
3805 pInsert->pIoCtxNext = pIoCtxHead;
3806 pIoCtxHead = pInsert;
3807 }
3808
3809 /* Process now. */
3810 pCur = pIoCtxHead;
3811 while (pCur)
3812 {
3813 PVDIOCTX pTmp = pCur;
3814
3815 pCur = pCur->pIoCtxNext;
3816 pTmp->pIoCtxNext = NULL;
3817
3818 /* Continue */
3819 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3820 vdIoCtxContinue(pTmp, pTmp->rcReq);
3821 }
3822}
3823
3824/**
3825 * Unlock the disk and process pending tasks.
3826 *
3827 * @returns VBox status code.
3828 * @param pDisk The disk to unlock.
3829 */
3830static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
3831{
3832 int rc = VINF_SUCCESS;
3833
3834 VD_IS_LOCKED(pDisk);
3835
3836 /*
3837 * Process the list of waiting I/O tasks first
3838 * because they might complete I/O contexts.
3839 * Same for the list of halted I/O contexts.
3840 * Afterwards comes the list of new I/O contexts.
3841 */
3842 vdIoTaskProcessWaitingList(pDisk);
3843 vdIoCtxProcessHaltedList(pDisk);
3844 rc = vdDiskProcessWaitingIoCtx(pDisk, pIoCtxRc);
3845 ASMAtomicXchgBool(&pDisk->fLocked, false);
3846
3847 /*
3848 * Need to check for new I/O tasks and waiting I/O contexts now
3849 * again as other threads might added them while we processed
3850 * previous lists.
3851 */
3852 while ( ASMAtomicUoReadPtrT(&pDisk->pIoCtxHead, PVDIOCTX) != NULL
3853 || ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK) != NULL
3854 || ASMAtomicUoReadPtrT(&pDisk->pIoCtxHaltedHead, PVDIOCTX) != NULL)
3855 {
3856 /* Try lock disk again. */
3857 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
3858 {
3859 vdIoTaskProcessWaitingList(pDisk);
3860 vdIoCtxProcessHaltedList(pDisk);
3861 vdDiskProcessWaitingIoCtx(pDisk, NULL);
3862 ASMAtomicXchgBool(&pDisk->fLocked, false);
3863 }
3864 else /* Let the other thread everything when he unlocks the disk. */
3865 break;
3866 }
3867
3868 return rc;
3869}
3870
3871/**
3872 * Try to lock the disk to complete pressing of the I/O task.
3873 * The completion is deferred if the disk is locked already.
3874 *
3875 * @returns nothing.
3876 * @param pIoTask The I/O task to complete.
3877 */
3878static void vdXferTryLockDiskDeferIoTask(PVDIOTASK pIoTask)
3879{
3880 PVDIOSTORAGE pIoStorage = pIoTask->pIoStorage;
3881 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
3882
3883 Log(("Deferring I/O task pIoTask=%p\n", pIoTask));
3884
3885 /* Put it on the waiting list. */
3886 PVDIOTASK pNext = ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK);
3887 PVDIOTASK pHeadOld;
3888 pIoTask->pNext = pNext;
3889 while (!ASMAtomicCmpXchgExPtr(&pDisk->pIoTasksPendingHead, pIoTask, pNext, &pHeadOld))
3890 {
3891 pNext = pHeadOld;
3892 Assert(pNext != pIoTask);
3893 pIoTask->pNext = pNext;
3894 ASMNopPause();
3895 }
3896
3897 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
3898 {
3899 /* Release disk lock, it will take care of processing all lists. */
3900 vdDiskUnlock(pDisk, NULL);
3901 }
3902}
3903
3904static int vdIOIntReqCompleted(void *pvUser, int rcReq)
3905{
3906 PVDIOTASK pIoTask = (PVDIOTASK)pvUser;
3907
3908 LogFlowFunc(("Task completed pIoTask=%#p\n", pIoTask));
3909
3910 pIoTask->rcReq = rcReq;
3911 vdXferTryLockDiskDeferIoTask(pIoTask);
3912 return VINF_SUCCESS;
3913}
3914
3915/**
3916 * VD I/O interface callback for opening a file.
3917 */
3918static int vdIOIntOpen(void *pvUser, const char *pszLocation,
3919 unsigned uOpenFlags, PPVDIOSTORAGE ppIoStorage)
3920{
3921 int rc = VINF_SUCCESS;
3922 PVDIO pVDIo = (PVDIO)pvUser;
3923 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
3924
3925 if (!pIoStorage)
3926 return VERR_NO_MEMORY;
3927
3928 /* Create the AVl tree. */
3929 pIoStorage->pTreeMetaXfers = (PAVLRFOFFTREE)RTMemAllocZ(sizeof(AVLRFOFFTREE));
3930 if (pIoStorage->pTreeMetaXfers)
3931 {
3932 rc = pVDIo->pInterfaceIo->pfnOpen(pVDIo->pInterfaceIo->Core.pvUser,
3933 pszLocation, uOpenFlags,
3934 vdIOIntReqCompleted,
3935 &pIoStorage->pStorage);
3936 if (RT_SUCCESS(rc))
3937 {
3938 pIoStorage->pVDIo = pVDIo;
3939 *ppIoStorage = pIoStorage;
3940 return VINF_SUCCESS;
3941 }
3942
3943 RTMemFree(pIoStorage->pTreeMetaXfers);
3944 }
3945 else
3946 rc = VERR_NO_MEMORY;
3947
3948 RTMemFree(pIoStorage);
3949 return rc;
3950}
3951
3952static int vdIOIntTreeMetaXferDestroy(PAVLRFOFFNODECORE pNode, void *pvUser)
3953{
3954 AssertMsgFailed(("Tree should be empty at this point!\n"));
3955 return VINF_SUCCESS;
3956}
3957
3958static int vdIOIntClose(void *pvUser, PVDIOSTORAGE pIoStorage)
3959{
3960 int rc = VINF_SUCCESS;
3961 PVDIO pVDIo = (PVDIO)pvUser;
3962
3963 /* We free everything here, even if closing the file failed for some reason. */
3964 rc = pVDIo->pInterfaceIo->pfnClose(pVDIo->pInterfaceIo->Core.pvUser, pIoStorage->pStorage);
3965 RTAvlrFileOffsetDestroy(pIoStorage->pTreeMetaXfers, vdIOIntTreeMetaXferDestroy, NULL);
3966 RTMemFree(pIoStorage->pTreeMetaXfers);
3967 RTMemFree(pIoStorage);
3968 return rc;
3969}
3970
3971static int vdIOIntDelete(void *pvUser, const char *pcszFilename)
3972{
3973 PVDIO pVDIo = (PVDIO)pvUser;
3974 return pVDIo->pInterfaceIo->pfnDelete(pVDIo->pInterfaceIo->Core.pvUser,
3975 pcszFilename);
3976}
3977
3978static int vdIOIntMove(void *pvUser, const char *pcszSrc, const char *pcszDst,
3979 unsigned fMove)
3980{
3981 PVDIO pVDIo = (PVDIO)pvUser;
3982 return pVDIo->pInterfaceIo->pfnMove(pVDIo->pInterfaceIo->Core.pvUser,
3983 pcszSrc, pcszDst, fMove);
3984}
3985
3986static int vdIOIntGetFreeSpace(void *pvUser, const char *pcszFilename,
3987 int64_t *pcbFreeSpace)
3988{
3989 PVDIO pVDIo = (PVDIO)pvUser;
3990 return pVDIo->pInterfaceIo->pfnGetFreeSpace(pVDIo->pInterfaceIo->Core.pvUser,
3991 pcszFilename, pcbFreeSpace);
3992}
3993
3994static int vdIOIntGetModificationTime(void *pvUser, const char *pcszFilename,
3995 PRTTIMESPEC pModificationTime)
3996{
3997 PVDIO pVDIo = (PVDIO)pvUser;
3998 return pVDIo->pInterfaceIo->pfnGetModificationTime(pVDIo->pInterfaceIo->Core.pvUser,
3999 pcszFilename, pModificationTime);
4000}
4001
4002static int vdIOIntGetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4003 uint64_t *pcbSize)
4004{
4005 PVDIO pVDIo = (PVDIO)pvUser;
4006 return pVDIo->pInterfaceIo->pfnGetSize(pVDIo->pInterfaceIo->Core.pvUser,
4007 pIoStorage->pStorage, pcbSize);
4008}
4009
4010static int vdIOIntSetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4011 uint64_t cbSize)
4012{
4013 PVDIO pVDIo = (PVDIO)pvUser;
4014 return pVDIo->pInterfaceIo->pfnSetSize(pVDIo->pInterfaceIo->Core.pvUser,
4015 pIoStorage->pStorage, cbSize);
4016}
4017
4018static int vdIOIntReadUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4019 PVDIOCTX pIoCtx, size_t cbRead)
4020{
4021 int rc = VINF_SUCCESS;
4022 PVDIO pVDIo = (PVDIO)pvUser;
4023 PVBOXHDD pDisk = pVDIo->pDisk;
4024
4025 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbRead=%u\n",
4026 pvUser, pIoStorage, uOffset, pIoCtx, cbRead));
4027
4028 /** @todo: Enable check for sync I/O later. */
4029 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4030 VD_IS_LOCKED(pDisk);
4031
4032 Assert(cbRead > 0);
4033
4034 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4035 {
4036 RTSGSEG Seg;
4037 unsigned cSegments = 1;
4038 size_t cbTaskRead = 0;
4039
4040 /* Synchronous I/O contexts only have one buffer segment. */
4041 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4042 ("Invalid number of buffer segments for synchronous I/O context"),
4043 VERR_INVALID_PARAMETER);
4044
4045 cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbRead);
4046 Assert(cbRead == cbTaskRead);
4047 Assert(cSegments == 1);
4048 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4049 pIoStorage->pStorage, uOffset,
4050 Seg.pvSeg, cbRead, NULL);
4051 if (RT_SUCCESS(rc))
4052 {
4053 Assert(cbRead == (uint32_t)cbRead);
4054 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbRead);
4055 }
4056 }
4057 else
4058 {
4059 /* Build the S/G array and spawn a new I/O task */
4060 while (cbRead)
4061 {
4062 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4063 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4064 size_t cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbRead);
4065
4066 Assert(cSegments > 0);
4067 Assert(cbTaskRead > 0);
4068 AssertMsg(cbTaskRead <= cbRead, ("Invalid number of bytes to read\n"));
4069
4070 LogFlow(("Reading %u bytes into %u segments\n", cbTaskRead, cSegments));
4071
4072#ifdef RT_STRICT
4073 for (unsigned i = 0; i < cSegments; i++)
4074 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4075 ("Segment %u is invalid\n", i));
4076#endif
4077
4078 Assert(cbTaskRead == (uint32_t)cbTaskRead);
4079 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, NULL, NULL, pIoCtx, (uint32_t)cbTaskRead);
4080
4081 if (!pIoTask)
4082 return VERR_NO_MEMORY;
4083
4084 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4085
4086 void *pvTask;
4087 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4088 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4089 pIoStorage->pStorage, uOffset,
4090 aSeg, cSegments, cbTaskRead, pIoTask,
4091 &pvTask);
4092 if (RT_SUCCESS(rc))
4093 {
4094 AssertMsg(cbTaskRead <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4095 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskRead);
4096 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4097 vdIoTaskFree(pDisk, pIoTask);
4098 }
4099 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4100 {
4101 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4102 vdIoTaskFree(pDisk, pIoTask);
4103 break;
4104 }
4105
4106 uOffset += cbTaskRead;
4107 cbRead -= cbTaskRead;
4108 }
4109 }
4110
4111 LogFlowFunc(("returns rc=%Rrc\n", rc));
4112 return rc;
4113}
4114
4115static int vdIOIntWriteUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4116 PVDIOCTX pIoCtx, size_t cbWrite, PFNVDXFERCOMPLETED pfnComplete,
4117 void *pvCompleteUser)
4118{
4119 int rc = VINF_SUCCESS;
4120 PVDIO pVDIo = (PVDIO)pvUser;
4121 PVBOXHDD pDisk = pVDIo->pDisk;
4122
4123 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbWrite=%u\n",
4124 pvUser, pIoStorage, uOffset, pIoCtx, cbWrite));
4125
4126 /** @todo: Enable check for sync I/O later. */
4127 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4128 VD_IS_LOCKED(pDisk);
4129
4130 Assert(cbWrite > 0);
4131
4132 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4133 {
4134 RTSGSEG Seg;
4135 unsigned cSegments = 1;
4136 size_t cbTaskWrite = 0;
4137
4138 /* Synchronous I/O contexts only have one buffer segment. */
4139 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4140 ("Invalid number of buffer segments for synchronous I/O context"),
4141 VERR_INVALID_PARAMETER);
4142
4143 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbWrite);
4144 Assert(cbWrite == cbTaskWrite);
4145 Assert(cSegments == 1);
4146 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4147 pIoStorage->pStorage, uOffset,
4148 Seg.pvSeg, cbWrite, NULL);
4149 if (RT_SUCCESS(rc))
4150 {
4151 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbWrite);
4152 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbWrite);
4153 }
4154 }
4155 else
4156 {
4157 /* Build the S/G array and spawn a new I/O task */
4158 while (cbWrite)
4159 {
4160 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4161 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4162 size_t cbTaskWrite = 0;
4163
4164 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbWrite);
4165
4166 Assert(cSegments > 0);
4167 Assert(cbTaskWrite > 0);
4168 AssertMsg(cbTaskWrite <= cbWrite, ("Invalid number of bytes to write\n"));
4169
4170 LogFlow(("Writing %u bytes from %u segments\n", cbTaskWrite, cSegments));
4171
4172#ifdef DEBUG
4173 for (unsigned i = 0; i < cSegments; i++)
4174 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4175 ("Segment %u is invalid\n", i));
4176#endif
4177
4178 Assert(cbTaskWrite == (uint32_t)cbTaskWrite);
4179 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, pfnComplete, pvCompleteUser, pIoCtx, (uint32_t)cbTaskWrite);
4180
4181 if (!pIoTask)
4182 return VERR_NO_MEMORY;
4183
4184 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4185
4186 void *pvTask;
4187 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4188 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4189 pIoStorage->pStorage,
4190 uOffset, aSeg, cSegments,
4191 cbTaskWrite, pIoTask, &pvTask);
4192 if (RT_SUCCESS(rc))
4193 {
4194 AssertMsg(cbTaskWrite <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4195 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskWrite);
4196 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4197 vdIoTaskFree(pDisk, pIoTask);
4198 }
4199 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4200 {
4201 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4202 vdIoTaskFree(pDisk, pIoTask);
4203 break;
4204 }
4205
4206 uOffset += cbTaskWrite;
4207 cbWrite -= cbTaskWrite;
4208 }
4209 }
4210
4211 LogFlowFunc(("returns rc=%Rrc\n", rc));
4212 return rc;
4213}
4214
4215static int vdIOIntReadMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4216 void *pvBuf, size_t cbRead, PVDIOCTX pIoCtx,
4217 PPVDMETAXFER ppMetaXfer, PFNVDXFERCOMPLETED pfnComplete,
4218 void *pvCompleteUser)
4219{
4220 PVDIO pVDIo = (PVDIO)pvUser;
4221 PVBOXHDD pDisk = pVDIo->pDisk;
4222 int rc = VINF_SUCCESS;
4223 RTSGSEG Seg;
4224 PVDIOTASK pIoTask;
4225 PVDMETAXFER pMetaXfer = NULL;
4226 void *pvTask = NULL;
4227
4228 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbRead=%u\n",
4229 pvUser, pIoStorage, uOffset, pvBuf, cbRead));
4230
4231 AssertMsgReturn( pIoCtx
4232 || (!ppMetaXfer && !pfnComplete && !pvCompleteUser),
4233 ("A synchronous metadata read is requested but the parameters are wrong\n"),
4234 VERR_INVALID_POINTER);
4235
4236 /** @todo: Enable check for sync I/O later. */
4237 if ( pIoCtx
4238 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4239 VD_IS_LOCKED(pDisk);
4240
4241 if ( !pIoCtx
4242 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4243 {
4244 /* Handle synchronous metadata I/O. */
4245 /** @todo: Integrate with metadata transfers below. */
4246 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4247 pIoStorage->pStorage, uOffset,
4248 pvBuf, cbRead, NULL);
4249 if (ppMetaXfer)
4250 *ppMetaXfer = NULL;
4251 }
4252 else
4253 {
4254 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4255 if (!pMetaXfer)
4256 {
4257#ifdef RT_STRICT
4258 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGetBestFit(pIoStorage->pTreeMetaXfers, uOffset, false /* fAbove */);
4259 AssertMsg(!pMetaXfer || (pMetaXfer->Core.Key + (RTFOFF)pMetaXfer->cbMeta <= (RTFOFF)uOffset),
4260 ("Overlapping meta transfers!\n"));
4261#endif
4262
4263 /* Allocate a new meta transfer. */
4264 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbRead);
4265 if (!pMetaXfer)
4266 return VERR_NO_MEMORY;
4267
4268 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4269 if (!pIoTask)
4270 {
4271 RTMemFree(pMetaXfer);
4272 return VERR_NO_MEMORY;
4273 }
4274
4275 Seg.cbSeg = cbRead;
4276 Seg.pvSeg = pMetaXfer->abData;
4277
4278 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_READ);
4279 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4280 pIoStorage->pStorage,
4281 uOffset, &Seg, 1,
4282 cbRead, pIoTask, &pvTask);
4283
4284 if (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4285 {
4286 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4287 Assert(fInserted);
4288 }
4289 else
4290 RTMemFree(pMetaXfer);
4291
4292 if (RT_SUCCESS(rc))
4293 {
4294 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4295 vdIoTaskFree(pDisk, pIoTask);
4296 }
4297 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS && !pfnComplete)
4298 rc = VERR_VD_NOT_ENOUGH_METADATA;
4299 }
4300
4301 Assert(VALID_PTR(pMetaXfer) || RT_FAILURE(rc));
4302
4303 if (RT_SUCCESS(rc) || rc == VERR_VD_NOT_ENOUGH_METADATA || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4304 {
4305 /* If it is pending add the request to the list. */
4306 if (VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_READ)
4307 {
4308 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4309 AssertPtr(pDeferred);
4310
4311 RTListInit(&pDeferred->NodeDeferred);
4312 pDeferred->pIoCtx = pIoCtx;
4313
4314 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4315 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4316 rc = VERR_VD_NOT_ENOUGH_METADATA;
4317 }
4318 else
4319 {
4320 /* Transfer the data. */
4321 pMetaXfer->cRefs++;
4322 Assert(pMetaXfer->cbMeta >= cbRead);
4323 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4324 memcpy(pvBuf, pMetaXfer->abData, cbRead);
4325 *ppMetaXfer = pMetaXfer;
4326 }
4327 }
4328 }
4329
4330 LogFlowFunc(("returns rc=%Rrc\n", rc));
4331 return rc;
4332}
4333
4334static int vdIOIntWriteMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4335 const void *pvBuf, size_t cbWrite, PVDIOCTX pIoCtx,
4336 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4337{
4338 PVDIO pVDIo = (PVDIO)pvUser;
4339 PVBOXHDD pDisk = pVDIo->pDisk;
4340 int rc = VINF_SUCCESS;
4341 RTSGSEG Seg;
4342 PVDIOTASK pIoTask;
4343 PVDMETAXFER pMetaXfer = NULL;
4344 bool fInTree = false;
4345 void *pvTask = NULL;
4346
4347 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbWrite=%u\n",
4348 pvUser, pIoStorage, uOffset, pvBuf, cbWrite));
4349
4350 AssertMsgReturn( pIoCtx
4351 || (!pfnComplete && !pvCompleteUser),
4352 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4353 VERR_INVALID_POINTER);
4354
4355 /** @todo: Enable check for sync I/O later. */
4356 if ( pIoCtx
4357 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4358 VD_IS_LOCKED(pDisk);
4359
4360 if ( !pIoCtx
4361 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4362 {
4363 /* Handle synchronous metadata I/O. */
4364 /** @todo: Integrate with metadata transfers below. */
4365 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4366 pIoStorage->pStorage, uOffset,
4367 pvBuf, cbWrite, NULL);
4368 }
4369 else
4370 {
4371 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4372 if (!pMetaXfer)
4373 {
4374 /* Allocate a new meta transfer. */
4375 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbWrite);
4376 if (!pMetaXfer)
4377 return VERR_NO_MEMORY;
4378 }
4379 else
4380 {
4381 Assert(pMetaXfer->cbMeta >= cbWrite);
4382 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4383 fInTree = true;
4384 }
4385
4386 Assert(VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE);
4387
4388 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4389 if (!pIoTask)
4390 {
4391 RTMemFree(pMetaXfer);
4392 return VERR_NO_MEMORY;
4393 }
4394
4395 memcpy(pMetaXfer->abData, pvBuf, cbWrite);
4396 Seg.cbSeg = cbWrite;
4397 Seg.pvSeg = pMetaXfer->abData;
4398
4399 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4400
4401 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_WRITE);
4402 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4403 pIoStorage->pStorage,
4404 uOffset, &Seg, 1, cbWrite, pIoTask,
4405 &pvTask);
4406 if (RT_SUCCESS(rc))
4407 {
4408 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4409 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4410 vdIoTaskFree(pDisk, pIoTask);
4411 if (fInTree && !pMetaXfer->cRefs)
4412 {
4413 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4414 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4415 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4416 RTMemFree(pMetaXfer);
4417 pMetaXfer = NULL;
4418 }
4419 }
4420 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4421 {
4422 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4423 AssertPtr(pDeferred);
4424
4425 RTListInit(&pDeferred->NodeDeferred);
4426 pDeferred->pIoCtx = pIoCtx;
4427
4428 if (!fInTree)
4429 {
4430 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4431 Assert(fInserted);
4432 }
4433
4434 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4435 }
4436 else
4437 {
4438 RTMemFree(pMetaXfer);
4439 pMetaXfer = NULL;
4440 }
4441 }
4442
4443 LogFlowFunc(("returns rc=%Rrc\n", rc));
4444 return rc;
4445}
4446
4447static void vdIOIntMetaXferRelease(void *pvUser, PVDMETAXFER pMetaXfer)
4448{
4449 PVDIO pVDIo = (PVDIO)pvUser;
4450 PVBOXHDD pDisk = pVDIo->pDisk;
4451 PVDIOSTORAGE pIoStorage;
4452
4453 /*
4454 * It is possible that we get called with a NULL metadata xfer handle
4455 * for synchronous I/O. Just exit.
4456 */
4457 if (!pMetaXfer)
4458 return;
4459
4460 pIoStorage = pMetaXfer->pIoStorage;
4461
4462 VD_IS_LOCKED(pDisk);
4463
4464 Assert( VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE
4465 || VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
4466 Assert(pMetaXfer->cRefs > 0);
4467
4468 pMetaXfer->cRefs--;
4469 if ( !pMetaXfer->cRefs
4470 && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting)
4471 && VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
4472 {
4473 /* Free the meta data entry. */
4474 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4475 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4476 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4477
4478 RTMemFree(pMetaXfer);
4479 }
4480}
4481
4482static int vdIOIntFlush(void *pvUser, PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
4483 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4484{
4485 PVDIO pVDIo = (PVDIO)pvUser;
4486 PVBOXHDD pDisk = pVDIo->pDisk;
4487 int rc = VINF_SUCCESS;
4488 PVDIOTASK pIoTask;
4489 PVDMETAXFER pMetaXfer = NULL;
4490 void *pvTask = NULL;
4491
4492 LogFlowFunc(("pvUser=%#p pIoStorage=%#p pIoCtx=%#p\n",
4493 pvUser, pIoStorage, pIoCtx));
4494
4495 AssertMsgReturn( pIoCtx
4496 || (!pfnComplete && !pvCompleteUser),
4497 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4498 VERR_INVALID_POINTER);
4499
4500 /** @todo: Enable check for sync I/O later. */
4501 if ( pIoCtx
4502 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4503 VD_IS_LOCKED(pDisk);
4504
4505 if (pVDIo->fIgnoreFlush)
4506 return VINF_SUCCESS;
4507
4508 if ( !pIoCtx
4509 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4510 {
4511 /* Handle synchronous flushes. */
4512 /** @todo: Integrate with metadata transfers below. */
4513 rc = pVDIo->pInterfaceIo->pfnFlushSync(pVDIo->pInterfaceIo->Core.pvUser,
4514 pIoStorage->pStorage);
4515 }
4516 else
4517 {
4518 /* Allocate a new meta transfer. */
4519 pMetaXfer = vdMetaXferAlloc(pIoStorage, 0, 0);
4520 if (!pMetaXfer)
4521 return VERR_NO_MEMORY;
4522
4523 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvUser, pMetaXfer);
4524 if (!pIoTask)
4525 {
4526 RTMemFree(pMetaXfer);
4527 return VERR_NO_MEMORY;
4528 }
4529
4530 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4531
4532 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4533 AssertPtr(pDeferred);
4534
4535 RTListInit(&pDeferred->NodeDeferred);
4536 pDeferred->pIoCtx = pIoCtx;
4537
4538 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4539 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_FLUSH);
4540 rc = pVDIo->pInterfaceIo->pfnFlushAsync(pVDIo->pInterfaceIo->Core.pvUser,
4541 pIoStorage->pStorage,
4542 pIoTask, &pvTask);
4543 if (RT_SUCCESS(rc))
4544 {
4545 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4546 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4547 vdIoTaskFree(pDisk, pIoTask);
4548 RTMemFree(pDeferred);
4549 RTMemFree(pMetaXfer);
4550 }
4551 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4552 RTMemFree(pMetaXfer);
4553 }
4554
4555 LogFlowFunc(("returns rc=%Rrc\n", rc));
4556 return rc;
4557}
4558
4559static size_t vdIOIntIoCtxCopyTo(void *pvUser, PVDIOCTX pIoCtx,
4560 const void *pvBuf, size_t cbBuf)
4561{
4562 PVDIO pVDIo = (PVDIO)pvUser;
4563 PVBOXHDD pDisk = pVDIo->pDisk;
4564 size_t cbCopied = 0;
4565
4566 /** @todo: Enable check for sync I/O later. */
4567 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4568 VD_IS_LOCKED(pDisk);
4569
4570 cbCopied = vdIoCtxCopyTo(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4571 Assert(cbCopied == cbBuf);
4572
4573 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCopied); - triggers with vdCopyHelper/dmgRead.
4574 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4575
4576 return cbCopied;
4577}
4578
4579static size_t vdIOIntIoCtxCopyFrom(void *pvUser, PVDIOCTX pIoCtx,
4580 void *pvBuf, size_t cbBuf)
4581{
4582 PVDIO pVDIo = (PVDIO)pvUser;
4583 PVBOXHDD pDisk = pVDIo->pDisk;
4584 size_t cbCopied = 0;
4585
4586 /** @todo: Enable check for sync I/O later. */
4587 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4588 VD_IS_LOCKED(pDisk);
4589
4590 cbCopied = vdIoCtxCopyFrom(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4591 Assert(cbCopied == cbBuf);
4592
4593 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft > cbCopied); - triggers with vdCopyHelper/dmgRead.
4594 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4595
4596 return cbCopied;
4597}
4598
4599static size_t vdIOIntIoCtxSet(void *pvUser, PVDIOCTX pIoCtx, int ch, size_t cb)
4600{
4601 PVDIO pVDIo = (PVDIO)pvUser;
4602 PVBOXHDD pDisk = pVDIo->pDisk;
4603 size_t cbSet = 0;
4604
4605 /** @todo: Enable check for sync I/O later. */
4606 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4607 VD_IS_LOCKED(pDisk);
4608
4609 cbSet = vdIoCtxSet(pIoCtx, ch, cb);
4610 Assert(cbSet == cb);
4611
4612 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbSet); - triggers with vdCopyHelper/dmgRead.
4613 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbSet);
4614
4615 return cbSet;
4616}
4617
4618static size_t vdIOIntIoCtxSegArrayCreate(void *pvUser, PVDIOCTX pIoCtx,
4619 PRTSGSEG paSeg, unsigned *pcSeg,
4620 size_t cbData)
4621{
4622 PVDIO pVDIo = (PVDIO)pvUser;
4623 PVBOXHDD pDisk = pVDIo->pDisk;
4624 size_t cbCreated = 0;
4625
4626 /** @todo: Enable check for sync I/O later. */
4627 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4628 VD_IS_LOCKED(pDisk);
4629
4630 cbCreated = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, paSeg, pcSeg, cbData);
4631 Assert(!paSeg || cbData == cbCreated);
4632
4633 return cbCreated;
4634}
4635
4636static void vdIOIntIoCtxCompleted(void *pvUser, PVDIOCTX pIoCtx, int rcReq,
4637 size_t cbCompleted)
4638{
4639 PVDIO pVDIo = (PVDIO)pvUser;
4640 PVBOXHDD pDisk = pVDIo->pDisk;
4641
4642 LogFlowFunc(("pvUser=%#p pIoCtx=%#p rcReq=%Rrc cbCompleted=%zu\n",
4643 pvUser, pIoCtx, rcReq, cbCompleted));
4644
4645 /*
4646 * Grab the disk critical section to avoid races with other threads which
4647 * might still modify the I/O context.
4648 * Example is that iSCSI is doing an asynchronous write but calls us already
4649 * while the other thread is still hanging in vdWriteHelperAsync and couldn't update
4650 * the blocked state yet.
4651 * It can overwrite the state to true before we call vdIoCtxContinue and the
4652 * the request would hang indefinite.
4653 */
4654 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
4655 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCompleted);
4656 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCompleted);
4657
4658 /* Set next transfer function if the current one finished.
4659 * @todo: Find a better way to prevent vdIoCtxContinue from calling the current helper again. */
4660 if (!pIoCtx->Req.Io.cbTransferLeft)
4661 {
4662 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
4663 pIoCtx->pfnIoCtxTransferNext = NULL;
4664 }
4665
4666 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHaltedHead, pIoCtx);
4667 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4668 {
4669 /* Immediately drop the lock again, it will take care of processing the list. */
4670 vdDiskUnlock(pDisk, NULL);
4671 }
4672}
4673
4674static DECLCALLBACK(bool) vdIOIntIoCtxIsSynchronous(void *pvUser, PVDIOCTX pIoCtx)
4675{
4676 NOREF(pvUser);
4677 return !!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC);
4678}
4679
4680static DECLCALLBACK(bool) vdIOIntIoCtxIsZero(void *pvUser, PVDIOCTX pIoCtx, size_t cbCheck,
4681 bool fAdvance)
4682{
4683 NOREF(pvUser);
4684
4685 bool fIsZero = RTSgBufIsZero(&pIoCtx->Req.Io.SgBuf, cbCheck);
4686 if (fIsZero && fAdvance)
4687 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbCheck);
4688
4689 return fIsZero;
4690}
4691
4692/**
4693 * VD I/O interface callback for opening a file (limited version for VDGetFormat).
4694 */
4695static int vdIOIntOpenLimited(void *pvUser, const char *pszLocation,
4696 uint32_t fOpen, PPVDIOSTORAGE ppIoStorage)
4697{
4698 int rc = VINF_SUCCESS;
4699 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4700 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
4701
4702 if (!pIoStorage)
4703 return VERR_NO_MEMORY;
4704
4705 rc = pInterfaceIo->pfnOpen(NULL, pszLocation, fOpen, NULL, &pIoStorage->pStorage);
4706 if (RT_SUCCESS(rc))
4707 *ppIoStorage = pIoStorage;
4708 else
4709 RTMemFree(pIoStorage);
4710
4711 return rc;
4712}
4713
4714static int vdIOIntCloseLimited(void *pvUser, PVDIOSTORAGE pIoStorage)
4715{
4716 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4717 int rc = pInterfaceIo->pfnClose(NULL, pIoStorage->pStorage);
4718
4719 RTMemFree(pIoStorage);
4720 return rc;
4721}
4722
4723static int vdIOIntDeleteLimited(void *pvUser, const char *pcszFilename)
4724{
4725 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4726 return pInterfaceIo->pfnDelete(NULL, pcszFilename);
4727}
4728
4729static int vdIOIntMoveLimited(void *pvUser, const char *pcszSrc,
4730 const char *pcszDst, unsigned fMove)
4731{
4732 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4733 return pInterfaceIo->pfnMove(NULL, pcszSrc, pcszDst, fMove);
4734}
4735
4736static int vdIOIntGetFreeSpaceLimited(void *pvUser, const char *pcszFilename,
4737 int64_t *pcbFreeSpace)
4738{
4739 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4740 return pInterfaceIo->pfnGetFreeSpace(NULL, pcszFilename, pcbFreeSpace);
4741}
4742
4743static int vdIOIntGetModificationTimeLimited(void *pvUser,
4744 const char *pcszFilename,
4745 PRTTIMESPEC pModificationTime)
4746{
4747 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4748 return pInterfaceIo->pfnGetModificationTime(NULL, pcszFilename, pModificationTime);
4749}
4750
4751static int vdIOIntGetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4752 uint64_t *pcbSize)
4753{
4754 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4755 return pInterfaceIo->pfnGetSize(NULL, pIoStorage->pStorage, pcbSize);
4756}
4757
4758static int vdIOIntSetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4759 uint64_t cbSize)
4760{
4761 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4762 return pInterfaceIo->pfnSetSize(NULL, pIoStorage->pStorage, cbSize);
4763}
4764
4765static int vdIOIntWriteUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
4766 uint64_t uOffset, PVDIOCTX pIoCtx,
4767 size_t cbWrite,
4768 PFNVDXFERCOMPLETED pfnComplete,
4769 void *pvCompleteUser)
4770{
4771 NOREF(pvUser);
4772 NOREF(pStorage);
4773 NOREF(uOffset);
4774 NOREF(pIoCtx);
4775 NOREF(cbWrite);
4776 NOREF(pfnComplete);
4777 NOREF(pvCompleteUser);
4778 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
4779}
4780
4781static int vdIOIntReadUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
4782 uint64_t uOffset, PVDIOCTX pIoCtx,
4783 size_t cbRead)
4784{
4785 NOREF(pvUser);
4786 NOREF(pStorage);
4787 NOREF(uOffset);
4788 NOREF(pIoCtx);
4789 NOREF(cbRead);
4790 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
4791}
4792
4793static int vdIOIntWriteMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
4794 uint64_t uOffset, const void *pvBuffer,
4795 size_t cbBuffer, PVDIOCTX pIoCtx,
4796 PFNVDXFERCOMPLETED pfnComplete,
4797 void *pvCompleteUser)
4798{
4799 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4800
4801 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
4802 ("Async I/O not implemented for the limited interface"),
4803 VERR_NOT_SUPPORTED);
4804
4805 return pInterfaceIo->pfnWriteSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
4806}
4807
4808static int vdIOIntReadMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
4809 uint64_t uOffset, void *pvBuffer,
4810 size_t cbBuffer, PVDIOCTX pIoCtx,
4811 PPVDMETAXFER ppMetaXfer,
4812 PFNVDXFERCOMPLETED pfnComplete,
4813 void *pvCompleteUser)
4814{
4815 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4816
4817 AssertMsgReturn(!pIoCtx && !ppMetaXfer && !pfnComplete && !pvCompleteUser,
4818 ("Async I/O not implemented for the limited interface"),
4819 VERR_NOT_SUPPORTED);
4820
4821 return pInterfaceIo->pfnReadSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
4822}
4823
4824static int vdIOIntMetaXferReleaseLimited(void *pvUser, PVDMETAXFER pMetaXfer)
4825{
4826 /* This is a NOP in this case. */
4827 NOREF(pvUser);
4828 NOREF(pMetaXfer);
4829 return VINF_SUCCESS;
4830}
4831
4832static int vdIOIntFlushLimited(void *pvUser, PVDIOSTORAGE pStorage,
4833 PVDIOCTX pIoCtx,
4834 PFNVDXFERCOMPLETED pfnComplete,
4835 void *pvCompleteUser)
4836{
4837 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4838
4839 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
4840 ("Async I/O not implemented for the limited interface"),
4841 VERR_NOT_SUPPORTED);
4842
4843 return pInterfaceIo->pfnFlushSync(NULL, pStorage->pStorage);
4844}
4845
4846/**
4847 * internal: send output to the log (unconditionally).
4848 */
4849int vdLogMessage(void *pvUser, const char *pszFormat, va_list args)
4850{
4851 NOREF(pvUser);
4852 RTLogPrintfV(pszFormat, args);
4853 return VINF_SUCCESS;
4854}
4855
4856DECLINLINE(int) vdMessageWrapper(PVBOXHDD pDisk, const char *pszFormat, ...)
4857{
4858 va_list va;
4859 va_start(va, pszFormat);
4860 int rc = pDisk->pInterfaceError->pfnMessage(pDisk->pInterfaceError->Core.pvUser,
4861 pszFormat, va);
4862 va_end(va);
4863 return rc;
4864}
4865
4866
4867/**
4868 * internal: adjust PCHS geometry
4869 */
4870static void vdFixupPCHSGeometry(PVDGEOMETRY pPCHS, uint64_t cbSize)
4871{
4872 /* Fix broken PCHS geometry. Can happen for two reasons: either the backend
4873 * mixes up PCHS and LCHS, or the application used to create the source
4874 * image has put garbage in it. Additionally, if the PCHS geometry covers
4875 * more than the image size, set it back to the default. */
4876 if ( pPCHS->cHeads > 16
4877 || pPCHS->cSectors > 63
4878 || pPCHS->cCylinders == 0
4879 || (uint64_t)pPCHS->cHeads * pPCHS->cSectors * pPCHS->cCylinders * 512 > cbSize)
4880 {
4881 Assert(!(RT_MIN(cbSize / 512 / 16 / 63, 16383) - (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383)));
4882 pPCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383);
4883 pPCHS->cHeads = 16;
4884 pPCHS->cSectors = 63;
4885 }
4886}
4887
4888/**
4889 * internal: adjust PCHS geometry
4890 */
4891static void vdFixupLCHSGeometry(PVDGEOMETRY pLCHS, uint64_t cbSize)
4892{
4893 /* Fix broken LCHS geometry. Can happen for two reasons: either the backend
4894 * mixes up PCHS and LCHS, or the application used to create the source
4895 * image has put garbage in it. The fix in this case is to clear the LCHS
4896 * geometry to trigger autodetection when it is used next. If the geometry
4897 * already says "please autodetect" (cylinders=0) keep it. */
4898 if ( ( pLCHS->cHeads > 255
4899 || pLCHS->cHeads == 0
4900 || pLCHS->cSectors > 63
4901 || pLCHS->cSectors == 0)
4902 && pLCHS->cCylinders != 0)
4903 {
4904 pLCHS->cCylinders = 0;
4905 pLCHS->cHeads = 0;
4906 pLCHS->cSectors = 0;
4907 }
4908 /* Always recompute the number of cylinders stored in the LCHS
4909 * geometry if it isn't set to "autotedetect" at the moment.
4910 * This is very useful if the destination image size is
4911 * larger or smaller than the source image size. Do not modify
4912 * the number of heads and sectors. Windows guests hate it. */
4913 if ( pLCHS->cCylinders != 0
4914 && pLCHS->cHeads != 0 /* paranoia */
4915 && pLCHS->cSectors != 0 /* paranoia */)
4916 {
4917 Assert(!(RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024) - (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024)));
4918 pLCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024);
4919 }
4920}
4921
4922/**
4923 * Sets the I/O callbacks of the given interface to the fallback methods
4924 *
4925 * @returns nothing.
4926 * @param pIfIo The I/O interface to setup.
4927 */
4928static void vdIfIoFallbackCallbacksSetup(PVDINTERFACEIO pIfIo)
4929{
4930 pIfIo->pfnOpen = vdIOOpenFallback;
4931 pIfIo->pfnClose = vdIOCloseFallback;
4932 pIfIo->pfnDelete = vdIODeleteFallback;
4933 pIfIo->pfnMove = vdIOMoveFallback;
4934 pIfIo->pfnGetFreeSpace = vdIOGetFreeSpaceFallback;
4935 pIfIo->pfnGetModificationTime = vdIOGetModificationTimeFallback;
4936 pIfIo->pfnGetSize = vdIOGetSizeFallback;
4937 pIfIo->pfnSetSize = vdIOSetSizeFallback;
4938 pIfIo->pfnReadSync = vdIOReadSyncFallback;
4939 pIfIo->pfnWriteSync = vdIOWriteSyncFallback;
4940 pIfIo->pfnFlushSync = vdIOFlushSyncFallback;
4941 pIfIo->pfnReadAsync = vdIOReadAsyncFallback;
4942 pIfIo->pfnWriteAsync = vdIOWriteAsyncFallback;
4943 pIfIo->pfnFlushAsync = vdIOFlushAsyncFallback;
4944}
4945
4946/**
4947 * Sets the internal I/O callbacks of the given interface.
4948 *
4949 * @returns nothing.
4950 * @param pIfIoInt The internal I/O interface to setup.
4951 */
4952static void vdIfIoIntCallbacksSetup(PVDINTERFACEIOINT pIfIoInt)
4953{
4954 pIfIoInt->pfnOpen = vdIOIntOpen;
4955 pIfIoInt->pfnClose = vdIOIntClose;
4956 pIfIoInt->pfnDelete = vdIOIntDelete;
4957 pIfIoInt->pfnMove = vdIOIntMove;
4958 pIfIoInt->pfnGetFreeSpace = vdIOIntGetFreeSpace;
4959 pIfIoInt->pfnGetModificationTime = vdIOIntGetModificationTime;
4960 pIfIoInt->pfnGetSize = vdIOIntGetSize;
4961 pIfIoInt->pfnSetSize = vdIOIntSetSize;
4962 pIfIoInt->pfnReadUser = vdIOIntReadUser;
4963 pIfIoInt->pfnWriteUser = vdIOIntWriteUser;
4964 pIfIoInt->pfnReadMeta = vdIOIntReadMeta;
4965 pIfIoInt->pfnWriteMeta = vdIOIntWriteMeta;
4966 pIfIoInt->pfnMetaXferRelease = vdIOIntMetaXferRelease;
4967 pIfIoInt->pfnFlush = vdIOIntFlush;
4968 pIfIoInt->pfnIoCtxCopyFrom = vdIOIntIoCtxCopyFrom;
4969 pIfIoInt->pfnIoCtxCopyTo = vdIOIntIoCtxCopyTo;
4970 pIfIoInt->pfnIoCtxSet = vdIOIntIoCtxSet;
4971 pIfIoInt->pfnIoCtxSegArrayCreate = vdIOIntIoCtxSegArrayCreate;
4972 pIfIoInt->pfnIoCtxCompleted = vdIOIntIoCtxCompleted;
4973 pIfIoInt->pfnIoCtxIsSynchronous = vdIOIntIoCtxIsSynchronous;
4974 pIfIoInt->pfnIoCtxIsZero = vdIOIntIoCtxIsZero;
4975}
4976
4977/**
4978 * Internally used completion handler for synchronous I/O contexts.
4979 */
4980static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq)
4981{
4982 PVBOXHDD pDisk = (PVBOXHDD)pvUser1;
4983
4984 pDisk->rcSync = rcReq;
4985 RTSemEventSignal(pDisk->hEventSemSyncIo);
4986}
4987
4988/**
4989 * Initializes HDD backends.
4990 *
4991 * @returns VBox status code.
4992 */
4993VBOXDDU_DECL(int) VDInit(void)
4994{
4995 int rc = vdAddBackends(aStaticBackends, RT_ELEMENTS(aStaticBackends));
4996 if (RT_SUCCESS(rc))
4997 {
4998 rc = vdAddCacheBackends(aStaticCacheBackends, RT_ELEMENTS(aStaticCacheBackends));
4999 if (RT_SUCCESS(rc))
5000 {
5001 rc = vdLoadDynamicBackends();
5002 if (RT_SUCCESS(rc))
5003 rc = vdLoadDynamicCacheBackends();
5004 }
5005 }
5006 LogRel(("VDInit finished\n"));
5007 return rc;
5008}
5009
5010/**
5011 * Destroys loaded HDD backends.
5012 *
5013 * @returns VBox status code.
5014 */
5015VBOXDDU_DECL(int) VDShutdown(void)
5016{
5017 PVBOXHDDBACKEND *pBackends = g_apBackends;
5018 PVDCACHEBACKEND *pCacheBackends = g_apCacheBackends;
5019 unsigned cBackends = g_cBackends;
5020
5021 if (!pBackends)
5022 return VERR_INTERNAL_ERROR;
5023
5024 g_cBackends = 0;
5025 g_apBackends = NULL;
5026
5027#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
5028 for (unsigned i = 0; i < cBackends; i++)
5029 if (pBackends[i]->hPlugin != NIL_RTLDRMOD)
5030 RTLdrClose(pBackends[i]->hPlugin);
5031#endif
5032
5033 /* Clear the supported cache backends. */
5034 cBackends = g_cCacheBackends;
5035 g_cCacheBackends = 0;
5036 g_apCacheBackends = NULL;
5037
5038#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
5039 for (unsigned i = 0; i < cBackends; i++)
5040 if (pCacheBackends[i]->hPlugin != NIL_RTLDRMOD)
5041 RTLdrClose(pCacheBackends[i]->hPlugin);
5042#endif
5043
5044 if (pCacheBackends)
5045 RTMemFree(pCacheBackends);
5046 RTMemFree(pBackends);
5047 return VINF_SUCCESS;
5048}
5049
5050
5051/**
5052 * Lists all HDD backends and their capabilities in a caller-provided buffer.
5053 *
5054 * @returns VBox status code.
5055 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5056 * @param cEntriesAlloc Number of list entries available.
5057 * @param pEntries Pointer to array for the entries.
5058 * @param pcEntriesUsed Number of entries returned.
5059 */
5060VBOXDDU_DECL(int) VDBackendInfo(unsigned cEntriesAlloc, PVDBACKENDINFO pEntries,
5061 unsigned *pcEntriesUsed)
5062{
5063 int rc = VINF_SUCCESS;
5064 PRTDIR pPluginDir = NULL;
5065 unsigned cEntries = 0;
5066
5067 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5068 /* Check arguments. */
5069 AssertMsgReturn(cEntriesAlloc,
5070 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5071 VERR_INVALID_PARAMETER);
5072 AssertMsgReturn(VALID_PTR(pEntries),
5073 ("pEntries=%#p\n", pEntries),
5074 VERR_INVALID_PARAMETER);
5075 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5076 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5077 VERR_INVALID_PARAMETER);
5078 if (!g_apBackends)
5079 VDInit();
5080
5081 if (cEntriesAlloc < g_cBackends)
5082 {
5083 *pcEntriesUsed = g_cBackends;
5084 return VERR_BUFFER_OVERFLOW;
5085 }
5086
5087 for (unsigned i = 0; i < g_cBackends; i++)
5088 {
5089 pEntries[i].pszBackend = g_apBackends[i]->pszBackendName;
5090 pEntries[i].uBackendCaps = g_apBackends[i]->uBackendCaps;
5091 pEntries[i].paFileExtensions = g_apBackends[i]->paFileExtensions;
5092 pEntries[i].paConfigInfo = g_apBackends[i]->paConfigInfo;
5093 pEntries[i].pfnComposeLocation = g_apBackends[i]->pfnComposeLocation;
5094 pEntries[i].pfnComposeName = g_apBackends[i]->pfnComposeName;
5095 }
5096
5097 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cEntries));
5098 *pcEntriesUsed = g_cBackends;
5099 return rc;
5100}
5101
5102/**
5103 * Lists the capabilities of a backend identified by its name.
5104 *
5105 * @returns VBox status code.
5106 * @param pszBackend The backend name.
5107 * @param pEntries Pointer to an entry.
5108 */
5109VBOXDDU_DECL(int) VDBackendInfoOne(const char *pszBackend, PVDBACKENDINFO pEntry)
5110{
5111 LogFlowFunc(("pszBackend=%#p pEntry=%#p\n", pszBackend, pEntry));
5112 /* Check arguments. */
5113 AssertMsgReturn(VALID_PTR(pszBackend),
5114 ("pszBackend=%#p\n", pszBackend),
5115 VERR_INVALID_PARAMETER);
5116 AssertMsgReturn(VALID_PTR(pEntry),
5117 ("pEntry=%#p\n", pEntry),
5118 VERR_INVALID_PARAMETER);
5119 if (!g_apBackends)
5120 VDInit();
5121
5122 /* Go through loaded backends. */
5123 for (unsigned i = 0; i < g_cBackends; i++)
5124 {
5125 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
5126 {
5127 pEntry->pszBackend = g_apBackends[i]->pszBackendName;
5128 pEntry->uBackendCaps = g_apBackends[i]->uBackendCaps;
5129 pEntry->paFileExtensions = g_apBackends[i]->paFileExtensions;
5130 pEntry->paConfigInfo = g_apBackends[i]->paConfigInfo;
5131 return VINF_SUCCESS;
5132 }
5133 }
5134
5135 return VERR_NOT_FOUND;
5136}
5137
5138/**
5139 * Allocates and initializes an empty HDD container.
5140 * No image files are opened.
5141 *
5142 * @returns VBox status code.
5143 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5144 * @param enmType Type of the image container.
5145 * @param ppDisk Where to store the reference to HDD container.
5146 */
5147VBOXDDU_DECL(int) VDCreate(PVDINTERFACE pVDIfsDisk, VDTYPE enmType, PVBOXHDD *ppDisk)
5148{
5149 int rc = VINF_SUCCESS;
5150 PVBOXHDD pDisk = NULL;
5151
5152 LogFlowFunc(("pVDIfsDisk=%#p\n", pVDIfsDisk));
5153 do
5154 {
5155 /* Check arguments. */
5156 AssertMsgBreakStmt(VALID_PTR(ppDisk),
5157 ("ppDisk=%#p\n", ppDisk),
5158 rc = VERR_INVALID_PARAMETER);
5159
5160 pDisk = (PVBOXHDD)RTMemAllocZ(sizeof(VBOXHDD));
5161 if (pDisk)
5162 {
5163 pDisk->u32Signature = VBOXHDDDISK_SIGNATURE;
5164 pDisk->enmType = enmType;
5165 pDisk->cImages = 0;
5166 pDisk->pBase = NULL;
5167 pDisk->pLast = NULL;
5168 pDisk->cbSize = 0;
5169 pDisk->PCHSGeometry.cCylinders = 0;
5170 pDisk->PCHSGeometry.cHeads = 0;
5171 pDisk->PCHSGeometry.cSectors = 0;
5172 pDisk->LCHSGeometry.cCylinders = 0;
5173 pDisk->LCHSGeometry.cHeads = 0;
5174 pDisk->LCHSGeometry.cSectors = 0;
5175 pDisk->pVDIfsDisk = pVDIfsDisk;
5176 pDisk->pInterfaceError = NULL;
5177 pDisk->pInterfaceThreadSync = NULL;
5178 pDisk->pIoCtxLockOwner = NULL;
5179 pDisk->pIoCtxHead = NULL;
5180 pDisk->fLocked = false;
5181 pDisk->hEventSemSyncIo = NIL_RTSEMEVENT;
5182 pDisk->hMemCacheIoCtx = NIL_RTMEMCACHE;
5183 pDisk->hMemCacheIoTask = NIL_RTMEMCACHE;
5184
5185 rc = RTSemEventCreate(&pDisk->hEventSemSyncIo);
5186 if (RT_FAILURE(rc))
5187 break;
5188
5189 /* Create the I/O ctx cache */
5190 rc = RTMemCacheCreate(&pDisk->hMemCacheIoCtx, sizeof(VDIOCTX), 0, UINT32_MAX,
5191 NULL, NULL, NULL, 0);
5192 if (RT_FAILURE(rc))
5193 break;
5194
5195 /* Create the I/O task cache */
5196 rc = RTMemCacheCreate(&pDisk->hMemCacheIoTask, sizeof(VDIOTASK), 0, UINT32_MAX,
5197 NULL, NULL, NULL, 0);
5198 if (RT_FAILURE(rc))
5199 break;
5200
5201 pDisk->pInterfaceError = VDIfErrorGet(pVDIfsDisk);
5202 pDisk->pInterfaceThreadSync = VDIfThreadSyncGet(pVDIfsDisk);
5203
5204 *ppDisk = pDisk;
5205 }
5206 else
5207 {
5208 rc = VERR_NO_MEMORY;
5209 break;
5210 }
5211 } while (0);
5212
5213 if ( RT_FAILURE(rc)
5214 && pDisk)
5215 {
5216 if (pDisk->hEventSemSyncIo != NIL_RTSEMEVENT)
5217 RTSemEventDestroy(pDisk->hEventSemSyncIo);
5218 if (pDisk->hMemCacheIoCtx != NIL_RTMEMCACHE)
5219 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5220 if (pDisk->hMemCacheIoTask != NIL_RTMEMCACHE)
5221 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5222 }
5223
5224 LogFlowFunc(("returns %Rrc (pDisk=%#p)\n", rc, pDisk));
5225 return rc;
5226}
5227
5228/**
5229 * Destroys HDD container.
5230 * If container has opened image files they will be closed.
5231 *
5232 * @returns VBox status code.
5233 * @param pDisk Pointer to HDD container.
5234 */
5235VBOXDDU_DECL(int) VDDestroy(PVBOXHDD pDisk)
5236{
5237 int rc = VINF_SUCCESS;
5238 LogFlowFunc(("pDisk=%#p\n", pDisk));
5239 do
5240 {
5241 /* sanity check */
5242 AssertPtrBreak(pDisk);
5243 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5244 Assert(!pDisk->fLocked);
5245
5246 rc = VDCloseAll(pDisk);
5247 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5248 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5249 RTSemEventDestroy(pDisk->hEventSemSyncIo);
5250 RTMemFree(pDisk);
5251 } while (0);
5252 LogFlowFunc(("returns %Rrc\n", rc));
5253 return rc;
5254}
5255
5256/**
5257 * Try to get the backend name which can use this image.
5258 *
5259 * @returns VBox status code.
5260 * VINF_SUCCESS if a plugin was found.
5261 * ppszFormat contains the string which can be used as backend name.
5262 * VERR_NOT_SUPPORTED if no backend was found.
5263 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5264 * @param pVDIfsImage Pointer to the per-image VD interface list.
5265 * @param pszFilename Name of the image file for which the backend is queried.
5266 * @param ppszFormat Receives pointer of the UTF-8 string which contains the format name.
5267 * The returned pointer must be freed using RTStrFree().
5268 */
5269VBOXDDU_DECL(int) VDGetFormat(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
5270 const char *pszFilename, char **ppszFormat, VDTYPE *penmType)
5271{
5272 int rc = VERR_NOT_SUPPORTED;
5273 VDINTERFACEIOINT VDIfIoInt;
5274 VDINTERFACEIO VDIfIoFallback;
5275 PVDINTERFACEIO pInterfaceIo;
5276
5277 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
5278 /* Check arguments. */
5279 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
5280 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5281 VERR_INVALID_PARAMETER);
5282 AssertMsgReturn(VALID_PTR(ppszFormat),
5283 ("ppszFormat=%#p\n", ppszFormat),
5284 VERR_INVALID_PARAMETER);
5285 AssertMsgReturn(VALID_PTR(penmType),
5286 ("penmType=%#p\n", penmType),
5287 VERR_INVALID_PARAMETER);
5288
5289 if (!g_apBackends)
5290 VDInit();
5291
5292 pInterfaceIo = VDIfIoGet(pVDIfsImage);
5293 if (!pInterfaceIo)
5294 {
5295 /*
5296 * Caller doesn't provide an I/O interface, create our own using the
5297 * native file API.
5298 */
5299 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
5300 pInterfaceIo = &VDIfIoFallback;
5301 }
5302
5303 /* Set up the internal I/O interface. */
5304 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
5305 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
5306 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
5307 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
5308 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
5309 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
5310 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
5311 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
5312 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
5313 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
5314 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
5315 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
5316 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
5317 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
5318 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5319 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
5320 AssertRC(rc);
5321
5322 /* Find the backend supporting this file format. */
5323 for (unsigned i = 0; i < g_cBackends; i++)
5324 {
5325 if (g_apBackends[i]->pfnCheckIfValid)
5326 {
5327 rc = g_apBackends[i]->pfnCheckIfValid(pszFilename, pVDIfsDisk,
5328 pVDIfsImage, penmType);
5329 if ( RT_SUCCESS(rc)
5330 /* The correct backend has been found, but there is a small
5331 * incompatibility so that the file cannot be used. Stop here
5332 * and signal success - the actual open will of course fail,
5333 * but that will create a really sensible error message. */
5334 || ( rc != VERR_VD_GEN_INVALID_HEADER
5335 && rc != VERR_VD_VDI_INVALID_HEADER
5336 && rc != VERR_VD_VMDK_INVALID_HEADER
5337 && rc != VERR_VD_ISCSI_INVALID_HEADER
5338 && rc != VERR_VD_VHD_INVALID_HEADER
5339 && rc != VERR_VD_RAW_INVALID_HEADER
5340 && rc != VERR_VD_PARALLELS_INVALID_HEADER
5341 && rc != VERR_VD_DMG_INVALID_HEADER))
5342 {
5343 /* Copy the name into the new string. */
5344 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5345 if (!pszFormat)
5346 {
5347 rc = VERR_NO_MEMORY;
5348 break;
5349 }
5350 *ppszFormat = pszFormat;
5351 /* Do not consider the typical file access errors as success,
5352 * which allows the caller to deal with such issues. */
5353 if ( rc != VERR_ACCESS_DENIED
5354 && rc != VERR_PATH_NOT_FOUND
5355 && rc != VERR_FILE_NOT_FOUND)
5356 rc = VINF_SUCCESS;
5357 break;
5358 }
5359 rc = VERR_NOT_SUPPORTED;
5360 }
5361 }
5362
5363 /* Try the cache backends. */
5364 if (rc == VERR_NOT_SUPPORTED)
5365 {
5366 for (unsigned i = 0; i < g_cCacheBackends; i++)
5367 {
5368 if (g_apCacheBackends[i]->pfnProbe)
5369 {
5370 rc = g_apCacheBackends[i]->pfnProbe(pszFilename, pVDIfsDisk,
5371 pVDIfsImage);
5372 if ( RT_SUCCESS(rc)
5373 || (rc != VERR_VD_GEN_INVALID_HEADER))
5374 {
5375 /* Copy the name into the new string. */
5376 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5377 if (!pszFormat)
5378 {
5379 rc = VERR_NO_MEMORY;
5380 break;
5381 }
5382 *ppszFormat = pszFormat;
5383 rc = VINF_SUCCESS;
5384 break;
5385 }
5386 rc = VERR_NOT_SUPPORTED;
5387 }
5388 }
5389 }
5390
5391 LogFlowFunc(("returns %Rrc *ppszFormat=\"%s\"\n", rc, *ppszFormat));
5392 return rc;
5393}
5394
5395/**
5396 * Opens an image file.
5397 *
5398 * The first opened image file in HDD container must have a base image type,
5399 * others (next opened images) must be a differencing or undo images.
5400 * Linkage is checked for differencing image to be in consistence with the previously opened image.
5401 * When another differencing image is opened and the last image was opened in read/write access
5402 * mode, then the last image is reopened in read-only with deny write sharing mode. This allows
5403 * other processes to use images in read-only mode too.
5404 *
5405 * Note that the image is opened in read-only mode if a read/write open is not possible.
5406 * Use VDIsReadOnly to check open mode.
5407 *
5408 * @returns VBox status code.
5409 * @param pDisk Pointer to HDD container.
5410 * @param pszBackend Name of the image file backend to use.
5411 * @param pszFilename Name of the image file to open.
5412 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5413 * @param pVDIfsImage Pointer to the per-image VD interface list.
5414 */
5415VBOXDDU_DECL(int) VDOpen(PVBOXHDD pDisk, const char *pszBackend,
5416 const char *pszFilename, unsigned uOpenFlags,
5417 PVDINTERFACE pVDIfsImage)
5418{
5419 int rc = VINF_SUCCESS;
5420 int rc2;
5421 bool fLockWrite = false;
5422 PVDIMAGE pImage = NULL;
5423
5424 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsImage=%#p\n",
5425 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsImage));
5426
5427 do
5428 {
5429 /* sanity check */
5430 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5431 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5432
5433 /* Check arguments. */
5434 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5435 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5436 rc = VERR_INVALID_PARAMETER);
5437 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5438 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5439 rc = VERR_INVALID_PARAMETER);
5440 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5441 ("uOpenFlags=%#x\n", uOpenFlags),
5442 rc = VERR_INVALID_PARAMETER);
5443 AssertMsgBreakStmt( !(uOpenFlags & VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS)
5444 || (uOpenFlags & VD_OPEN_FLAGS_READONLY),
5445 ("uOpenFlags=%#x\n", uOpenFlags),
5446 rc = VERR_INVALID_PARAMETER);
5447
5448 /*
5449 * Destroy the current discard state first which might still have pending blocks
5450 * for the currently opened image which will be switched to readonly mode.
5451 */
5452 /* Lock disk for writing, as we modify pDisk information below. */
5453 rc2 = vdThreadStartWrite(pDisk);
5454 AssertRC(rc2);
5455 fLockWrite = true;
5456 rc = vdDiscardStateDestroy(pDisk);
5457 if (RT_FAILURE(rc))
5458 break;
5459 rc2 = vdThreadFinishWrite(pDisk);
5460 AssertRC(rc2);
5461 fLockWrite = false;
5462
5463 /* Set up image descriptor. */
5464 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
5465 if (!pImage)
5466 {
5467 rc = VERR_NO_MEMORY;
5468 break;
5469 }
5470 pImage->pszFilename = RTStrDup(pszFilename);
5471 if (!pImage->pszFilename)
5472 {
5473 rc = VERR_NO_MEMORY;
5474 break;
5475 }
5476
5477 pImage->VDIo.pDisk = pDisk;
5478 pImage->pVDIfsImage = pVDIfsImage;
5479
5480 rc = vdFindBackend(pszBackend, &pImage->Backend);
5481 if (RT_FAILURE(rc))
5482 break;
5483 if (!pImage->Backend)
5484 {
5485 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5486 N_("VD: unknown backend name '%s'"), pszBackend);
5487 break;
5488 }
5489
5490 /*
5491 * Fail if the backend can't do async I/O but the
5492 * flag is set.
5493 */
5494 if ( !(pImage->Backend->uBackendCaps & VD_CAP_ASYNC)
5495 && (uOpenFlags & VD_OPEN_FLAGS_ASYNC_IO))
5496 {
5497 rc = vdError(pDisk, VERR_NOT_SUPPORTED, RT_SRC_POS,
5498 N_("VD: Backend '%s' does not support async I/O"), pszBackend);
5499 break;
5500 }
5501
5502 /*
5503 * Fail if the backend doesn't support the discard operation but the
5504 * flag is set.
5505 */
5506 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DISCARD)
5507 && (uOpenFlags & VD_OPEN_FLAGS_DISCARD))
5508 {
5509 rc = vdError(pDisk, VERR_VD_DISCARD_NOT_SUPPORTED, RT_SRC_POS,
5510 N_("VD: Backend '%s' does not support discard"), pszBackend);
5511 break;
5512 }
5513
5514 /* Set up the I/O interface. */
5515 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
5516 if (!pImage->VDIo.pInterfaceIo)
5517 {
5518 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
5519 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
5520 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
5521 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
5522 }
5523
5524 /* Set up the internal I/O interface. */
5525 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
5526 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
5527 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5528 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
5529 AssertRC(rc);
5530
5531 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
5532 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
5533 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5534 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5535 pDisk->pVDIfsDisk,
5536 pImage->pVDIfsImage,
5537 pDisk->enmType,
5538 &pImage->pBackendData);
5539 /*
5540 * If the image is corrupted and there is a repair method try to repair it
5541 * first if it was openend in read-write mode and open again afterwards.
5542 */
5543 if ( RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED)
5544 && !(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5545 && pImage->Backend->pfnRepair)
5546 {
5547 rc = pImage->Backend->pfnRepair(pszFilename, pDisk->pVDIfsDisk, pImage->pVDIfsImage, 0 /* fFlags */);
5548 if (RT_SUCCESS(rc))
5549 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5550 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5551 pDisk->pVDIfsDisk,
5552 pImage->pVDIfsImage,
5553 pDisk->enmType,
5554 &pImage->pBackendData);
5555 else
5556 {
5557 rc = vdError(pDisk, rc, RT_SRC_POS,
5558 N_("VD: error %Rrc repairing corrupted image file '%s'"), rc, pszFilename);
5559 break;
5560 }
5561 }
5562 else if (RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED))
5563 {
5564 rc = vdError(pDisk, rc, RT_SRC_POS,
5565 N_("VD: Image file '%s' is corrupted and can't be opened"), pszFilename);
5566 break;
5567 }
5568
5569 /* If the open in read-write mode failed, retry in read-only mode. */
5570 if (RT_FAILURE(rc))
5571 {
5572 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5573 && ( rc == VERR_ACCESS_DENIED
5574 || rc == VERR_PERMISSION_DENIED
5575 || rc == VERR_WRITE_PROTECT
5576 || rc == VERR_SHARING_VIOLATION
5577 || rc == VERR_FILE_LOCK_FAILED))
5578 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5579 (uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS))
5580 | VD_OPEN_FLAGS_READONLY,
5581 pDisk->pVDIfsDisk,
5582 pImage->pVDIfsImage,
5583 pDisk->enmType,
5584 &pImage->pBackendData);
5585 if (RT_FAILURE(rc))
5586 {
5587 rc = vdError(pDisk, rc, RT_SRC_POS,
5588 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
5589 break;
5590 }
5591 }
5592
5593 /* Lock disk for writing, as we modify pDisk information below. */
5594 rc2 = vdThreadStartWrite(pDisk);
5595 AssertRC(rc2);
5596 fLockWrite = true;
5597
5598 pImage->VDIo.pBackendData = pImage->pBackendData;
5599
5600 /* Check image type. As the image itself has only partial knowledge
5601 * whether it's a base image or not, this info is derived here. The
5602 * base image can be fixed or normal, all others must be normal or
5603 * diff images. Some image formats don't distinguish between normal
5604 * and diff images, so this must be corrected here. */
5605 unsigned uImageFlags;
5606 uImageFlags = pImage->Backend->pfnGetImageFlags(pImage->pBackendData);
5607 if (RT_FAILURE(rc))
5608 uImageFlags = VD_IMAGE_FLAGS_NONE;
5609 if ( RT_SUCCESS(rc)
5610 && !(uOpenFlags & VD_OPEN_FLAGS_INFO))
5611 {
5612 if ( pDisk->cImages == 0
5613 && (uImageFlags & VD_IMAGE_FLAGS_DIFF))
5614 {
5615 rc = VERR_VD_INVALID_TYPE;
5616 break;
5617 }
5618 else if (pDisk->cImages != 0)
5619 {
5620 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5621 {
5622 rc = VERR_VD_INVALID_TYPE;
5623 break;
5624 }
5625 else
5626 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5627 }
5628 }
5629
5630 /* Ensure we always get correct diff information, even if the backend
5631 * doesn't actually have a stored flag for this. It must not return
5632 * bogus information for the parent UUID if it is not a diff image. */
5633 RTUUID parentUuid;
5634 RTUuidClear(&parentUuid);
5635 rc2 = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, &parentUuid);
5636 if (RT_SUCCESS(rc2) && !RTUuidIsNull(&parentUuid))
5637 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5638
5639 pImage->uImageFlags = uImageFlags;
5640
5641 /* Force sane optimization settings. It's not worth avoiding writes
5642 * to fixed size images. The overhead would have almost no payback. */
5643 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5644 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
5645
5646 /** @todo optionally check UUIDs */
5647
5648 /* Cache disk information. */
5649 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
5650
5651 /* Cache PCHS geometry. */
5652 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
5653 &pDisk->PCHSGeometry);
5654 if (RT_FAILURE(rc2))
5655 {
5656 pDisk->PCHSGeometry.cCylinders = 0;
5657 pDisk->PCHSGeometry.cHeads = 0;
5658 pDisk->PCHSGeometry.cSectors = 0;
5659 }
5660 else
5661 {
5662 /* Make sure the PCHS geometry is properly clipped. */
5663 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
5664 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
5665 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
5666 }
5667
5668 /* Cache LCHS geometry. */
5669 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
5670 &pDisk->LCHSGeometry);
5671 if (RT_FAILURE(rc2))
5672 {
5673 pDisk->LCHSGeometry.cCylinders = 0;
5674 pDisk->LCHSGeometry.cHeads = 0;
5675 pDisk->LCHSGeometry.cSectors = 0;
5676 }
5677 else
5678 {
5679 /* Make sure the LCHS geometry is properly clipped. */
5680 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
5681 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
5682 }
5683
5684 if (pDisk->cImages != 0)
5685 {
5686 /* Switch previous image to read-only mode. */
5687 unsigned uOpenFlagsPrevImg;
5688 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
5689 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
5690 {
5691 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
5692 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
5693 }
5694 }
5695
5696 if (RT_SUCCESS(rc))
5697 {
5698 /* Image successfully opened, make it the last image. */
5699 vdAddImageToList(pDisk, pImage);
5700 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
5701 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
5702 }
5703 else
5704 {
5705 /* Error detected, but image opened. Close image. */
5706 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
5707 AssertRC(rc2);
5708 pImage->pBackendData = NULL;
5709 }
5710 } while (0);
5711
5712 if (RT_UNLIKELY(fLockWrite))
5713 {
5714 rc2 = vdThreadFinishWrite(pDisk);
5715 AssertRC(rc2);
5716 }
5717
5718 if (RT_FAILURE(rc))
5719 {
5720 if (pImage)
5721 {
5722 if (pImage->pszFilename)
5723 RTStrFree(pImage->pszFilename);
5724 RTMemFree(pImage);
5725 }
5726 }
5727
5728 LogFlowFunc(("returns %Rrc\n", rc));
5729 return rc;
5730}
5731
5732/**
5733 * Opens a cache image.
5734 *
5735 * @return VBox status code.
5736 * @param pDisk Pointer to the HDD container which should use the cache image.
5737 * @param pszBackend Name of the cache file backend to use (case insensitive).
5738 * @param pszFilename Name of the cache image to open.
5739 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5740 * @param pVDIfsCache Pointer to the per-cache VD interface list.
5741 */
5742VBOXDDU_DECL(int) VDCacheOpen(PVBOXHDD pDisk, const char *pszBackend,
5743 const char *pszFilename, unsigned uOpenFlags,
5744 PVDINTERFACE pVDIfsCache)
5745{
5746 int rc = VINF_SUCCESS;
5747 int rc2;
5748 bool fLockWrite = false;
5749 PVDCACHE pCache = NULL;
5750
5751 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsCache=%#p\n",
5752 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsCache));
5753
5754 do
5755 {
5756 /* sanity check */
5757 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5758 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5759
5760 /* Check arguments. */
5761 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5762 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5763 rc = VERR_INVALID_PARAMETER);
5764 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5765 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5766 rc = VERR_INVALID_PARAMETER);
5767 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5768 ("uOpenFlags=%#x\n", uOpenFlags),
5769 rc = VERR_INVALID_PARAMETER);
5770
5771 /* Set up image descriptor. */
5772 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
5773 if (!pCache)
5774 {
5775 rc = VERR_NO_MEMORY;
5776 break;
5777 }
5778 pCache->pszFilename = RTStrDup(pszFilename);
5779 if (!pCache->pszFilename)
5780 {
5781 rc = VERR_NO_MEMORY;
5782 break;
5783 }
5784
5785 pCache->VDIo.pDisk = pDisk;
5786 pCache->pVDIfsCache = pVDIfsCache;
5787
5788 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
5789 if (RT_FAILURE(rc))
5790 break;
5791 if (!pCache->Backend)
5792 {
5793 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5794 N_("VD: unknown backend name '%s'"), pszBackend);
5795 break;
5796 }
5797
5798 /* Set up the I/O interface. */
5799 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
5800 if (!pCache->VDIo.pInterfaceIo)
5801 {
5802 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
5803 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
5804 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
5805 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
5806 }
5807
5808 /* Set up the internal I/O interface. */
5809 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
5810 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
5811 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5812 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
5813 AssertRC(rc);
5814
5815 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
5816 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
5817 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
5818 pDisk->pVDIfsDisk,
5819 pCache->pVDIfsCache,
5820 &pCache->pBackendData);
5821 /* If the open in read-write mode failed, retry in read-only mode. */
5822 if (RT_FAILURE(rc))
5823 {
5824 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5825 && ( rc == VERR_ACCESS_DENIED
5826 || rc == VERR_PERMISSION_DENIED
5827 || rc == VERR_WRITE_PROTECT
5828 || rc == VERR_SHARING_VIOLATION
5829 || rc == VERR_FILE_LOCK_FAILED))
5830 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
5831 (uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME)
5832 | VD_OPEN_FLAGS_READONLY,
5833 pDisk->pVDIfsDisk,
5834 pCache->pVDIfsCache,
5835 &pCache->pBackendData);
5836 if (RT_FAILURE(rc))
5837 {
5838 rc = vdError(pDisk, rc, RT_SRC_POS,
5839 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
5840 break;
5841 }
5842 }
5843
5844 /* Lock disk for writing, as we modify pDisk information below. */
5845 rc2 = vdThreadStartWrite(pDisk);
5846 AssertRC(rc2);
5847 fLockWrite = true;
5848
5849 /*
5850 * Check that the modification UUID of the cache and last image
5851 * match. If not the image was modified in-between without the cache.
5852 * The cache might contain stale data.
5853 */
5854 RTUUID UuidImage, UuidCache;
5855
5856 rc = pCache->Backend->pfnGetModificationUuid(pCache->pBackendData,
5857 &UuidCache);
5858 if (RT_SUCCESS(rc))
5859 {
5860 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
5861 &UuidImage);
5862 if (RT_SUCCESS(rc))
5863 {
5864 if (RTUuidCompare(&UuidImage, &UuidCache))
5865 rc = VERR_VD_CACHE_NOT_UP_TO_DATE;
5866 }
5867 }
5868
5869 /*
5870 * We assume that the user knows what he is doing if one of the images
5871 * doesn't support the modification uuid.
5872 */
5873 if (rc == VERR_NOT_SUPPORTED)
5874 rc = VINF_SUCCESS;
5875
5876 if (RT_SUCCESS(rc))
5877 {
5878 /* Cache successfully opened, make it the current one. */
5879 if (!pDisk->pCache)
5880 pDisk->pCache = pCache;
5881 else
5882 rc = VERR_VD_CACHE_ALREADY_EXISTS;
5883 }
5884
5885 if (RT_FAILURE(rc))
5886 {
5887 /* Error detected, but image opened. Close image. */
5888 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
5889 AssertRC(rc2);
5890 pCache->pBackendData = NULL;
5891 }
5892 } while (0);
5893
5894 if (RT_UNLIKELY(fLockWrite))
5895 {
5896 rc2 = vdThreadFinishWrite(pDisk);
5897 AssertRC(rc2);
5898 }
5899
5900 if (RT_FAILURE(rc))
5901 {
5902 if (pCache)
5903 {
5904 if (pCache->pszFilename)
5905 RTStrFree(pCache->pszFilename);
5906 RTMemFree(pCache);
5907 }
5908 }
5909
5910 LogFlowFunc(("returns %Rrc\n", rc));
5911 return rc;
5912}
5913
5914/**
5915 * Creates and opens a new base image file.
5916 *
5917 * @returns VBox status code.
5918 * @param pDisk Pointer to HDD container.
5919 * @param pszBackend Name of the image file backend to use.
5920 * @param pszFilename Name of the image file to create.
5921 * @param cbSize Image size in bytes.
5922 * @param uImageFlags Flags specifying special image features.
5923 * @param pszComment Pointer to image comment. NULL is ok.
5924 * @param pPCHSGeometry Pointer to physical disk geometry <= (16383,16,63). Not NULL.
5925 * @param pLCHSGeometry Pointer to logical disk geometry <= (x,255,63). Not NULL.
5926 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
5927 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5928 * @param pVDIfsImage Pointer to the per-image VD interface list.
5929 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
5930 */
5931VBOXDDU_DECL(int) VDCreateBase(PVBOXHDD pDisk, const char *pszBackend,
5932 const char *pszFilename, uint64_t cbSize,
5933 unsigned uImageFlags, const char *pszComment,
5934 PCVDGEOMETRY pPCHSGeometry,
5935 PCVDGEOMETRY pLCHSGeometry,
5936 PCRTUUID pUuid, unsigned uOpenFlags,
5937 PVDINTERFACE pVDIfsImage,
5938 PVDINTERFACE pVDIfsOperation)
5939{
5940 int rc = VINF_SUCCESS;
5941 int rc2;
5942 bool fLockWrite = false, fLockRead = false;
5943 PVDIMAGE pImage = NULL;
5944 RTUUID uuid;
5945
5946 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" PCHS=%u/%u/%u LCHS=%u/%u/%u Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
5947 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment,
5948 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
5949 pPCHSGeometry->cSectors, pLCHSGeometry->cCylinders,
5950 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors, pUuid,
5951 uOpenFlags, pVDIfsImage, pVDIfsOperation));
5952
5953 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
5954
5955 do
5956 {
5957 /* sanity check */
5958 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5959 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5960
5961 /* Check arguments. */
5962 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5963 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5964 rc = VERR_INVALID_PARAMETER);
5965 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5966 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5967 rc = VERR_INVALID_PARAMETER);
5968 AssertMsgBreakStmt(cbSize,
5969 ("cbSize=%llu\n", cbSize),
5970 rc = VERR_INVALID_PARAMETER);
5971 AssertMsgBreakStmt( ((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0)
5972 || ((uImageFlags & (VD_IMAGE_FLAGS_FIXED | VD_IMAGE_FLAGS_DIFF)) != VD_IMAGE_FLAGS_FIXED),
5973 ("uImageFlags=%#x\n", uImageFlags),
5974 rc = VERR_INVALID_PARAMETER);
5975 /* The PCHS geometry fields may be 0 to leave it for later. */
5976 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
5977 && pPCHSGeometry->cHeads <= 16
5978 && pPCHSGeometry->cSectors <= 63,
5979 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
5980 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
5981 pPCHSGeometry->cSectors),
5982 rc = VERR_INVALID_PARAMETER);
5983 /* The LCHS geometry fields may be 0 to leave it to later autodetection. */
5984 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
5985 && pLCHSGeometry->cHeads <= 255
5986 && pLCHSGeometry->cSectors <= 63,
5987 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
5988 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
5989 pLCHSGeometry->cSectors),
5990 rc = VERR_INVALID_PARAMETER);
5991 /* The UUID may be NULL. */
5992 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
5993 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
5994 rc = VERR_INVALID_PARAMETER);
5995 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5996 ("uOpenFlags=%#x\n", uOpenFlags),
5997 rc = VERR_INVALID_PARAMETER);
5998
5999 /* Check state. Needs a temporary read lock. Holding the write lock
6000 * all the time would be blocking other activities for too long. */
6001 rc2 = vdThreadStartRead(pDisk);
6002 AssertRC(rc2);
6003 fLockRead = true;
6004 AssertMsgBreakStmt(pDisk->cImages == 0,
6005 ("Create base image cannot be done with other images open\n"),
6006 rc = VERR_VD_INVALID_STATE);
6007 rc2 = vdThreadFinishRead(pDisk);
6008 AssertRC(rc2);
6009 fLockRead = false;
6010
6011 /* Set up image descriptor. */
6012 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6013 if (!pImage)
6014 {
6015 rc = VERR_NO_MEMORY;
6016 break;
6017 }
6018 pImage->pszFilename = RTStrDup(pszFilename);
6019 if (!pImage->pszFilename)
6020 {
6021 rc = VERR_NO_MEMORY;
6022 break;
6023 }
6024 pImage->VDIo.pDisk = pDisk;
6025 pImage->pVDIfsImage = pVDIfsImage;
6026
6027 /* Set up the I/O interface. */
6028 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6029 if (!pImage->VDIo.pInterfaceIo)
6030 {
6031 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6032 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6033 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6034 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6035 }
6036
6037 /* Set up the internal I/O interface. */
6038 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6039 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6040 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6041 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6042 AssertRC(rc);
6043
6044 rc = vdFindBackend(pszBackend, &pImage->Backend);
6045 if (RT_FAILURE(rc))
6046 break;
6047 if (!pImage->Backend)
6048 {
6049 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6050 N_("VD: unknown backend name '%s'"), pszBackend);
6051 break;
6052 }
6053 if (!(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6054 | VD_CAP_CREATE_DYNAMIC)))
6055 {
6056 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6057 N_("VD: backend '%s' cannot create base images"), pszBackend);
6058 break;
6059 }
6060
6061 /* Create UUID if the caller didn't specify one. */
6062 if (!pUuid)
6063 {
6064 rc = RTUuidCreate(&uuid);
6065 if (RT_FAILURE(rc))
6066 {
6067 rc = vdError(pDisk, rc, RT_SRC_POS,
6068 N_("VD: cannot generate UUID for image '%s'"),
6069 pszFilename);
6070 break;
6071 }
6072 pUuid = &uuid;
6073 }
6074
6075 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6076 uImageFlags &= ~VD_IMAGE_FLAGS_DIFF;
6077 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6078 rc = pImage->Backend->pfnCreate(pImage->pszFilename, cbSize,
6079 uImageFlags, pszComment, pPCHSGeometry,
6080 pLCHSGeometry, pUuid,
6081 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6082 0, 99,
6083 pDisk->pVDIfsDisk,
6084 pImage->pVDIfsImage,
6085 pVDIfsOperation,
6086 &pImage->pBackendData);
6087
6088 if (RT_SUCCESS(rc))
6089 {
6090 pImage->VDIo.pBackendData = pImage->pBackendData;
6091 pImage->uImageFlags = uImageFlags;
6092
6093 /* Force sane optimization settings. It's not worth avoiding writes
6094 * to fixed size images. The overhead would have almost no payback. */
6095 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6096 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
6097
6098 /* Lock disk for writing, as we modify pDisk information below. */
6099 rc2 = vdThreadStartWrite(pDisk);
6100 AssertRC(rc2);
6101 fLockWrite = true;
6102
6103 /** @todo optionally check UUIDs */
6104
6105 /* Re-check state, as the lock wasn't held and another image
6106 * creation call could have been done by another thread. */
6107 AssertMsgStmt(pDisk->cImages == 0,
6108 ("Create base image cannot be done with other images open\n"),
6109 rc = VERR_VD_INVALID_STATE);
6110 }
6111
6112 if (RT_SUCCESS(rc))
6113 {
6114 /* Cache disk information. */
6115 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
6116
6117 /* Cache PCHS geometry. */
6118 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
6119 &pDisk->PCHSGeometry);
6120 if (RT_FAILURE(rc2))
6121 {
6122 pDisk->PCHSGeometry.cCylinders = 0;
6123 pDisk->PCHSGeometry.cHeads = 0;
6124 pDisk->PCHSGeometry.cSectors = 0;
6125 }
6126 else
6127 {
6128 /* Make sure the CHS geometry is properly clipped. */
6129 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
6130 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
6131 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
6132 }
6133
6134 /* Cache LCHS geometry. */
6135 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
6136 &pDisk->LCHSGeometry);
6137 if (RT_FAILURE(rc2))
6138 {
6139 pDisk->LCHSGeometry.cCylinders = 0;
6140 pDisk->LCHSGeometry.cHeads = 0;
6141 pDisk->LCHSGeometry.cSectors = 0;
6142 }
6143 else
6144 {
6145 /* Make sure the CHS geometry is properly clipped. */
6146 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
6147 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
6148 }
6149
6150 /* Image successfully opened, make it the last image. */
6151 vdAddImageToList(pDisk, pImage);
6152 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6153 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6154 }
6155 else
6156 {
6157 /* Error detected, image may or may not be opened. Close and delete
6158 * image if it was opened. */
6159 if (pImage->pBackendData)
6160 {
6161 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6162 AssertRC(rc2);
6163 pImage->pBackendData = NULL;
6164 }
6165 }
6166 } while (0);
6167
6168 if (RT_UNLIKELY(fLockWrite))
6169 {
6170 rc2 = vdThreadFinishWrite(pDisk);
6171 AssertRC(rc2);
6172 }
6173 else if (RT_UNLIKELY(fLockRead))
6174 {
6175 rc2 = vdThreadFinishRead(pDisk);
6176 AssertRC(rc2);
6177 }
6178
6179 if (RT_FAILURE(rc))
6180 {
6181 if (pImage)
6182 {
6183 if (pImage->pszFilename)
6184 RTStrFree(pImage->pszFilename);
6185 RTMemFree(pImage);
6186 }
6187 }
6188
6189 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6190 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6191
6192 LogFlowFunc(("returns %Rrc\n", rc));
6193 return rc;
6194}
6195
6196/**
6197 * Creates and opens a new differencing image file in HDD container.
6198 * See comments for VDOpen function about differencing images.
6199 *
6200 * @returns VBox status code.
6201 * @param pDisk Pointer to HDD container.
6202 * @param pszBackend Name of the image file backend to use.
6203 * @param pszFilename Name of the differencing image file to create.
6204 * @param uImageFlags Flags specifying special image features.
6205 * @param pszComment Pointer to image comment. NULL is ok.
6206 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6207 * @param pParentUuid New parent UUID of the image. If NULL, the UUID is queried automatically.
6208 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6209 * @param pVDIfsImage Pointer to the per-image VD interface list.
6210 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6211 */
6212VBOXDDU_DECL(int) VDCreateDiff(PVBOXHDD pDisk, const char *pszBackend,
6213 const char *pszFilename, unsigned uImageFlags,
6214 const char *pszComment, PCRTUUID pUuid,
6215 PCRTUUID pParentUuid, unsigned uOpenFlags,
6216 PVDINTERFACE pVDIfsImage,
6217 PVDINTERFACE pVDIfsOperation)
6218{
6219 int rc = VINF_SUCCESS;
6220 int rc2;
6221 bool fLockWrite = false, fLockRead = false;
6222 PVDIMAGE pImage = NULL;
6223 RTUUID uuid;
6224
6225 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6226 pDisk, pszBackend, pszFilename, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsImage, pVDIfsOperation));
6227
6228 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6229
6230 do
6231 {
6232 /* sanity check */
6233 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6234 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6235
6236 /* Check arguments. */
6237 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6238 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6239 rc = VERR_INVALID_PARAMETER);
6240 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6241 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6242 rc = VERR_INVALID_PARAMETER);
6243 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6244 ("uImageFlags=%#x\n", uImageFlags),
6245 rc = VERR_INVALID_PARAMETER);
6246 /* The UUID may be NULL. */
6247 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6248 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6249 rc = VERR_INVALID_PARAMETER);
6250 /* The parent UUID may be NULL. */
6251 AssertMsgBreakStmt(pParentUuid == NULL || VALID_PTR(pParentUuid),
6252 ("pParentUuid=%#p ParentUUID=%RTuuid\n", pParentUuid, pParentUuid),
6253 rc = VERR_INVALID_PARAMETER);
6254 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6255 ("uOpenFlags=%#x\n", uOpenFlags),
6256 rc = VERR_INVALID_PARAMETER);
6257
6258 /* Check state. Needs a temporary read lock. Holding the write lock
6259 * all the time would be blocking other activities for too long. */
6260 rc2 = vdThreadStartRead(pDisk);
6261 AssertRC(rc2);
6262 fLockRead = true;
6263 AssertMsgBreakStmt(pDisk->cImages != 0,
6264 ("Create diff image cannot be done without other images open\n"),
6265 rc = VERR_VD_INVALID_STATE);
6266 rc2 = vdThreadFinishRead(pDisk);
6267 AssertRC(rc2);
6268 fLockRead = false;
6269
6270 /*
6271 * Destroy the current discard state first which might still have pending blocks
6272 * for the currently opened image which will be switched to readonly mode.
6273 */
6274 /* Lock disk for writing, as we modify pDisk information below. */
6275 rc2 = vdThreadStartWrite(pDisk);
6276 AssertRC(rc2);
6277 fLockWrite = true;
6278 rc = vdDiscardStateDestroy(pDisk);
6279 if (RT_FAILURE(rc))
6280 break;
6281 rc2 = vdThreadFinishWrite(pDisk);
6282 AssertRC(rc2);
6283 fLockWrite = false;
6284
6285 /* Set up image descriptor. */
6286 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6287 if (!pImage)
6288 {
6289 rc = VERR_NO_MEMORY;
6290 break;
6291 }
6292 pImage->pszFilename = RTStrDup(pszFilename);
6293 if (!pImage->pszFilename)
6294 {
6295 rc = VERR_NO_MEMORY;
6296 break;
6297 }
6298
6299 rc = vdFindBackend(pszBackend, &pImage->Backend);
6300 if (RT_FAILURE(rc))
6301 break;
6302 if (!pImage->Backend)
6303 {
6304 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6305 N_("VD: unknown backend name '%s'"), pszBackend);
6306 break;
6307 }
6308 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DIFF)
6309 || !(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6310 | VD_CAP_CREATE_DYNAMIC)))
6311 {
6312 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6313 N_("VD: backend '%s' cannot create diff images"), pszBackend);
6314 break;
6315 }
6316
6317 pImage->VDIo.pDisk = pDisk;
6318 pImage->pVDIfsImage = pVDIfsImage;
6319
6320 /* Set up the I/O interface. */
6321 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6322 if (!pImage->VDIo.pInterfaceIo)
6323 {
6324 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6325 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6326 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6327 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6328 }
6329
6330 /* Set up the internal I/O interface. */
6331 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6332 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6333 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6334 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6335 AssertRC(rc);
6336
6337 /* Create UUID if the caller didn't specify one. */
6338 if (!pUuid)
6339 {
6340 rc = RTUuidCreate(&uuid);
6341 if (RT_FAILURE(rc))
6342 {
6343 rc = vdError(pDisk, rc, RT_SRC_POS,
6344 N_("VD: cannot generate UUID for image '%s'"),
6345 pszFilename);
6346 break;
6347 }
6348 pUuid = &uuid;
6349 }
6350
6351 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6352 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6353 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6354 rc = pImage->Backend->pfnCreate(pImage->pszFilename, pDisk->cbSize,
6355 uImageFlags | VD_IMAGE_FLAGS_DIFF,
6356 pszComment, &pDisk->PCHSGeometry,
6357 &pDisk->LCHSGeometry, pUuid,
6358 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6359 0, 99,
6360 pDisk->pVDIfsDisk,
6361 pImage->pVDIfsImage,
6362 pVDIfsOperation,
6363 &pImage->pBackendData);
6364
6365 if (RT_SUCCESS(rc))
6366 {
6367 pImage->VDIo.pBackendData = pImage->pBackendData;
6368 pImage->uImageFlags = uImageFlags;
6369
6370 /* Lock disk for writing, as we modify pDisk information below. */
6371 rc2 = vdThreadStartWrite(pDisk);
6372 AssertRC(rc2);
6373 fLockWrite = true;
6374
6375 /* Switch previous image to read-only mode. */
6376 unsigned uOpenFlagsPrevImg;
6377 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
6378 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
6379 {
6380 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
6381 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
6382 }
6383
6384 /** @todo optionally check UUIDs */
6385
6386 /* Re-check state, as the lock wasn't held and another image
6387 * creation call could have been done by another thread. */
6388 AssertMsgStmt(pDisk->cImages != 0,
6389 ("Create diff image cannot be done without other images open\n"),
6390 rc = VERR_VD_INVALID_STATE);
6391 }
6392
6393 if (RT_SUCCESS(rc))
6394 {
6395 RTUUID Uuid;
6396 RTTIMESPEC ts;
6397
6398 if (pParentUuid && !RTUuidIsNull(pParentUuid))
6399 {
6400 Uuid = *pParentUuid;
6401 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6402 }
6403 else
6404 {
6405 rc2 = pDisk->pLast->Backend->pfnGetUuid(pDisk->pLast->pBackendData,
6406 &Uuid);
6407 if (RT_SUCCESS(rc2))
6408 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6409 }
6410 rc2 = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6411 &Uuid);
6412 if (RT_SUCCESS(rc2))
6413 pImage->Backend->pfnSetParentModificationUuid(pImage->pBackendData,
6414 &Uuid);
6415 if (pDisk->pLast->Backend->pfnGetTimeStamp)
6416 rc2 = pDisk->pLast->Backend->pfnGetTimeStamp(pDisk->pLast->pBackendData,
6417 &ts);
6418 else
6419 rc2 = VERR_NOT_IMPLEMENTED;
6420 if (RT_SUCCESS(rc2) && pImage->Backend->pfnSetParentTimeStamp)
6421 pImage->Backend->pfnSetParentTimeStamp(pImage->pBackendData, &ts);
6422
6423 if (pImage->Backend->pfnSetParentFilename)
6424 rc2 = pImage->Backend->pfnSetParentFilename(pImage->pBackendData, pDisk->pLast->pszFilename);
6425 }
6426
6427 if (RT_SUCCESS(rc))
6428 {
6429 /* Image successfully opened, make it the last image. */
6430 vdAddImageToList(pDisk, pImage);
6431 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6432 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6433 }
6434 else
6435 {
6436 /* Error detected, but image opened. Close and delete image. */
6437 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6438 AssertRC(rc2);
6439 pImage->pBackendData = NULL;
6440 }
6441 } while (0);
6442
6443 if (RT_UNLIKELY(fLockWrite))
6444 {
6445 rc2 = vdThreadFinishWrite(pDisk);
6446 AssertRC(rc2);
6447 }
6448 else if (RT_UNLIKELY(fLockRead))
6449 {
6450 rc2 = vdThreadFinishRead(pDisk);
6451 AssertRC(rc2);
6452 }
6453
6454 if (RT_FAILURE(rc))
6455 {
6456 if (pImage)
6457 {
6458 if (pImage->pszFilename)
6459 RTStrFree(pImage->pszFilename);
6460 RTMemFree(pImage);
6461 }
6462 }
6463
6464 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6465 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6466
6467 LogFlowFunc(("returns %Rrc\n", rc));
6468 return rc;
6469}
6470
6471
6472/**
6473 * Creates and opens new cache image file in HDD container.
6474 *
6475 * @return VBox status code.
6476 * @param pDisk Name of the cache file backend to use (case insensitive).
6477 * @param pszFilename Name of the differencing cache file to create.
6478 * @param cbSize Maximum size of the cache.
6479 * @param uImageFlags Flags specifying special cache features.
6480 * @param pszComment Pointer to image comment. NULL is ok.
6481 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6482 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6483 * @param pVDIfsCache Pointer to the per-cache VD interface list.
6484 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6485 */
6486VBOXDDU_DECL(int) VDCreateCache(PVBOXHDD pDisk, const char *pszBackend,
6487 const char *pszFilename, uint64_t cbSize,
6488 unsigned uImageFlags, const char *pszComment,
6489 PCRTUUID pUuid, unsigned uOpenFlags,
6490 PVDINTERFACE pVDIfsCache, PVDINTERFACE pVDIfsOperation)
6491{
6492 int rc = VINF_SUCCESS;
6493 int rc2;
6494 bool fLockWrite = false, fLockRead = false;
6495 PVDCACHE pCache = NULL;
6496 RTUUID uuid;
6497
6498 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6499 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsCache, pVDIfsOperation));
6500
6501 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6502
6503 do
6504 {
6505 /* sanity check */
6506 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6507 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6508
6509 /* Check arguments. */
6510 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6511 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6512 rc = VERR_INVALID_PARAMETER);
6513 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6514 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6515 rc = VERR_INVALID_PARAMETER);
6516 AssertMsgBreakStmt(cbSize,
6517 ("cbSize=%llu\n", cbSize),
6518 rc = VERR_INVALID_PARAMETER);
6519 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6520 ("uImageFlags=%#x\n", uImageFlags),
6521 rc = VERR_INVALID_PARAMETER);
6522 /* The UUID may be NULL. */
6523 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6524 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6525 rc = VERR_INVALID_PARAMETER);
6526 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6527 ("uOpenFlags=%#x\n", uOpenFlags),
6528 rc = VERR_INVALID_PARAMETER);
6529
6530 /* Check state. Needs a temporary read lock. Holding the write lock
6531 * all the time would be blocking other activities for too long. */
6532 rc2 = vdThreadStartRead(pDisk);
6533 AssertRC(rc2);
6534 fLockRead = true;
6535 AssertMsgBreakStmt(!pDisk->pCache,
6536 ("Create cache image cannot be done with a cache already attached\n"),
6537 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6538 rc2 = vdThreadFinishRead(pDisk);
6539 AssertRC(rc2);
6540 fLockRead = false;
6541
6542 /* Set up image descriptor. */
6543 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
6544 if (!pCache)
6545 {
6546 rc = VERR_NO_MEMORY;
6547 break;
6548 }
6549 pCache->pszFilename = RTStrDup(pszFilename);
6550 if (!pCache->pszFilename)
6551 {
6552 rc = VERR_NO_MEMORY;
6553 break;
6554 }
6555
6556 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
6557 if (RT_FAILURE(rc))
6558 break;
6559 if (!pCache->Backend)
6560 {
6561 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6562 N_("VD: unknown backend name '%s'"), pszBackend);
6563 break;
6564 }
6565
6566 pCache->VDIo.pDisk = pDisk;
6567 pCache->pVDIfsCache = pVDIfsCache;
6568
6569 /* Set up the I/O interface. */
6570 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
6571 if (!pCache->VDIo.pInterfaceIo)
6572 {
6573 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
6574 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6575 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
6576 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
6577 }
6578
6579 /* Set up the internal I/O interface. */
6580 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
6581 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
6582 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6583 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
6584 AssertRC(rc);
6585
6586 /* Create UUID if the caller didn't specify one. */
6587 if (!pUuid)
6588 {
6589 rc = RTUuidCreate(&uuid);
6590 if (RT_FAILURE(rc))
6591 {
6592 rc = vdError(pDisk, rc, RT_SRC_POS,
6593 N_("VD: cannot generate UUID for image '%s'"),
6594 pszFilename);
6595 break;
6596 }
6597 pUuid = &uuid;
6598 }
6599
6600 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6601 pCache->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6602 rc = pCache->Backend->pfnCreate(pCache->pszFilename, cbSize,
6603 uImageFlags,
6604 pszComment, pUuid,
6605 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6606 0, 99,
6607 pDisk->pVDIfsDisk,
6608 pCache->pVDIfsCache,
6609 pVDIfsOperation,
6610 &pCache->pBackendData);
6611
6612 if (RT_SUCCESS(rc))
6613 {
6614 /* Lock disk for writing, as we modify pDisk information below. */
6615 rc2 = vdThreadStartWrite(pDisk);
6616 AssertRC(rc2);
6617 fLockWrite = true;
6618
6619 pCache->VDIo.pBackendData = pCache->pBackendData;
6620
6621 /* Re-check state, as the lock wasn't held and another image
6622 * creation call could have been done by another thread. */
6623 AssertMsgStmt(!pDisk->pCache,
6624 ("Create cache image cannot be done with another cache open\n"),
6625 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6626 }
6627
6628 if ( RT_SUCCESS(rc)
6629 && pDisk->pLast)
6630 {
6631 RTUUID UuidModification;
6632
6633 /* Set same modification Uuid as the last image. */
6634 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6635 &UuidModification);
6636 if (RT_SUCCESS(rc))
6637 {
6638 rc = pCache->Backend->pfnSetModificationUuid(pCache->pBackendData,
6639 &UuidModification);
6640 }
6641
6642 if (rc == VERR_NOT_SUPPORTED)
6643 rc = VINF_SUCCESS;
6644 }
6645
6646 if (RT_SUCCESS(rc))
6647 {
6648 /* Cache successfully created. */
6649 pDisk->pCache = pCache;
6650 }
6651 else
6652 {
6653 /* Error detected, but image opened. Close and delete image. */
6654 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, true);
6655 AssertRC(rc2);
6656 pCache->pBackendData = NULL;
6657 }
6658 } while (0);
6659
6660 if (RT_UNLIKELY(fLockWrite))
6661 {
6662 rc2 = vdThreadFinishWrite(pDisk);
6663 AssertRC(rc2);
6664 }
6665 else if (RT_UNLIKELY(fLockRead))
6666 {
6667 rc2 = vdThreadFinishRead(pDisk);
6668 AssertRC(rc2);
6669 }
6670
6671 if (RT_FAILURE(rc))
6672 {
6673 if (pCache)
6674 {
6675 if (pCache->pszFilename)
6676 RTStrFree(pCache->pszFilename);
6677 RTMemFree(pCache);
6678 }
6679 }
6680
6681 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6682 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6683
6684 LogFlowFunc(("returns %Rrc\n", rc));
6685 return rc;
6686}
6687
6688/**
6689 * Merges two images (not necessarily with direct parent/child relationship).
6690 * As a side effect the source image and potentially the other images which
6691 * are also merged to the destination are deleted from both the disk and the
6692 * images in the HDD container.
6693 *
6694 * @returns VBox status code.
6695 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
6696 * @param pDisk Pointer to HDD container.
6697 * @param nImageFrom Name of the image file to merge from.
6698 * @param nImageTo Name of the image file to merge to.
6699 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6700 */
6701VBOXDDU_DECL(int) VDMerge(PVBOXHDD pDisk, unsigned nImageFrom,
6702 unsigned nImageTo, PVDINTERFACE pVDIfsOperation)
6703{
6704 int rc = VINF_SUCCESS;
6705 int rc2;
6706 bool fLockWrite = false, fLockRead = false;
6707 void *pvBuf = NULL;
6708
6709 LogFlowFunc(("pDisk=%#p nImageFrom=%u nImageTo=%u pVDIfsOperation=%#p\n",
6710 pDisk, nImageFrom, nImageTo, pVDIfsOperation));
6711
6712 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6713
6714 do
6715 {
6716 /* sanity check */
6717 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6718 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6719
6720 /* For simplicity reasons lock for writing as the image reopen below
6721 * might need it. After all the reopen is usually needed. */
6722 rc2 = vdThreadStartWrite(pDisk);
6723 AssertRC(rc2);
6724 fLockWrite = true;
6725 PVDIMAGE pImageFrom = vdGetImageByNumber(pDisk, nImageFrom);
6726 PVDIMAGE pImageTo = vdGetImageByNumber(pDisk, nImageTo);
6727 if (!pImageFrom || !pImageTo)
6728 {
6729 rc = VERR_VD_IMAGE_NOT_FOUND;
6730 break;
6731 }
6732 AssertBreakStmt(pImageFrom != pImageTo, rc = VERR_INVALID_PARAMETER);
6733
6734 /* Make sure destination image is writable. */
6735 unsigned uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
6736 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
6737 {
6738 /*
6739 * Clear skip consistency checks because the image is made writable now and
6740 * skipping consistency checks is only possible for readonly images.
6741 */
6742 uOpenFlags &= ~(VD_OPEN_FLAGS_READONLY | VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS);
6743 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
6744 uOpenFlags);
6745 if (RT_FAILURE(rc))
6746 break;
6747 }
6748
6749 /* Get size of destination image. */
6750 uint64_t cbSize = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
6751 rc2 = vdThreadFinishWrite(pDisk);
6752 AssertRC(rc2);
6753 fLockWrite = false;
6754
6755 /* Allocate tmp buffer. */
6756 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
6757 if (!pvBuf)
6758 {
6759 rc = VERR_NO_MEMORY;
6760 break;
6761 }
6762
6763 /* Merging is done directly on the images itself. This potentially
6764 * causes trouble if the disk is full in the middle of operation. */
6765 if (nImageFrom < nImageTo)
6766 {
6767 /* Merge parent state into child. This means writing all not
6768 * allocated blocks in the destination image which are allocated in
6769 * the images to be merged. */
6770 uint64_t uOffset = 0;
6771 uint64_t cbRemaining = cbSize;
6772 do
6773 {
6774 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
6775 RTSGSEG SegmentBuf;
6776 RTSGBUF SgBuf;
6777 VDIOCTX IoCtx;
6778
6779 SegmentBuf.pvSeg = pvBuf;
6780 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
6781 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
6782 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
6783 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
6784
6785 /* Need to hold the write lock during a read-write operation. */
6786 rc2 = vdThreadStartWrite(pDisk);
6787 AssertRC(rc2);
6788 fLockWrite = true;
6789
6790 rc = pImageTo->Backend->pfnRead(pImageTo->pBackendData,
6791 uOffset, cbThisRead,
6792 &IoCtx, &cbThisRead);
6793 if (rc == VERR_VD_BLOCK_FREE)
6794 {
6795 /* Search for image with allocated block. Do not attempt to
6796 * read more than the previous reads marked as valid.
6797 * Otherwise this would return stale data when different
6798 * block sizes are used for the images. */
6799 for (PVDIMAGE pCurrImage = pImageTo->pPrev;
6800 pCurrImage != NULL && pCurrImage != pImageFrom->pPrev && rc == VERR_VD_BLOCK_FREE;
6801 pCurrImage = pCurrImage->pPrev)
6802 {
6803 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
6804 uOffset, cbThisRead,
6805 &IoCtx, &cbThisRead);
6806 }
6807
6808 if (rc != VERR_VD_BLOCK_FREE)
6809 {
6810 if (RT_FAILURE(rc))
6811 break;
6812 /* Updating the cache is required because this might be a live merge. */
6813 rc = vdWriteHelperEx(pDisk, pImageTo, pImageFrom->pPrev,
6814 uOffset, pvBuf, cbThisRead,
6815 VDIOCTX_FLAGS_READ_UPDATE_CACHE, 0);
6816 if (RT_FAILURE(rc))
6817 break;
6818 }
6819 else
6820 rc = VINF_SUCCESS;
6821 }
6822 else if (RT_FAILURE(rc))
6823 break;
6824
6825 rc2 = vdThreadFinishWrite(pDisk);
6826 AssertRC(rc2);
6827 fLockWrite = false;
6828
6829 uOffset += cbThisRead;
6830 cbRemaining -= cbThisRead;
6831
6832 if (pIfProgress && pIfProgress->pfnProgress)
6833 {
6834 /** @todo r=klaus: this can update the progress to the same
6835 * percentage over and over again if the image format makes
6836 * relatively small increments. */
6837 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
6838 uOffset * 99 / cbSize);
6839 if (RT_FAILURE(rc))
6840 break;
6841 }
6842 } while (uOffset < cbSize);
6843 }
6844 else
6845 {
6846 /*
6847 * We may need to update the parent uuid of the child coming after
6848 * the last image to be merged. We have to reopen it read/write.
6849 *
6850 * This is done before we do the actual merge to prevent an
6851 * inconsistent chain if the mode change fails for some reason.
6852 */
6853 if (pImageFrom->pNext)
6854 {
6855 PVDIMAGE pImageChild = pImageFrom->pNext;
6856
6857 /* Take the write lock. */
6858 rc2 = vdThreadStartWrite(pDisk);
6859 AssertRC(rc2);
6860 fLockWrite = true;
6861
6862 /* We need to open the image in read/write mode. */
6863 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
6864
6865 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
6866 {
6867 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
6868 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
6869 uOpenFlags);
6870 if (RT_FAILURE(rc))
6871 break;
6872 }
6873
6874 rc2 = vdThreadFinishWrite(pDisk);
6875 AssertRC(rc2);
6876 fLockWrite = false;
6877 }
6878
6879 /* If the merge is from the last image we have to relay all writes
6880 * to the merge destination as well, so that concurrent writes
6881 * (in case of a live merge) are handled correctly. */
6882 if (!pImageFrom->pNext)
6883 {
6884 /* Take the write lock. */
6885 rc2 = vdThreadStartWrite(pDisk);
6886 AssertRC(rc2);
6887 fLockWrite = true;
6888
6889 pDisk->pImageRelay = pImageTo;
6890
6891 rc2 = vdThreadFinishWrite(pDisk);
6892 AssertRC(rc2);
6893 fLockWrite = false;
6894 }
6895
6896 /* Merge child state into parent. This means writing all blocks
6897 * which are allocated in the image up to the source image to the
6898 * destination image. */
6899 uint64_t uOffset = 0;
6900 uint64_t cbRemaining = cbSize;
6901 do
6902 {
6903 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
6904 RTSGSEG SegmentBuf;
6905 RTSGBUF SgBuf;
6906 VDIOCTX IoCtx;
6907
6908 rc = VERR_VD_BLOCK_FREE;
6909
6910 SegmentBuf.pvSeg = pvBuf;
6911 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
6912 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
6913 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
6914 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
6915
6916 /* Need to hold the write lock during a read-write operation. */
6917 rc2 = vdThreadStartWrite(pDisk);
6918 AssertRC(rc2);
6919 fLockWrite = true;
6920
6921 /* Search for image with allocated block. Do not attempt to
6922 * read more than the previous reads marked as valid. Otherwise
6923 * this would return stale data when different block sizes are
6924 * used for the images. */
6925 for (PVDIMAGE pCurrImage = pImageFrom;
6926 pCurrImage != NULL && pCurrImage != pImageTo && rc == VERR_VD_BLOCK_FREE;
6927 pCurrImage = pCurrImage->pPrev)
6928 {
6929 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
6930 uOffset, cbThisRead,
6931 &IoCtx, &cbThisRead);
6932 }
6933
6934 if (rc != VERR_VD_BLOCK_FREE)
6935 {
6936 if (RT_FAILURE(rc))
6937 break;
6938 rc = vdWriteHelper(pDisk, pImageTo, uOffset, pvBuf,
6939 cbThisRead, VDIOCTX_FLAGS_READ_UPDATE_CACHE);
6940 if (RT_FAILURE(rc))
6941 break;
6942 }
6943 else
6944 rc = VINF_SUCCESS;
6945
6946 rc2 = vdThreadFinishWrite(pDisk);
6947 AssertRC(rc2);
6948 fLockWrite = false;
6949
6950 uOffset += cbThisRead;
6951 cbRemaining -= cbThisRead;
6952
6953 if (pIfProgress && pIfProgress->pfnProgress)
6954 {
6955 /** @todo r=klaus: this can update the progress to the same
6956 * percentage over and over again if the image format makes
6957 * relatively small increments. */
6958 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
6959 uOffset * 99 / cbSize);
6960 if (RT_FAILURE(rc))
6961 break;
6962 }
6963 } while (uOffset < cbSize);
6964
6965 /* In case we set up a "write proxy" image above we must clear
6966 * this again now to prevent stray writes. Failure or not. */
6967 if (!pImageFrom->pNext)
6968 {
6969 /* Take the write lock. */
6970 rc2 = vdThreadStartWrite(pDisk);
6971 AssertRC(rc2);
6972 fLockWrite = true;
6973
6974 pDisk->pImageRelay = NULL;
6975
6976 rc2 = vdThreadFinishWrite(pDisk);
6977 AssertRC(rc2);
6978 fLockWrite = false;
6979 }
6980 }
6981
6982 /*
6983 * Leave in case of an error to avoid corrupted data in the image chain
6984 * (includes cancelling the operation by the user).
6985 */
6986 if (RT_FAILURE(rc))
6987 break;
6988
6989 /* Need to hold the write lock while finishing the merge. */
6990 rc2 = vdThreadStartWrite(pDisk);
6991 AssertRC(rc2);
6992 fLockWrite = true;
6993
6994 /* Update parent UUID so that image chain is consistent.
6995 * The two attempts work around the problem that some backends
6996 * (e.g. iSCSI) do not support UUIDs, so we exploit the fact that
6997 * so far there can only be one such image in the chain. */
6998 /** @todo needs a better long-term solution, passing the UUID
6999 * knowledge from the caller or some such */
7000 RTUUID Uuid;
7001 PVDIMAGE pImageChild = NULL;
7002 if (nImageFrom < nImageTo)
7003 {
7004 if (pImageFrom->pPrev)
7005 {
7006 /* plan A: ask the parent itself for its UUID */
7007 rc = pImageFrom->pPrev->Backend->pfnGetUuid(pImageFrom->pPrev->pBackendData,
7008 &Uuid);
7009 if (RT_FAILURE(rc))
7010 {
7011 /* plan B: ask the child of the parent for parent UUID */
7012 rc = pImageFrom->Backend->pfnGetParentUuid(pImageFrom->pBackendData,
7013 &Uuid);
7014 }
7015 AssertRC(rc);
7016 }
7017 else
7018 RTUuidClear(&Uuid);
7019 rc = pImageTo->Backend->pfnSetParentUuid(pImageTo->pBackendData,
7020 &Uuid);
7021 AssertRC(rc);
7022 }
7023 else
7024 {
7025 /* Update the parent uuid of the child of the last merged image. */
7026 if (pImageFrom->pNext)
7027 {
7028 /* plan A: ask the parent itself for its UUID */
7029 rc = pImageTo->Backend->pfnGetUuid(pImageTo->pBackendData,
7030 &Uuid);
7031 if (RT_FAILURE(rc))
7032 {
7033 /* plan B: ask the child of the parent for parent UUID */
7034 rc = pImageTo->pNext->Backend->pfnGetParentUuid(pImageTo->pNext->pBackendData,
7035 &Uuid);
7036 }
7037 AssertRC(rc);
7038
7039 rc = pImageFrom->Backend->pfnSetParentUuid(pImageFrom->pNext->pBackendData,
7040 &Uuid);
7041 AssertRC(rc);
7042
7043 pImageChild = pImageFrom->pNext;
7044 }
7045 }
7046
7047 /* Delete the no longer needed images. */
7048 PVDIMAGE pImg = pImageFrom, pTmp;
7049 while (pImg != pImageTo)
7050 {
7051 if (nImageFrom < nImageTo)
7052 pTmp = pImg->pNext;
7053 else
7054 pTmp = pImg->pPrev;
7055 vdRemoveImageFromList(pDisk, pImg);
7056 pImg->Backend->pfnClose(pImg->pBackendData, true);
7057 RTMemFree(pImg->pszFilename);
7058 RTMemFree(pImg);
7059 pImg = pTmp;
7060 }
7061
7062 /* Make sure destination image is back to read only if necessary. */
7063 if (pImageTo != pDisk->pLast)
7064 {
7065 uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7066 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7067 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7068 uOpenFlags);
7069 if (RT_FAILURE(rc))
7070 break;
7071 }
7072
7073 /*
7074 * Make sure the child is readonly
7075 * for the child -> parent merge direction
7076 * if necessary.
7077 */
7078 if ( nImageFrom > nImageTo
7079 && pImageChild
7080 && pImageChild != pDisk->pLast)
7081 {
7082 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7083 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7084 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7085 uOpenFlags);
7086 if (RT_FAILURE(rc))
7087 break;
7088 }
7089 } while (0);
7090
7091 if (RT_UNLIKELY(fLockWrite))
7092 {
7093 rc2 = vdThreadFinishWrite(pDisk);
7094 AssertRC(rc2);
7095 }
7096 else if (RT_UNLIKELY(fLockRead))
7097 {
7098 rc2 = vdThreadFinishRead(pDisk);
7099 AssertRC(rc2);
7100 }
7101
7102 if (pvBuf)
7103 RTMemTmpFree(pvBuf);
7104
7105 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7106 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7107
7108 LogFlowFunc(("returns %Rrc\n", rc));
7109 return rc;
7110}
7111
7112/**
7113 * Copies an image from one HDD container to another - extended version.
7114 * The copy is opened in the target HDD container.
7115 * It is possible to convert between different image formats, because the
7116 * backend for the destination may be different from the source.
7117 * If both the source and destination reference the same HDD container,
7118 * then the image is moved (by copying/deleting or renaming) to the new location.
7119 * The source container is unchanged if the move operation fails, otherwise
7120 * the image at the new location is opened in the same way as the old one was.
7121 *
7122 * @note The read/write accesses across disks are not synchronized, just the
7123 * accesses to each disk. Once there is a use case which requires a defined
7124 * read/write behavior in this situation this needs to be extended.
7125 *
7126 * @return VBox status code.
7127 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7128 * @param pDiskFrom Pointer to source HDD container.
7129 * @param nImage Image number, counts from 0. 0 is always base image of container.
7130 * @param pDiskTo Pointer to destination HDD container.
7131 * @param pszBackend Name of the image file backend to use (may be NULL to use the same as the source, case insensitive).
7132 * @param pszFilename New name of the image (may be NULL to specify that the
7133 * copy destination is the destination container, or
7134 * if pDiskFrom == pDiskTo, i.e. when moving).
7135 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7136 * @param cbSize New image size (0 means leave unchanged).
7137 * @param nImageSameFrom todo
7138 * @param nImageSameTo todo
7139 * @param uImageFlags Flags specifying special destination image features.
7140 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7141 * This parameter is used if and only if a true copy is created.
7142 * In all rename/move cases or copy to existing image cases the modification UUIDs are copied over.
7143 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7144 * Only used if the destination image is created.
7145 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7146 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7147 * destination image.
7148 * @param pDstVDIfsOperation Pointer to the per-operation VD interface list,
7149 * for the destination operation.
7150 */
7151VBOXDDU_DECL(int) VDCopyEx(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
7152 const char *pszBackend, const char *pszFilename,
7153 bool fMoveByRename, uint64_t cbSize,
7154 unsigned nImageFromSame, unsigned nImageToSame,
7155 unsigned uImageFlags, PCRTUUID pDstUuid,
7156 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7157 PVDINTERFACE pDstVDIfsImage,
7158 PVDINTERFACE pDstVDIfsOperation)
7159{
7160 int rc = VINF_SUCCESS;
7161 int rc2;
7162 bool fLockReadFrom = false, fLockWriteFrom = false, fLockWriteTo = false;
7163 PVDIMAGE pImageTo = NULL;
7164
7165 LogFlowFunc(("pDiskFrom=%#p nImage=%u pDiskTo=%#p pszBackend=\"%s\" pszFilename=\"%s\" fMoveByRename=%d cbSize=%llu nImageFromSame=%u nImageToSame=%u uImageFlags=%#x pDstUuid=%#p uOpenFlags=%#x pVDIfsOperation=%#p pDstVDIfsImage=%#p pDstVDIfsOperation=%#p\n",
7166 pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename, cbSize, nImageFromSame, nImageToSame, uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation, pDstVDIfsImage, pDstVDIfsOperation));
7167
7168 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7169 PVDINTERFACEPROGRESS pDstIfProgress = VDIfProgressGet(pDstVDIfsOperation);
7170
7171 do {
7172 /* Check arguments. */
7173 AssertMsgBreakStmt(VALID_PTR(pDiskFrom), ("pDiskFrom=%#p\n", pDiskFrom),
7174 rc = VERR_INVALID_PARAMETER);
7175 AssertMsg(pDiskFrom->u32Signature == VBOXHDDDISK_SIGNATURE,
7176 ("u32Signature=%08x\n", pDiskFrom->u32Signature));
7177
7178 rc2 = vdThreadStartRead(pDiskFrom);
7179 AssertRC(rc2);
7180 fLockReadFrom = true;
7181 PVDIMAGE pImageFrom = vdGetImageByNumber(pDiskFrom, nImage);
7182 AssertPtrBreakStmt(pImageFrom, rc = VERR_VD_IMAGE_NOT_FOUND);
7183 AssertMsgBreakStmt(VALID_PTR(pDiskTo), ("pDiskTo=%#p\n", pDiskTo),
7184 rc = VERR_INVALID_PARAMETER);
7185 AssertMsg(pDiskTo->u32Signature == VBOXHDDDISK_SIGNATURE,
7186 ("u32Signature=%08x\n", pDiskTo->u32Signature));
7187 AssertMsgBreakStmt( (nImageFromSame < nImage || nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7188 && (nImageToSame < pDiskTo->cImages || nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7189 && ( (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN && nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7190 || (nImageFromSame != VD_IMAGE_CONTENT_UNKNOWN && nImageToSame != VD_IMAGE_CONTENT_UNKNOWN)),
7191 ("nImageFromSame=%u nImageToSame=%u\n", nImageFromSame, nImageToSame),
7192 rc = VERR_INVALID_PARAMETER);
7193
7194 /* Move the image. */
7195 if (pDiskFrom == pDiskTo)
7196 {
7197 /* Rename only works when backends are the same, are file based
7198 * and the rename method is implemented. */
7199 if ( fMoveByRename
7200 && !RTStrICmp(pszBackend, pImageFrom->Backend->pszBackendName)
7201 && pImageFrom->Backend->uBackendCaps & VD_CAP_FILE
7202 && pImageFrom->Backend->pfnRename)
7203 {
7204 rc2 = vdThreadFinishRead(pDiskFrom);
7205 AssertRC(rc2);
7206 fLockReadFrom = false;
7207
7208 rc2 = vdThreadStartWrite(pDiskFrom);
7209 AssertRC(rc2);
7210 fLockWriteFrom = true;
7211 rc = pImageFrom->Backend->pfnRename(pImageFrom->pBackendData, pszFilename ? pszFilename : pImageFrom->pszFilename);
7212 break;
7213 }
7214
7215 /** @todo Moving (including shrinking/growing) of the image is
7216 * requested, but the rename attempt failed or it wasn't possible.
7217 * Must now copy image to temp location. */
7218 AssertReleaseMsgFailed(("VDCopy: moving by copy/delete not implemented\n"));
7219 }
7220
7221 /* pszFilename is allowed to be NULL, as this indicates copy to the existing image. */
7222 AssertMsgBreakStmt(pszFilename == NULL || (VALID_PTR(pszFilename) && *pszFilename),
7223 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
7224 rc = VERR_INVALID_PARAMETER);
7225
7226 uint64_t cbSizeFrom;
7227 cbSizeFrom = pImageFrom->Backend->pfnGetSize(pImageFrom->pBackendData);
7228 if (cbSizeFrom == 0)
7229 {
7230 rc = VERR_VD_VALUE_NOT_FOUND;
7231 break;
7232 }
7233
7234 VDGEOMETRY PCHSGeometryFrom = {0, 0, 0};
7235 VDGEOMETRY LCHSGeometryFrom = {0, 0, 0};
7236 pImageFrom->Backend->pfnGetPCHSGeometry(pImageFrom->pBackendData, &PCHSGeometryFrom);
7237 pImageFrom->Backend->pfnGetLCHSGeometry(pImageFrom->pBackendData, &LCHSGeometryFrom);
7238
7239 RTUUID ImageUuid, ImageModificationUuid;
7240 if (pDiskFrom != pDiskTo)
7241 {
7242 if (pDstUuid)
7243 ImageUuid = *pDstUuid;
7244 else
7245 RTUuidCreate(&ImageUuid);
7246 }
7247 else
7248 {
7249 rc = pImageFrom->Backend->pfnGetUuid(pImageFrom->pBackendData, &ImageUuid);
7250 if (RT_FAILURE(rc))
7251 RTUuidCreate(&ImageUuid);
7252 }
7253 rc = pImageFrom->Backend->pfnGetModificationUuid(pImageFrom->pBackendData, &ImageModificationUuid);
7254 if (RT_FAILURE(rc))
7255 RTUuidClear(&ImageModificationUuid);
7256
7257 char szComment[1024];
7258 rc = pImageFrom->Backend->pfnGetComment(pImageFrom->pBackendData, szComment, sizeof(szComment));
7259 if (RT_FAILURE(rc))
7260 szComment[0] = '\0';
7261 else
7262 szComment[sizeof(szComment) - 1] = '\0';
7263
7264 rc2 = vdThreadFinishRead(pDiskFrom);
7265 AssertRC(rc2);
7266 fLockReadFrom = false;
7267
7268 rc2 = vdThreadStartRead(pDiskTo);
7269 AssertRC(rc2);
7270 unsigned cImagesTo = pDiskTo->cImages;
7271 rc2 = vdThreadFinishRead(pDiskTo);
7272 AssertRC(rc2);
7273
7274 if (pszFilename)
7275 {
7276 if (cbSize == 0)
7277 cbSize = cbSizeFrom;
7278
7279 /* Create destination image with the properties of source image. */
7280 /** @todo replace the VDCreateDiff/VDCreateBase calls by direct
7281 * calls to the backend. Unifies the code and reduces the API
7282 * dependencies. Would also make the synchronization explicit. */
7283 if (cImagesTo > 0)
7284 {
7285 rc = VDCreateDiff(pDiskTo, pszBackend, pszFilename,
7286 uImageFlags, szComment, &ImageUuid,
7287 NULL /* pParentUuid */,
7288 uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7289 pDstVDIfsImage, NULL);
7290
7291 rc2 = vdThreadStartWrite(pDiskTo);
7292 AssertRC(rc2);
7293 fLockWriteTo = true;
7294 } else {
7295 /** @todo hack to force creation of a fixed image for
7296 * the RAW backend, which can't handle anything else. */
7297 if (!RTStrICmp(pszBackend, "RAW"))
7298 uImageFlags |= VD_IMAGE_FLAGS_FIXED;
7299
7300 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7301 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7302
7303 rc = VDCreateBase(pDiskTo, pszBackend, pszFilename, cbSize,
7304 uImageFlags, szComment,
7305 &PCHSGeometryFrom, &LCHSGeometryFrom,
7306 NULL, uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7307 pDstVDIfsImage, NULL);
7308
7309 rc2 = vdThreadStartWrite(pDiskTo);
7310 AssertRC(rc2);
7311 fLockWriteTo = true;
7312
7313 if (RT_SUCCESS(rc) && !RTUuidIsNull(&ImageUuid))
7314 pDiskTo->pLast->Backend->pfnSetUuid(pDiskTo->pLast->pBackendData, &ImageUuid);
7315 }
7316 if (RT_FAILURE(rc))
7317 break;
7318
7319 pImageTo = pDiskTo->pLast;
7320 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7321
7322 cbSize = RT_MIN(cbSize, cbSizeFrom);
7323 }
7324 else
7325 {
7326 pImageTo = pDiskTo->pLast;
7327 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7328
7329 uint64_t cbSizeTo;
7330 cbSizeTo = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
7331 if (cbSizeTo == 0)
7332 {
7333 rc = VERR_VD_VALUE_NOT_FOUND;
7334 break;
7335 }
7336
7337 if (cbSize == 0)
7338 cbSize = RT_MIN(cbSizeFrom, cbSizeTo);
7339
7340 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7341 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7342
7343 /* Update the geometry in the destination image. */
7344 pImageTo->Backend->pfnSetPCHSGeometry(pImageTo->pBackendData, &PCHSGeometryFrom);
7345 pImageTo->Backend->pfnSetLCHSGeometry(pImageTo->pBackendData, &LCHSGeometryFrom);
7346 }
7347
7348 rc2 = vdThreadFinishWrite(pDiskTo);
7349 AssertRC(rc2);
7350 fLockWriteTo = false;
7351
7352 /* Whether we can take the optimized copy path (false) or not.
7353 * Don't optimize if the image existed or if it is a child image. */
7354 bool fSuppressRedundantIo = ( !(pszFilename == NULL || cImagesTo > 0)
7355 || (nImageToSame != VD_IMAGE_CONTENT_UNKNOWN));
7356 unsigned cImagesFromReadBack, cImagesToReadBack;
7357
7358 if (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7359 cImagesFromReadBack = 0;
7360 else
7361 {
7362 if (nImage == VD_LAST_IMAGE)
7363 cImagesFromReadBack = pDiskFrom->cImages - nImageFromSame - 1;
7364 else
7365 cImagesFromReadBack = nImage - nImageFromSame;
7366 }
7367
7368 if (nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7369 cImagesToReadBack = 0;
7370 else
7371 cImagesToReadBack = pDiskTo->cImages - nImageToSame - 1;
7372
7373 /* Copy the data. */
7374 rc = vdCopyHelper(pDiskFrom, pImageFrom, pDiskTo, cbSize,
7375 cImagesFromReadBack, cImagesToReadBack,
7376 fSuppressRedundantIo, pIfProgress, pDstIfProgress);
7377
7378 if (RT_SUCCESS(rc))
7379 {
7380 rc2 = vdThreadStartWrite(pDiskTo);
7381 AssertRC(rc2);
7382 fLockWriteTo = true;
7383
7384 /* Only set modification UUID if it is non-null, since the source
7385 * backend might not provide a valid modification UUID. */
7386 if (!RTUuidIsNull(&ImageModificationUuid))
7387 pImageTo->Backend->pfnSetModificationUuid(pImageTo->pBackendData, &ImageModificationUuid);
7388
7389 /* Set the requested open flags if they differ from the value
7390 * required for creating the image and copying the contents. */
7391 if ( pImageTo && pszFilename
7392 && uOpenFlags != (uOpenFlags & ~VD_OPEN_FLAGS_READONLY))
7393 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7394 uOpenFlags);
7395 }
7396 } while (0);
7397
7398 if (RT_FAILURE(rc) && pImageTo && pszFilename)
7399 {
7400 /* Take the write lock only if it is not taken. Not worth making the
7401 * above code even more complicated. */
7402 if (RT_UNLIKELY(!fLockWriteTo))
7403 {
7404 rc2 = vdThreadStartWrite(pDiskTo);
7405 AssertRC(rc2);
7406 fLockWriteTo = true;
7407 }
7408 /* Error detected, but new image created. Remove image from list. */
7409 vdRemoveImageFromList(pDiskTo, pImageTo);
7410
7411 /* Close and delete image. */
7412 rc2 = pImageTo->Backend->pfnClose(pImageTo->pBackendData, true);
7413 AssertRC(rc2);
7414 pImageTo->pBackendData = NULL;
7415
7416 /* Free remaining resources. */
7417 if (pImageTo->pszFilename)
7418 RTStrFree(pImageTo->pszFilename);
7419
7420 RTMemFree(pImageTo);
7421 }
7422
7423 if (RT_UNLIKELY(fLockWriteTo))
7424 {
7425 rc2 = vdThreadFinishWrite(pDiskTo);
7426 AssertRC(rc2);
7427 }
7428 if (RT_UNLIKELY(fLockWriteFrom))
7429 {
7430 rc2 = vdThreadFinishWrite(pDiskFrom);
7431 AssertRC(rc2);
7432 }
7433 else if (RT_UNLIKELY(fLockReadFrom))
7434 {
7435 rc2 = vdThreadFinishRead(pDiskFrom);
7436 AssertRC(rc2);
7437 }
7438
7439 if (RT_SUCCESS(rc))
7440 {
7441 if (pIfProgress && pIfProgress->pfnProgress)
7442 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7443 if (pDstIfProgress && pDstIfProgress->pfnProgress)
7444 pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser, 100);
7445 }
7446
7447 LogFlowFunc(("returns %Rrc\n", rc));
7448 return rc;
7449}
7450
7451/**
7452 * Copies an image from one HDD container to another.
7453 * The copy is opened in the target HDD container.
7454 * It is possible to convert between different image formats, because the
7455 * backend for the destination may be different from the source.
7456 * If both the source and destination reference the same HDD container,
7457 * then the image is moved (by copying/deleting or renaming) to the new location.
7458 * The source container is unchanged if the move operation fails, otherwise
7459 * the image at the new location is opened in the same way as the old one was.
7460 *
7461 * @returns VBox status code.
7462 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7463 * @param pDiskFrom Pointer to source HDD container.
7464 * @param nImage Image number, counts from 0. 0 is always base image of container.
7465 * @param pDiskTo Pointer to destination HDD container.
7466 * @param pszBackend Name of the image file backend to use.
7467 * @param pszFilename New name of the image (may be NULL if pDiskFrom == pDiskTo).
7468 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7469 * @param cbSize New image size (0 means leave unchanged).
7470 * @param uImageFlags Flags specifying special destination image features.
7471 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7472 * This parameter is used if and only if a true copy is created.
7473 * In all rename/move cases the UUIDs are copied over.
7474 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7475 * Only used if the destination image is created.
7476 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7477 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7478 * destination image.
7479 * @param pDstVDIfsOperation Pointer to the per-image VD interface list,
7480 * for the destination image.
7481 */
7482VBOXDDU_DECL(int) VDCopy(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
7483 const char *pszBackend, const char *pszFilename,
7484 bool fMoveByRename, uint64_t cbSize,
7485 unsigned uImageFlags, PCRTUUID pDstUuid,
7486 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7487 PVDINTERFACE pDstVDIfsImage,
7488 PVDINTERFACE pDstVDIfsOperation)
7489{
7490 return VDCopyEx(pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename,
7491 cbSize, VD_IMAGE_CONTENT_UNKNOWN, VD_IMAGE_CONTENT_UNKNOWN,
7492 uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation,
7493 pDstVDIfsImage, pDstVDIfsOperation);
7494}
7495
7496/**
7497 * Optimizes the storage consumption of an image. Typically the unused blocks
7498 * have to be wiped with zeroes to achieve a substantial reduced storage use.
7499 * Another optimization done is reordering the image blocks, which can provide
7500 * a significant performance boost, as reads and writes tend to use less random
7501 * file offsets.
7502 *
7503 * @return VBox status code.
7504 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7505 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7506 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7507 * the code for this isn't implemented yet.
7508 * @param pDisk Pointer to HDD container.
7509 * @param nImage Image number, counts from 0. 0 is always base image of container.
7510 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7511 */
7512VBOXDDU_DECL(int) VDCompact(PVBOXHDD pDisk, unsigned nImage,
7513 PVDINTERFACE pVDIfsOperation)
7514{
7515 int rc = VINF_SUCCESS;
7516 int rc2;
7517 bool fLockRead = false, fLockWrite = false;
7518 void *pvBuf = NULL;
7519 void *pvTmp = NULL;
7520
7521 LogFlowFunc(("pDisk=%#p nImage=%u pVDIfsOperation=%#p\n",
7522 pDisk, nImage, pVDIfsOperation));
7523
7524 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7525
7526 do {
7527 /* Check arguments. */
7528 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7529 rc = VERR_INVALID_PARAMETER);
7530 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
7531 ("u32Signature=%08x\n", pDisk->u32Signature));
7532
7533 rc2 = vdThreadStartRead(pDisk);
7534 AssertRC(rc2);
7535 fLockRead = true;
7536
7537 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
7538 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
7539
7540 /* If there is no compact callback for not file based backends then
7541 * the backend doesn't need compaction. No need to make much fuss about
7542 * this. For file based ones signal this as not yet supported. */
7543 if (!pImage->Backend->pfnCompact)
7544 {
7545 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7546 rc = VERR_NOT_SUPPORTED;
7547 else
7548 rc = VINF_SUCCESS;
7549 break;
7550 }
7551
7552 /* Insert interface for reading parent state into per-operation list,
7553 * if there is a parent image. */
7554 VDINTERFACEPARENTSTATE VDIfParent;
7555 VDPARENTSTATEDESC ParentUser;
7556 if (pImage->pPrev)
7557 {
7558 VDIfParent.pfnParentRead = vdParentRead;
7559 ParentUser.pDisk = pDisk;
7560 ParentUser.pImage = pImage->pPrev;
7561 rc = VDInterfaceAdd(&VDIfParent.Core, "VDCompact_ParentState", VDINTERFACETYPE_PARENTSTATE,
7562 &ParentUser, sizeof(VDINTERFACEPARENTSTATE), &pVDIfsOperation);
7563 AssertRC(rc);
7564 }
7565
7566 rc2 = vdThreadFinishRead(pDisk);
7567 AssertRC(rc2);
7568 fLockRead = false;
7569
7570 rc2 = vdThreadStartWrite(pDisk);
7571 AssertRC(rc2);
7572 fLockWrite = true;
7573
7574 rc = pImage->Backend->pfnCompact(pImage->pBackendData,
7575 0, 99,
7576 pDisk->pVDIfsDisk,
7577 pImage->pVDIfsImage,
7578 pVDIfsOperation);
7579 } while (0);
7580
7581 if (RT_UNLIKELY(fLockWrite))
7582 {
7583 rc2 = vdThreadFinishWrite(pDisk);
7584 AssertRC(rc2);
7585 }
7586 else if (RT_UNLIKELY(fLockRead))
7587 {
7588 rc2 = vdThreadFinishRead(pDisk);
7589 AssertRC(rc2);
7590 }
7591
7592 if (pvBuf)
7593 RTMemTmpFree(pvBuf);
7594 if (pvTmp)
7595 RTMemTmpFree(pvTmp);
7596
7597 if (RT_SUCCESS(rc))
7598 {
7599 if (pIfProgress && pIfProgress->pfnProgress)
7600 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7601 }
7602
7603 LogFlowFunc(("returns %Rrc\n", rc));
7604 return rc;
7605}
7606
7607/**
7608 * Resizes the given disk image to the given size.
7609 *
7610 * @return VBox status
7611 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7612 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7613 *
7614 * @param pDisk Pointer to the HDD container.
7615 * @param cbSize New size of the image.
7616 * @param pPCHSGeometry Pointer to the new physical disk geometry <= (16383,16,63). Not NULL.
7617 * @param pLCHSGeometry Pointer to the new logical disk geometry <= (x,255,63). Not NULL.
7618 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7619 */
7620VBOXDDU_DECL(int) VDResize(PVBOXHDD pDisk, uint64_t cbSize,
7621 PCVDGEOMETRY pPCHSGeometry,
7622 PCVDGEOMETRY pLCHSGeometry,
7623 PVDINTERFACE pVDIfsOperation)
7624{
7625 /** @todo r=klaus resizing was designed to be part of VDCopy, so having a separate function is not desirable. */
7626 int rc = VINF_SUCCESS;
7627 int rc2;
7628 bool fLockRead = false, fLockWrite = false;
7629
7630 LogFlowFunc(("pDisk=%#p cbSize=%llu pVDIfsOperation=%#p\n",
7631 pDisk, cbSize, pVDIfsOperation));
7632
7633 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7634
7635 do {
7636 /* Check arguments. */
7637 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7638 rc = VERR_INVALID_PARAMETER);
7639 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
7640 ("u32Signature=%08x\n", pDisk->u32Signature));
7641
7642 rc2 = vdThreadStartRead(pDisk);
7643 AssertRC(rc2);
7644 fLockRead = true;
7645
7646 /* Must have at least one image in the chain, will resize last. */
7647 AssertMsgBreakStmt(pDisk->cImages >= 1, ("cImages=%u\n", pDisk->cImages),
7648 rc = VERR_NOT_SUPPORTED);
7649
7650 PVDIMAGE pImage = pDisk->pLast;
7651
7652 /* If there is no compact callback for not file based backends then
7653 * the backend doesn't need compaction. No need to make much fuss about
7654 * this. For file based ones signal this as not yet supported. */
7655 if (!pImage->Backend->pfnResize)
7656 {
7657 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7658 rc = VERR_NOT_SUPPORTED;
7659 else
7660 rc = VINF_SUCCESS;
7661 break;
7662 }
7663
7664 rc2 = vdThreadFinishRead(pDisk);
7665 AssertRC(rc2);
7666 fLockRead = false;
7667
7668 rc2 = vdThreadStartWrite(pDisk);
7669 AssertRC(rc2);
7670 fLockWrite = true;
7671
7672 VDGEOMETRY PCHSGeometryOld;
7673 VDGEOMETRY LCHSGeometryOld;
7674 PCVDGEOMETRY pPCHSGeometryNew;
7675 PCVDGEOMETRY pLCHSGeometryNew;
7676
7677 if (pPCHSGeometry->cCylinders == 0)
7678 {
7679 /* Auto-detect marker, calculate new value ourself. */
7680 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData, &PCHSGeometryOld);
7681 if (RT_SUCCESS(rc) && (PCHSGeometryOld.cCylinders != 0))
7682 PCHSGeometryOld.cCylinders = RT_MIN(cbSize / 512 / PCHSGeometryOld.cHeads / PCHSGeometryOld.cSectors, 16383);
7683 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7684 rc = VINF_SUCCESS;
7685
7686 pPCHSGeometryNew = &PCHSGeometryOld;
7687 }
7688 else
7689 pPCHSGeometryNew = pPCHSGeometry;
7690
7691 if (pLCHSGeometry->cCylinders == 0)
7692 {
7693 /* Auto-detect marker, calculate new value ourself. */
7694 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData, &LCHSGeometryOld);
7695 if (RT_SUCCESS(rc) && (LCHSGeometryOld.cCylinders != 0))
7696 LCHSGeometryOld.cCylinders = cbSize / 512 / LCHSGeometryOld.cHeads / LCHSGeometryOld.cSectors;
7697 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7698 rc = VINF_SUCCESS;
7699
7700 pLCHSGeometryNew = &LCHSGeometryOld;
7701 }
7702 else
7703 pLCHSGeometryNew = pLCHSGeometry;
7704
7705 if (RT_SUCCESS(rc))
7706 rc = pImage->Backend->pfnResize(pImage->pBackendData,
7707 cbSize,
7708 pPCHSGeometryNew,
7709 pLCHSGeometryNew,
7710 0, 99,
7711 pDisk->pVDIfsDisk,
7712 pImage->pVDIfsImage,
7713 pVDIfsOperation);
7714 } while (0);
7715
7716 if (RT_UNLIKELY(fLockWrite))
7717 {
7718 rc2 = vdThreadFinishWrite(pDisk);
7719 AssertRC(rc2);
7720 }
7721 else if (RT_UNLIKELY(fLockRead))
7722 {
7723 rc2 = vdThreadFinishRead(pDisk);
7724 AssertRC(rc2);
7725 }
7726
7727 if (RT_SUCCESS(rc))
7728 {
7729 if (pIfProgress && pIfProgress->pfnProgress)
7730 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7731
7732 pDisk->cbSize = cbSize;
7733 }
7734
7735 LogFlowFunc(("returns %Rrc\n", rc));
7736 return rc;
7737}
7738
7739/**
7740 * Closes the last opened image file in HDD container.
7741 * If previous image file was opened in read-only mode (the normal case) and
7742 * the last opened image is in read-write mode then the previous image will be
7743 * reopened in read/write mode.
7744 *
7745 * @returns VBox status code.
7746 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
7747 * @param pDisk Pointer to HDD container.
7748 * @param fDelete If true, delete the image from the host disk.
7749 */
7750VBOXDDU_DECL(int) VDClose(PVBOXHDD pDisk, bool fDelete)
7751{
7752 int rc = VINF_SUCCESS;
7753 int rc2;
7754 bool fLockWrite = false;
7755
7756 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
7757 do
7758 {
7759 /* sanity check */
7760 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7761 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7762
7763 /* Not worth splitting this up into a read lock phase and write
7764 * lock phase, as closing an image is a relatively fast operation
7765 * dominated by the part which needs the write lock. */
7766 rc2 = vdThreadStartWrite(pDisk);
7767 AssertRC(rc2);
7768 fLockWrite = true;
7769
7770 PVDIMAGE pImage = pDisk->pLast;
7771 if (!pImage)
7772 {
7773 rc = VERR_VD_NOT_OPENED;
7774 break;
7775 }
7776
7777 /* Destroy the current discard state first which might still have pending blocks. */
7778 rc = vdDiscardStateDestroy(pDisk);
7779 if (RT_FAILURE(rc))
7780 break;
7781
7782 unsigned uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
7783 /* Remove image from list of opened images. */
7784 vdRemoveImageFromList(pDisk, pImage);
7785 /* Close (and optionally delete) image. */
7786 rc = pImage->Backend->pfnClose(pImage->pBackendData, fDelete);
7787 /* Free remaining resources related to the image. */
7788 RTStrFree(pImage->pszFilename);
7789 RTMemFree(pImage);
7790
7791 pImage = pDisk->pLast;
7792 if (!pImage)
7793 break;
7794
7795 /* If disk was previously in read/write mode, make sure it will stay
7796 * like this (if possible) after closing this image. Set the open flags
7797 * accordingly. */
7798 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
7799 {
7800 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
7801 uOpenFlags &= ~ VD_OPEN_FLAGS_READONLY;
7802 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
7803 }
7804
7805 /* Cache disk information. */
7806 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
7807
7808 /* Cache PCHS geometry. */
7809 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
7810 &pDisk->PCHSGeometry);
7811 if (RT_FAILURE(rc2))
7812 {
7813 pDisk->PCHSGeometry.cCylinders = 0;
7814 pDisk->PCHSGeometry.cHeads = 0;
7815 pDisk->PCHSGeometry.cSectors = 0;
7816 }
7817 else
7818 {
7819 /* Make sure the PCHS geometry is properly clipped. */
7820 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
7821 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
7822 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
7823 }
7824
7825 /* Cache LCHS geometry. */
7826 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
7827 &pDisk->LCHSGeometry);
7828 if (RT_FAILURE(rc2))
7829 {
7830 pDisk->LCHSGeometry.cCylinders = 0;
7831 pDisk->LCHSGeometry.cHeads = 0;
7832 pDisk->LCHSGeometry.cSectors = 0;
7833 }
7834 else
7835 {
7836 /* Make sure the LCHS geometry is properly clipped. */
7837 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
7838 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
7839 }
7840 } while (0);
7841
7842 if (RT_UNLIKELY(fLockWrite))
7843 {
7844 rc2 = vdThreadFinishWrite(pDisk);
7845 AssertRC(rc2);
7846 }
7847
7848 LogFlowFunc(("returns %Rrc\n", rc));
7849 return rc;
7850}
7851
7852/**
7853 * Closes the currently opened cache image file in HDD container.
7854 *
7855 * @return VBox status code.
7856 * @return VERR_VD_NOT_OPENED if no cache is opened in HDD container.
7857 * @param pDisk Pointer to HDD container.
7858 * @param fDelete If true, delete the image from the host disk.
7859 */
7860VBOXDDU_DECL(int) VDCacheClose(PVBOXHDD pDisk, bool fDelete)
7861{
7862 int rc = VINF_SUCCESS;
7863 int rc2;
7864 bool fLockWrite = false;
7865 PVDCACHE pCache = NULL;
7866
7867 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
7868
7869 do
7870 {
7871 /* sanity check */
7872 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7873 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7874
7875 rc2 = vdThreadStartWrite(pDisk);
7876 AssertRC(rc2);
7877 fLockWrite = true;
7878
7879 AssertPtrBreakStmt(pDisk->pCache, rc = VERR_VD_CACHE_NOT_FOUND);
7880
7881 pCache = pDisk->pCache;
7882 pDisk->pCache = NULL;
7883
7884 pCache->Backend->pfnClose(pCache->pBackendData, fDelete);
7885 if (pCache->pszFilename)
7886 RTStrFree(pCache->pszFilename);
7887 RTMemFree(pCache);
7888 } while (0);
7889
7890 if (RT_LIKELY(fLockWrite))
7891 {
7892 rc2 = vdThreadFinishWrite(pDisk);
7893 AssertRC(rc2);
7894 }
7895
7896 LogFlowFunc(("returns %Rrc\n", rc));
7897 return rc;
7898}
7899
7900/**
7901 * Closes all opened image files in HDD container.
7902 *
7903 * @returns VBox status code.
7904 * @param pDisk Pointer to HDD container.
7905 */
7906VBOXDDU_DECL(int) VDCloseAll(PVBOXHDD pDisk)
7907{
7908 int rc = VINF_SUCCESS;
7909 int rc2;
7910 bool fLockWrite = false;
7911
7912 LogFlowFunc(("pDisk=%#p\n", pDisk));
7913 do
7914 {
7915 /* sanity check */
7916 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7917 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7918
7919 /* Lock the entire operation. */
7920 rc2 = vdThreadStartWrite(pDisk);
7921 AssertRC(rc2);
7922 fLockWrite = true;
7923
7924 PVDCACHE pCache = pDisk->pCache;
7925 if (pCache)
7926 {
7927 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
7928 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
7929 rc = rc2;
7930
7931 if (pCache->pszFilename)
7932 RTStrFree(pCache->pszFilename);
7933 RTMemFree(pCache);
7934 }
7935
7936 PVDIMAGE pImage = pDisk->pLast;
7937 while (VALID_PTR(pImage))
7938 {
7939 PVDIMAGE pPrev = pImage->pPrev;
7940 /* Remove image from list of opened images. */
7941 vdRemoveImageFromList(pDisk, pImage);
7942 /* Close image. */
7943 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
7944 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
7945 rc = rc2;
7946 /* Free remaining resources related to the image. */
7947 RTStrFree(pImage->pszFilename);
7948 RTMemFree(pImage);
7949 pImage = pPrev;
7950 }
7951 Assert(!VALID_PTR(pDisk->pLast));
7952 } while (0);
7953
7954 if (RT_UNLIKELY(fLockWrite))
7955 {
7956 rc2 = vdThreadFinishWrite(pDisk);
7957 AssertRC(rc2);
7958 }
7959
7960 LogFlowFunc(("returns %Rrc\n", rc));
7961 return rc;
7962}
7963
7964/**
7965 * Read data from virtual HDD.
7966 *
7967 * @returns VBox status code.
7968 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
7969 * @param pDisk Pointer to HDD container.
7970 * @param uOffset Offset of first reading byte from start of disk.
7971 * @param pvBuf Pointer to buffer for reading data.
7972 * @param cbRead Number of bytes to read.
7973 */
7974VBOXDDU_DECL(int) VDRead(PVBOXHDD pDisk, uint64_t uOffset, void *pvBuf,
7975 size_t cbRead)
7976{
7977 int rc = VINF_SUCCESS;
7978 int rc2;
7979 bool fLockRead = false;
7980
7981 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbRead=%zu\n",
7982 pDisk, uOffset, pvBuf, cbRead));
7983 do
7984 {
7985 /* sanity check */
7986 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7987 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7988
7989 /* Check arguments. */
7990 AssertMsgBreakStmt(VALID_PTR(pvBuf),
7991 ("pvBuf=%#p\n", pvBuf),
7992 rc = VERR_INVALID_PARAMETER);
7993 AssertMsgBreakStmt(cbRead,
7994 ("cbRead=%zu\n", cbRead),
7995 rc = VERR_INVALID_PARAMETER);
7996
7997 rc2 = vdThreadStartRead(pDisk);
7998 AssertRC(rc2);
7999 fLockRead = true;
8000
8001 PVDIMAGE pImage = pDisk->pLast;
8002 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8003
8004 if (uOffset + cbRead > pDisk->cbSize)
8005 {
8006 /* Floppy images might be smaller than the standard expected by
8007 the floppy controller code. So, we won't fail here. */
8008 AssertMsgBreakStmt(pDisk->enmType == VDTYPE_FLOPPY,
8009 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
8010 uOffset, cbRead, pDisk->cbSize),
8011 rc = VERR_EOF);
8012 memset(pvBuf, 0xf6, cbRead); /* f6h = format.com filler byte */
8013 if (uOffset >= pDisk->cbSize)
8014 break;
8015 cbRead = pDisk->cbSize - uOffset;
8016 }
8017
8018 rc = vdReadHelper(pDisk, pImage, uOffset, pvBuf, cbRead,
8019 true /* fUpdateCache */);
8020 } while (0);
8021
8022 if (RT_UNLIKELY(fLockRead))
8023 {
8024 rc2 = vdThreadFinishRead(pDisk);
8025 AssertRC(rc2);
8026 }
8027
8028 LogFlowFunc(("returns %Rrc\n", rc));
8029 return rc;
8030}
8031
8032/**
8033 * Write data to virtual HDD.
8034 *
8035 * @returns VBox status code.
8036 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8037 * @param pDisk Pointer to HDD container.
8038 * @param uOffset Offset of the first byte being
8039 * written from start of disk.
8040 * @param pvBuf Pointer to buffer for writing data.
8041 * @param cbWrite Number of bytes to write.
8042 */
8043VBOXDDU_DECL(int) VDWrite(PVBOXHDD pDisk, uint64_t uOffset, const void *pvBuf,
8044 size_t cbWrite)
8045{
8046 int rc = VINF_SUCCESS;
8047 int rc2;
8048 bool fLockWrite = false;
8049
8050 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbWrite=%zu\n",
8051 pDisk, uOffset, pvBuf, cbWrite));
8052 do
8053 {
8054 /* sanity check */
8055 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8056 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8057
8058 /* Check arguments. */
8059 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8060 ("pvBuf=%#p\n", pvBuf),
8061 rc = VERR_INVALID_PARAMETER);
8062 AssertMsgBreakStmt(cbWrite,
8063 ("cbWrite=%zu\n", cbWrite),
8064 rc = VERR_INVALID_PARAMETER);
8065
8066 rc2 = vdThreadStartWrite(pDisk);
8067 AssertRC(rc2);
8068 fLockWrite = true;
8069
8070 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
8071 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
8072 uOffset, cbWrite, pDisk->cbSize),
8073 rc = VERR_INVALID_PARAMETER);
8074
8075 PVDIMAGE pImage = pDisk->pLast;
8076 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8077
8078 vdSetModifiedFlag(pDisk);
8079 rc = vdWriteHelper(pDisk, pImage, uOffset, pvBuf, cbWrite,
8080 VDIOCTX_FLAGS_READ_UPDATE_CACHE);
8081 if (RT_FAILURE(rc))
8082 break;
8083
8084 /* If there is a merge (in the direction towards a parent) running
8085 * concurrently then we have to also "relay" the write to this parent,
8086 * as the merge position might be already past the position where
8087 * this write is going. The "context" of the write can come from the
8088 * natural chain, since merging either already did or will take care
8089 * of the "other" content which is might be needed to fill the block
8090 * to a full allocation size. The cache doesn't need to be touched
8091 * as this write is covered by the previous one. */
8092 if (RT_UNLIKELY(pDisk->pImageRelay))
8093 rc = vdWriteHelper(pDisk, pDisk->pImageRelay, uOffset,
8094 pvBuf, cbWrite, VDIOCTX_FLAGS_DEFAULT);
8095 } while (0);
8096
8097 if (RT_UNLIKELY(fLockWrite))
8098 {
8099 rc2 = vdThreadFinishWrite(pDisk);
8100 AssertRC(rc2);
8101 }
8102
8103 LogFlowFunc(("returns %Rrc\n", rc));
8104 return rc;
8105}
8106
8107/**
8108 * Make sure the on disk representation of a virtual HDD is up to date.
8109 *
8110 * @returns VBox status code.
8111 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8112 * @param pDisk Pointer to HDD container.
8113 */
8114VBOXDDU_DECL(int) VDFlush(PVBOXHDD pDisk)
8115{
8116 int rc = VINF_SUCCESS;
8117 int rc2;
8118 bool fLockWrite = false;
8119
8120 LogFlowFunc(("pDisk=%#p\n", pDisk));
8121 do
8122 {
8123 /* sanity check */
8124 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8125 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8126
8127 rc2 = vdThreadStartWrite(pDisk);
8128 AssertRC(rc2);
8129 fLockWrite = true;
8130
8131 PVDIMAGE pImage = pDisk->pLast;
8132 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8133
8134 PVDIOCTX pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_FLUSH, 0,
8135 0, pDisk->pLast, NULL,
8136 vdIoCtxSyncComplete, pDisk, NULL,
8137 NULL, vdFlushHelperAsync,
8138 VDIOCTX_FLAGS_SYNC);
8139
8140 if (!pIoCtx)
8141 {
8142 rc = VERR_NO_MEMORY;
8143 break;
8144 }
8145
8146 rc = vdIoCtxProcessSync(pIoCtx);
8147 } while (0);
8148
8149 if (RT_UNLIKELY(fLockWrite))
8150 {
8151 rc2 = vdThreadFinishWrite(pDisk);
8152 AssertRC(rc2);
8153 }
8154
8155 LogFlowFunc(("returns %Rrc\n", rc));
8156 return rc;
8157}
8158
8159/**
8160 * Get number of opened images in HDD container.
8161 *
8162 * @returns Number of opened images for HDD container. 0 if no images have been opened.
8163 * @param pDisk Pointer to HDD container.
8164 */
8165VBOXDDU_DECL(unsigned) VDGetCount(PVBOXHDD pDisk)
8166{
8167 unsigned cImages;
8168 int rc2;
8169 bool fLockRead = false;
8170
8171 LogFlowFunc(("pDisk=%#p\n", pDisk));
8172 do
8173 {
8174 /* sanity check */
8175 AssertPtrBreakStmt(pDisk, cImages = 0);
8176 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8177
8178 rc2 = vdThreadStartRead(pDisk);
8179 AssertRC(rc2);
8180 fLockRead = true;
8181
8182 cImages = pDisk->cImages;
8183 } while (0);
8184
8185 if (RT_UNLIKELY(fLockRead))
8186 {
8187 rc2 = vdThreadFinishRead(pDisk);
8188 AssertRC(rc2);
8189 }
8190
8191 LogFlowFunc(("returns %u\n", cImages));
8192 return cImages;
8193}
8194
8195/**
8196 * Get read/write mode of HDD container.
8197 *
8198 * @returns Virtual disk ReadOnly status.
8199 * @returns true if no image is opened in HDD container.
8200 * @param pDisk Pointer to HDD container.
8201 */
8202VBOXDDU_DECL(bool) VDIsReadOnly(PVBOXHDD pDisk)
8203{
8204 bool fReadOnly;
8205 int rc2;
8206 bool fLockRead = false;
8207
8208 LogFlowFunc(("pDisk=%#p\n", pDisk));
8209 do
8210 {
8211 /* sanity check */
8212 AssertPtrBreakStmt(pDisk, fReadOnly = false);
8213 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8214
8215 rc2 = vdThreadStartRead(pDisk);
8216 AssertRC(rc2);
8217 fLockRead = true;
8218
8219 PVDIMAGE pImage = pDisk->pLast;
8220 AssertPtrBreakStmt(pImage, fReadOnly = true);
8221
8222 unsigned uOpenFlags;
8223 uOpenFlags = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
8224 fReadOnly = !!(uOpenFlags & VD_OPEN_FLAGS_READONLY);
8225 } while (0);
8226
8227 if (RT_UNLIKELY(fLockRead))
8228 {
8229 rc2 = vdThreadFinishRead(pDisk);
8230 AssertRC(rc2);
8231 }
8232
8233 LogFlowFunc(("returns %d\n", fReadOnly));
8234 return fReadOnly;
8235}
8236
8237/**
8238 * Get sector size of an image in HDD container.
8239 *
8240 * @return Virtual disk sector size in bytes.
8241 * @return 0 if image with specified number was not opened.
8242 * @param pDisk Pointer to HDD container.
8243 * @param nImage Image number, counts from 0. 0 is always base image of container.
8244 */
8245VBOXDDU_DECL(uint32_t) VDGetSectorSize(PVBOXHDD pDisk, unsigned nImage)
8246{
8247 uint64_t cbSector;
8248 int rc2;
8249 bool fLockRead = false;
8250
8251 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8252 do
8253 {
8254 /* sanity check */
8255 AssertPtrBreakStmt(pDisk, cbSector = 0);
8256 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8257
8258 rc2 = vdThreadStartRead(pDisk);
8259 AssertRC(rc2);
8260 fLockRead = true;
8261
8262 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8263 AssertPtrBreakStmt(pImage, cbSector = 0);
8264 cbSector = pImage->Backend->pfnGetSectorSize(pImage->pBackendData);
8265 } while (0);
8266
8267 if (RT_UNLIKELY(fLockRead))
8268 {
8269 rc2 = vdThreadFinishRead(pDisk);
8270 AssertRC(rc2);
8271 }
8272
8273 LogFlowFunc(("returns %u\n", cbSector));
8274 return cbSector;
8275}
8276
8277/**
8278 * Get total capacity of an image in HDD container.
8279 *
8280 * @returns Virtual disk size in bytes.
8281 * @returns 0 if no image with specified number was not opened.
8282 * @param pDisk Pointer to HDD container.
8283 * @param nImage Image number, counts from 0. 0 is always base image of container.
8284 */
8285VBOXDDU_DECL(uint64_t) VDGetSize(PVBOXHDD pDisk, unsigned nImage)
8286{
8287 uint64_t cbSize;
8288 int rc2;
8289 bool fLockRead = false;
8290
8291 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8292 do
8293 {
8294 /* sanity check */
8295 AssertPtrBreakStmt(pDisk, cbSize = 0);
8296 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8297
8298 rc2 = vdThreadStartRead(pDisk);
8299 AssertRC(rc2);
8300 fLockRead = true;
8301
8302 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8303 AssertPtrBreakStmt(pImage, cbSize = 0);
8304 cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
8305 } while (0);
8306
8307 if (RT_UNLIKELY(fLockRead))
8308 {
8309 rc2 = vdThreadFinishRead(pDisk);
8310 AssertRC(rc2);
8311 }
8312
8313 LogFlowFunc(("returns %llu\n", cbSize));
8314 return cbSize;
8315}
8316
8317/**
8318 * Get total file size of an image in HDD container.
8319 *
8320 * @returns Virtual disk size in bytes.
8321 * @returns 0 if no image is opened in HDD container.
8322 * @param pDisk Pointer to HDD container.
8323 * @param nImage Image number, counts from 0. 0 is always base image of container.
8324 */
8325VBOXDDU_DECL(uint64_t) VDGetFileSize(PVBOXHDD pDisk, unsigned nImage)
8326{
8327 uint64_t cbSize;
8328 int rc2;
8329 bool fLockRead = false;
8330
8331 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8332 do
8333 {
8334 /* sanity check */
8335 AssertPtrBreakStmt(pDisk, cbSize = 0);
8336 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8337
8338 rc2 = vdThreadStartRead(pDisk);
8339 AssertRC(rc2);
8340 fLockRead = true;
8341
8342 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8343 AssertPtrBreakStmt(pImage, cbSize = 0);
8344 cbSize = pImage->Backend->pfnGetFileSize(pImage->pBackendData);
8345 } while (0);
8346
8347 if (RT_UNLIKELY(fLockRead))
8348 {
8349 rc2 = vdThreadFinishRead(pDisk);
8350 AssertRC(rc2);
8351 }
8352
8353 LogFlowFunc(("returns %llu\n", cbSize));
8354 return cbSize;
8355}
8356
8357/**
8358 * Get virtual disk PCHS geometry stored in HDD container.
8359 *
8360 * @returns VBox status code.
8361 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8362 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8363 * @param pDisk Pointer to HDD container.
8364 * @param nImage Image number, counts from 0. 0 is always base image of container.
8365 * @param pPCHSGeometry Where to store PCHS geometry. Not NULL.
8366 */
8367VBOXDDU_DECL(int) VDGetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8368 PVDGEOMETRY pPCHSGeometry)
8369{
8370 int rc = VINF_SUCCESS;
8371 int rc2;
8372 bool fLockRead = false;
8373
8374 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p\n",
8375 pDisk, nImage, pPCHSGeometry));
8376 do
8377 {
8378 /* sanity check */
8379 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8380 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8381
8382 /* Check arguments. */
8383 AssertMsgBreakStmt(VALID_PTR(pPCHSGeometry),
8384 ("pPCHSGeometry=%#p\n", pPCHSGeometry),
8385 rc = VERR_INVALID_PARAMETER);
8386
8387 rc2 = vdThreadStartRead(pDisk);
8388 AssertRC(rc2);
8389 fLockRead = true;
8390
8391 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8392 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8393
8394 if (pImage == pDisk->pLast)
8395 {
8396 /* Use cached information if possible. */
8397 if (pDisk->PCHSGeometry.cCylinders != 0)
8398 *pPCHSGeometry = pDisk->PCHSGeometry;
8399 else
8400 rc = VERR_VD_GEOMETRY_NOT_SET;
8401 }
8402 else
8403 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8404 pPCHSGeometry);
8405 } while (0);
8406
8407 if (RT_UNLIKELY(fLockRead))
8408 {
8409 rc2 = vdThreadFinishRead(pDisk);
8410 AssertRC(rc2);
8411 }
8412
8413 LogFlowFunc(("%Rrc (PCHS=%u/%u/%u)\n", rc,
8414 pDisk->PCHSGeometry.cCylinders, pDisk->PCHSGeometry.cHeads,
8415 pDisk->PCHSGeometry.cSectors));
8416 return rc;
8417}
8418
8419/**
8420 * Store virtual disk PCHS geometry in HDD container.
8421 *
8422 * Note that in case of unrecoverable error all images in HDD container will be closed.
8423 *
8424 * @returns VBox status code.
8425 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8426 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8427 * @param pDisk Pointer to HDD container.
8428 * @param nImage Image number, counts from 0. 0 is always base image of container.
8429 * @param pPCHSGeometry Where to load PCHS geometry from. Not NULL.
8430 */
8431VBOXDDU_DECL(int) VDSetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8432 PCVDGEOMETRY pPCHSGeometry)
8433{
8434 int rc = VINF_SUCCESS;
8435 int rc2;
8436 bool fLockWrite = false;
8437
8438 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p PCHS=%u/%u/%u\n",
8439 pDisk, nImage, pPCHSGeometry, pPCHSGeometry->cCylinders,
8440 pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
8441 do
8442 {
8443 /* sanity check */
8444 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8445 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8446
8447 /* Check arguments. */
8448 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
8449 && pPCHSGeometry->cHeads <= 16
8450 && pPCHSGeometry->cSectors <= 63,
8451 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
8452 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
8453 pPCHSGeometry->cSectors),
8454 rc = VERR_INVALID_PARAMETER);
8455
8456 rc2 = vdThreadStartWrite(pDisk);
8457 AssertRC(rc2);
8458 fLockWrite = true;
8459
8460 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8461 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8462
8463 if (pImage == pDisk->pLast)
8464 {
8465 if ( pPCHSGeometry->cCylinders != pDisk->PCHSGeometry.cCylinders
8466 || pPCHSGeometry->cHeads != pDisk->PCHSGeometry.cHeads
8467 || pPCHSGeometry->cSectors != pDisk->PCHSGeometry.cSectors)
8468 {
8469 /* Only update geometry if it is changed. Avoids similar checks
8470 * in every backend. Most of the time the new geometry is set
8471 * to the previous values, so no need to go through the hassle
8472 * of updating an image which could be opened in read-only mode
8473 * right now. */
8474 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
8475 pPCHSGeometry);
8476
8477 /* Cache new geometry values in any case. */
8478 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8479 &pDisk->PCHSGeometry);
8480 if (RT_FAILURE(rc2))
8481 {
8482 pDisk->PCHSGeometry.cCylinders = 0;
8483 pDisk->PCHSGeometry.cHeads = 0;
8484 pDisk->PCHSGeometry.cSectors = 0;
8485 }
8486 else
8487 {
8488 /* Make sure the CHS geometry is properly clipped. */
8489 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 255);
8490 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
8491 }
8492 }
8493 }
8494 else
8495 {
8496 VDGEOMETRY PCHS;
8497 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8498 &PCHS);
8499 if ( RT_FAILURE(rc)
8500 || pPCHSGeometry->cCylinders != PCHS.cCylinders
8501 || pPCHSGeometry->cHeads != PCHS.cHeads
8502 || pPCHSGeometry->cSectors != PCHS.cSectors)
8503 {
8504 /* Only update geometry if it is changed. Avoids similar checks
8505 * in every backend. Most of the time the new geometry is set
8506 * to the previous values, so no need to go through the hassle
8507 * of updating an image which could be opened in read-only mode
8508 * right now. */
8509 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
8510 pPCHSGeometry);
8511 }
8512 }
8513 } while (0);
8514
8515 if (RT_UNLIKELY(fLockWrite))
8516 {
8517 rc2 = vdThreadFinishWrite(pDisk);
8518 AssertRC(rc2);
8519 }
8520
8521 LogFlowFunc(("returns %Rrc\n", rc));
8522 return rc;
8523}
8524
8525/**
8526 * Get virtual disk LCHS geometry stored in HDD container.
8527 *
8528 * @returns VBox status code.
8529 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8530 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8531 * @param pDisk Pointer to HDD container.
8532 * @param nImage Image number, counts from 0. 0 is always base image of container.
8533 * @param pLCHSGeometry Where to store LCHS geometry. Not NULL.
8534 */
8535VBOXDDU_DECL(int) VDGetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8536 PVDGEOMETRY pLCHSGeometry)
8537{
8538 int rc = VINF_SUCCESS;
8539 int rc2;
8540 bool fLockRead = false;
8541
8542 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p\n",
8543 pDisk, nImage, pLCHSGeometry));
8544 do
8545 {
8546 /* sanity check */
8547 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8548 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8549
8550 /* Check arguments. */
8551 AssertMsgBreakStmt(VALID_PTR(pLCHSGeometry),
8552 ("pLCHSGeometry=%#p\n", pLCHSGeometry),
8553 rc = VERR_INVALID_PARAMETER);
8554
8555 rc2 = vdThreadStartRead(pDisk);
8556 AssertRC(rc2);
8557 fLockRead = true;
8558
8559 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8560 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8561
8562 if (pImage == pDisk->pLast)
8563 {
8564 /* Use cached information if possible. */
8565 if (pDisk->LCHSGeometry.cCylinders != 0)
8566 *pLCHSGeometry = pDisk->LCHSGeometry;
8567 else
8568 rc = VERR_VD_GEOMETRY_NOT_SET;
8569 }
8570 else
8571 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8572 pLCHSGeometry);
8573 } while (0);
8574
8575 if (RT_UNLIKELY(fLockRead))
8576 {
8577 rc2 = vdThreadFinishRead(pDisk);
8578 AssertRC(rc2);
8579 }
8580
8581 LogFlowFunc((": %Rrc (LCHS=%u/%u/%u)\n", rc,
8582 pDisk->LCHSGeometry.cCylinders, pDisk->LCHSGeometry.cHeads,
8583 pDisk->LCHSGeometry.cSectors));
8584 return rc;
8585}
8586
8587/**
8588 * Store virtual disk LCHS geometry in HDD container.
8589 *
8590 * Note that in case of unrecoverable error all images in HDD container will be closed.
8591 *
8592 * @returns VBox status code.
8593 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8594 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8595 * @param pDisk Pointer to HDD container.
8596 * @param nImage Image number, counts from 0. 0 is always base image of container.
8597 * @param pLCHSGeometry Where to load LCHS geometry from. Not NULL.
8598 */
8599VBOXDDU_DECL(int) VDSetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8600 PCVDGEOMETRY pLCHSGeometry)
8601{
8602 int rc = VINF_SUCCESS;
8603 int rc2;
8604 bool fLockWrite = false;
8605
8606 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p LCHS=%u/%u/%u\n",
8607 pDisk, nImage, pLCHSGeometry, pLCHSGeometry->cCylinders,
8608 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
8609 do
8610 {
8611 /* sanity check */
8612 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8613 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8614
8615 /* Check arguments. */
8616 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
8617 && pLCHSGeometry->cHeads <= 255
8618 && pLCHSGeometry->cSectors <= 63,
8619 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
8620 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
8621 pLCHSGeometry->cSectors),
8622 rc = VERR_INVALID_PARAMETER);
8623
8624 rc2 = vdThreadStartWrite(pDisk);
8625 AssertRC(rc2);
8626 fLockWrite = true;
8627
8628 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8629 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8630
8631 if (pImage == pDisk->pLast)
8632 {
8633 if ( pLCHSGeometry->cCylinders != pDisk->LCHSGeometry.cCylinders
8634 || pLCHSGeometry->cHeads != pDisk->LCHSGeometry.cHeads
8635 || pLCHSGeometry->cSectors != pDisk->LCHSGeometry.cSectors)
8636 {
8637 /* Only update geometry if it is changed. Avoids similar checks
8638 * in every backend. Most of the time the new geometry is set
8639 * to the previous values, so no need to go through the hassle
8640 * of updating an image which could be opened in read-only mode
8641 * right now. */
8642 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
8643 pLCHSGeometry);
8644
8645 /* Cache new geometry values in any case. */
8646 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8647 &pDisk->LCHSGeometry);
8648 if (RT_FAILURE(rc2))
8649 {
8650 pDisk->LCHSGeometry.cCylinders = 0;
8651 pDisk->LCHSGeometry.cHeads = 0;
8652 pDisk->LCHSGeometry.cSectors = 0;
8653 }
8654 else
8655 {
8656 /* Make sure the CHS geometry is properly clipped. */
8657 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
8658 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
8659 }
8660 }
8661 }
8662 else
8663 {
8664 VDGEOMETRY LCHS;
8665 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8666 &LCHS);
8667 if ( RT_FAILURE(rc)
8668 || pLCHSGeometry->cCylinders != LCHS.cCylinders
8669 || pLCHSGeometry->cHeads != LCHS.cHeads
8670 || pLCHSGeometry->cSectors != LCHS.cSectors)
8671 {
8672 /* Only update geometry if it is changed. Avoids similar checks
8673 * in every backend. Most of the time the new geometry is set
8674 * to the previous values, so no need to go through the hassle
8675 * of updating an image which could be opened in read-only mode
8676 * right now. */
8677 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
8678 pLCHSGeometry);
8679 }
8680 }
8681 } while (0);
8682
8683 if (RT_UNLIKELY(fLockWrite))
8684 {
8685 rc2 = vdThreadFinishWrite(pDisk);
8686 AssertRC(rc2);
8687 }
8688
8689 LogFlowFunc(("returns %Rrc\n", rc));
8690 return rc;
8691}
8692
8693/**
8694 * Get version of image in HDD container.
8695 *
8696 * @returns VBox status code.
8697 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8698 * @param pDisk Pointer to HDD container.
8699 * @param nImage Image number, counts from 0. 0 is always base image of container.
8700 * @param puVersion Where to store the image version.
8701 */
8702VBOXDDU_DECL(int) VDGetVersion(PVBOXHDD pDisk, unsigned nImage,
8703 unsigned *puVersion)
8704{
8705 int rc = VINF_SUCCESS;
8706 int rc2;
8707 bool fLockRead = false;
8708
8709 LogFlowFunc(("pDisk=%#p nImage=%u puVersion=%#p\n",
8710 pDisk, nImage, puVersion));
8711 do
8712 {
8713 /* sanity check */
8714 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8715 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8716
8717 /* Check arguments. */
8718 AssertMsgBreakStmt(VALID_PTR(puVersion),
8719 ("puVersion=%#p\n", puVersion),
8720 rc = VERR_INVALID_PARAMETER);
8721
8722 rc2 = vdThreadStartRead(pDisk);
8723 AssertRC(rc2);
8724 fLockRead = true;
8725
8726 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8727 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8728
8729 *puVersion = pImage->Backend->pfnGetVersion(pImage->pBackendData);
8730 } while (0);
8731
8732 if (RT_UNLIKELY(fLockRead))
8733 {
8734 rc2 = vdThreadFinishRead(pDisk);
8735 AssertRC(rc2);
8736 }
8737
8738 LogFlowFunc(("returns %Rrc uVersion=%#x\n", rc, *puVersion));
8739 return rc;
8740}
8741
8742/**
8743 * List the capabilities of image backend in HDD container.
8744 *
8745 * @returns VBox status code.
8746 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8747 * @param pDisk Pointer to the HDD container.
8748 * @param nImage Image number, counts from 0. 0 is always base image of container.
8749 * @param pbackendInfo Where to store the backend information.
8750 */
8751VBOXDDU_DECL(int) VDBackendInfoSingle(PVBOXHDD pDisk, unsigned nImage,
8752 PVDBACKENDINFO pBackendInfo)
8753{
8754 int rc = VINF_SUCCESS;
8755 int rc2;
8756 bool fLockRead = false;
8757
8758 LogFlowFunc(("pDisk=%#p nImage=%u pBackendInfo=%#p\n",
8759 pDisk, nImage, pBackendInfo));
8760 do
8761 {
8762 /* sanity check */
8763 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8764 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8765
8766 /* Check arguments. */
8767 AssertMsgBreakStmt(VALID_PTR(pBackendInfo),
8768 ("pBackendInfo=%#p\n", pBackendInfo),
8769 rc = VERR_INVALID_PARAMETER);
8770
8771 rc2 = vdThreadStartRead(pDisk);
8772 AssertRC(rc2);
8773 fLockRead = true;
8774
8775 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8776 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8777
8778 pBackendInfo->pszBackend = pImage->Backend->pszBackendName;
8779 pBackendInfo->uBackendCaps = pImage->Backend->uBackendCaps;
8780 pBackendInfo->paFileExtensions = pImage->Backend->paFileExtensions;
8781 pBackendInfo->paConfigInfo = pImage->Backend->paConfigInfo;
8782 } while (0);
8783
8784 if (RT_UNLIKELY(fLockRead))
8785 {
8786 rc2 = vdThreadFinishRead(pDisk);
8787 AssertRC(rc2);
8788 }
8789
8790 LogFlowFunc(("returns %Rrc\n", rc));
8791 return rc;
8792}
8793
8794/**
8795 * Get flags of image in HDD container.
8796 *
8797 * @returns VBox status code.
8798 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8799 * @param pDisk Pointer to HDD container.
8800 * @param nImage Image number, counts from 0. 0 is always base image of container.
8801 * @param puImageFlags Where to store the image flags.
8802 */
8803VBOXDDU_DECL(int) VDGetImageFlags(PVBOXHDD pDisk, unsigned nImage,
8804 unsigned *puImageFlags)
8805{
8806 int rc = VINF_SUCCESS;
8807 int rc2;
8808 bool fLockRead = false;
8809
8810 LogFlowFunc(("pDisk=%#p nImage=%u puImageFlags=%#p\n",
8811 pDisk, nImage, puImageFlags));
8812 do
8813 {
8814 /* sanity check */
8815 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8816 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8817
8818 /* Check arguments. */
8819 AssertMsgBreakStmt(VALID_PTR(puImageFlags),
8820 ("puImageFlags=%#p\n", puImageFlags),
8821 rc = VERR_INVALID_PARAMETER);
8822
8823 rc2 = vdThreadStartRead(pDisk);
8824 AssertRC(rc2);
8825 fLockRead = true;
8826
8827 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8828 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8829
8830 *puImageFlags = pImage->uImageFlags;
8831 } while (0);
8832
8833 if (RT_UNLIKELY(fLockRead))
8834 {
8835 rc2 = vdThreadFinishRead(pDisk);
8836 AssertRC(rc2);
8837 }
8838
8839 LogFlowFunc(("returns %Rrc uImageFlags=%#x\n", rc, *puImageFlags));
8840 return rc;
8841}
8842
8843/**
8844 * Get open flags of image in HDD container.
8845 *
8846 * @returns VBox status code.
8847 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8848 * @param pDisk Pointer to HDD container.
8849 * @param nImage Image number, counts from 0. 0 is always base image of container.
8850 * @param puOpenFlags Where to store the image open flags.
8851 */
8852VBOXDDU_DECL(int) VDGetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
8853 unsigned *puOpenFlags)
8854{
8855 int rc = VINF_SUCCESS;
8856 int rc2;
8857 bool fLockRead = false;
8858
8859 LogFlowFunc(("pDisk=%#p nImage=%u puOpenFlags=%#p\n",
8860 pDisk, nImage, puOpenFlags));
8861 do
8862 {
8863 /* sanity check */
8864 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8865 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8866
8867 /* Check arguments. */
8868 AssertMsgBreakStmt(VALID_PTR(puOpenFlags),
8869 ("puOpenFlags=%#p\n", puOpenFlags),
8870 rc = VERR_INVALID_PARAMETER);
8871
8872 rc2 = vdThreadStartRead(pDisk);
8873 AssertRC(rc2);
8874 fLockRead = true;
8875
8876 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8877 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8878
8879 *puOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8880 } while (0);
8881
8882 if (RT_UNLIKELY(fLockRead))
8883 {
8884 rc2 = vdThreadFinishRead(pDisk);
8885 AssertRC(rc2);
8886 }
8887
8888 LogFlowFunc(("returns %Rrc uOpenFlags=%#x\n", rc, *puOpenFlags));
8889 return rc;
8890}
8891
8892/**
8893 * Set open flags of image in HDD container.
8894 * This operation may cause file locking changes and/or files being reopened.
8895 * Note that in case of unrecoverable error all images in HDD container will be closed.
8896 *
8897 * @returns VBox status code.
8898 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8899 * @param pDisk Pointer to HDD container.
8900 * @param nImage Image number, counts from 0. 0 is always base image of container.
8901 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
8902 */
8903VBOXDDU_DECL(int) VDSetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
8904 unsigned uOpenFlags)
8905{
8906 int rc;
8907 int rc2;
8908 bool fLockWrite = false;
8909
8910 LogFlowFunc(("pDisk=%#p uOpenFlags=%#u\n", pDisk, uOpenFlags));
8911 do
8912 {
8913 /* sanity check */
8914 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8915 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8916
8917 /* Check arguments. */
8918 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
8919 ("uOpenFlags=%#x\n", uOpenFlags),
8920 rc = VERR_INVALID_PARAMETER);
8921
8922 rc2 = vdThreadStartWrite(pDisk);
8923 AssertRC(rc2);
8924 fLockWrite = true;
8925
8926 /* Destroy any discard state because the image might be changed to readonly mode. */
8927 rc = vdDiscardStateDestroy(pDisk);
8928 if (RT_FAILURE(rc))
8929 break;
8930
8931 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8932 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8933
8934 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData,
8935 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS));
8936 if (RT_SUCCESS(rc))
8937 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
8938 } while (0);
8939
8940 if (RT_UNLIKELY(fLockWrite))
8941 {
8942 rc2 = vdThreadFinishWrite(pDisk);
8943 AssertRC(rc2);
8944 }
8945
8946 LogFlowFunc(("returns %Rrc\n", rc));
8947 return rc;
8948}
8949
8950/**
8951 * Get base filename of image in HDD container. Some image formats use
8952 * other filenames as well, so don't use this for anything but informational
8953 * purposes.
8954 *
8955 * @returns VBox status code.
8956 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8957 * @returns VERR_BUFFER_OVERFLOW if pszFilename buffer too small to hold filename.
8958 * @param pDisk Pointer to HDD container.
8959 * @param nImage Image number, counts from 0. 0 is always base image of container.
8960 * @param pszFilename Where to store the image file name.
8961 * @param cbFilename Size of buffer pszFilename points to.
8962 */
8963VBOXDDU_DECL(int) VDGetFilename(PVBOXHDD pDisk, unsigned nImage,
8964 char *pszFilename, unsigned cbFilename)
8965{
8966 int rc;
8967 int rc2;
8968 bool fLockRead = false;
8969
8970 LogFlowFunc(("pDisk=%#p nImage=%u pszFilename=%#p cbFilename=%u\n",
8971 pDisk, nImage, pszFilename, cbFilename));
8972 do
8973 {
8974 /* sanity check */
8975 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8976 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8977
8978 /* Check arguments. */
8979 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
8980 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
8981 rc = VERR_INVALID_PARAMETER);
8982 AssertMsgBreakStmt(cbFilename,
8983 ("cbFilename=%u\n", cbFilename),
8984 rc = VERR_INVALID_PARAMETER);
8985
8986 rc2 = vdThreadStartRead(pDisk);
8987 AssertRC(rc2);
8988 fLockRead = true;
8989
8990 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8991 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8992
8993 size_t cb = strlen(pImage->pszFilename);
8994 if (cb <= cbFilename)
8995 {
8996 strcpy(pszFilename, pImage->pszFilename);
8997 rc = VINF_SUCCESS;
8998 }
8999 else
9000 {
9001 strncpy(pszFilename, pImage->pszFilename, cbFilename - 1);
9002 pszFilename[cbFilename - 1] = '\0';
9003 rc = VERR_BUFFER_OVERFLOW;
9004 }
9005 } while (0);
9006
9007 if (RT_UNLIKELY(fLockRead))
9008 {
9009 rc2 = vdThreadFinishRead(pDisk);
9010 AssertRC(rc2);
9011 }
9012
9013 LogFlowFunc(("returns %Rrc, pszFilename=\"%s\"\n", rc, pszFilename));
9014 return rc;
9015}
9016
9017/**
9018 * Get the comment line of image in HDD container.
9019 *
9020 * @returns VBox status code.
9021 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9022 * @returns VERR_BUFFER_OVERFLOW if pszComment buffer too small to hold comment text.
9023 * @param pDisk Pointer to HDD container.
9024 * @param nImage Image number, counts from 0. 0 is always base image of container.
9025 * @param pszComment Where to store the comment string of image. NULL is ok.
9026 * @param cbComment The size of pszComment buffer. 0 is ok.
9027 */
9028VBOXDDU_DECL(int) VDGetComment(PVBOXHDD pDisk, unsigned nImage,
9029 char *pszComment, unsigned cbComment)
9030{
9031 int rc;
9032 int rc2;
9033 bool fLockRead = false;
9034
9035 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p cbComment=%u\n",
9036 pDisk, nImage, pszComment, cbComment));
9037 do
9038 {
9039 /* sanity check */
9040 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9041 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9042
9043 /* Check arguments. */
9044 AssertMsgBreakStmt(VALID_PTR(pszComment),
9045 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9046 rc = VERR_INVALID_PARAMETER);
9047 AssertMsgBreakStmt(cbComment,
9048 ("cbComment=%u\n", cbComment),
9049 rc = VERR_INVALID_PARAMETER);
9050
9051 rc2 = vdThreadStartRead(pDisk);
9052 AssertRC(rc2);
9053 fLockRead = true;
9054
9055 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9056 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9057
9058 rc = pImage->Backend->pfnGetComment(pImage->pBackendData, pszComment,
9059 cbComment);
9060 } while (0);
9061
9062 if (RT_UNLIKELY(fLockRead))
9063 {
9064 rc2 = vdThreadFinishRead(pDisk);
9065 AssertRC(rc2);
9066 }
9067
9068 LogFlowFunc(("returns %Rrc, pszComment=\"%s\"\n", rc, pszComment));
9069 return rc;
9070}
9071
9072/**
9073 * Changes the comment line of image in HDD container.
9074 *
9075 * @returns VBox status code.
9076 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9077 * @param pDisk Pointer to HDD container.
9078 * @param nImage Image number, counts from 0. 0 is always base image of container.
9079 * @param pszComment New comment string (UTF-8). NULL is allowed to reset the comment.
9080 */
9081VBOXDDU_DECL(int) VDSetComment(PVBOXHDD pDisk, unsigned nImage,
9082 const char *pszComment)
9083{
9084 int rc;
9085 int rc2;
9086 bool fLockWrite = false;
9087
9088 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p \"%s\"\n",
9089 pDisk, nImage, pszComment, pszComment));
9090 do
9091 {
9092 /* sanity check */
9093 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9094 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9095
9096 /* Check arguments. */
9097 AssertMsgBreakStmt(VALID_PTR(pszComment) || pszComment == NULL,
9098 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9099 rc = VERR_INVALID_PARAMETER);
9100
9101 rc2 = vdThreadStartWrite(pDisk);
9102 AssertRC(rc2);
9103 fLockWrite = true;
9104
9105 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9106 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9107
9108 rc = pImage->Backend->pfnSetComment(pImage->pBackendData, pszComment);
9109 } while (0);
9110
9111 if (RT_UNLIKELY(fLockWrite))
9112 {
9113 rc2 = vdThreadFinishWrite(pDisk);
9114 AssertRC(rc2);
9115 }
9116
9117 LogFlowFunc(("returns %Rrc\n", rc));
9118 return rc;
9119}
9120
9121
9122/**
9123 * Get UUID of image in HDD container.
9124 *
9125 * @returns VBox status code.
9126 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9127 * @param pDisk Pointer to HDD container.
9128 * @param nImage Image number, counts from 0. 0 is always base image of container.
9129 * @param pUuid Where to store the image creation UUID.
9130 */
9131VBOXDDU_DECL(int) VDGetUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9132{
9133 int rc;
9134 int rc2;
9135 bool fLockRead = false;
9136
9137 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9138 do
9139 {
9140 /* sanity check */
9141 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9142 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9143
9144 /* Check arguments. */
9145 AssertMsgBreakStmt(VALID_PTR(pUuid),
9146 ("pUuid=%#p\n", pUuid),
9147 rc = VERR_INVALID_PARAMETER);
9148
9149 rc2 = vdThreadStartRead(pDisk);
9150 AssertRC(rc2);
9151 fLockRead = true;
9152
9153 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9154 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9155
9156 rc = pImage->Backend->pfnGetUuid(pImage->pBackendData, pUuid);
9157 } while (0);
9158
9159 if (RT_UNLIKELY(fLockRead))
9160 {
9161 rc2 = vdThreadFinishRead(pDisk);
9162 AssertRC(rc2);
9163 }
9164
9165 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9166 return rc;
9167}
9168
9169/**
9170 * Set the image's UUID. Should not be used by normal applications.
9171 *
9172 * @returns VBox status code.
9173 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9174 * @param pDisk Pointer to HDD container.
9175 * @param nImage Image number, counts from 0. 0 is always base image of container.
9176 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
9177 */
9178VBOXDDU_DECL(int) VDSetUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9179{
9180 int rc;
9181 int rc2;
9182 bool fLockWrite = false;
9183
9184 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9185 pDisk, nImage, pUuid, pUuid));
9186 do
9187 {
9188 /* sanity check */
9189 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9190 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9191
9192 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9193 ("pUuid=%#p\n", pUuid),
9194 rc = VERR_INVALID_PARAMETER);
9195
9196 rc2 = vdThreadStartWrite(pDisk);
9197 AssertRC(rc2);
9198 fLockWrite = true;
9199
9200 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9201 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9202
9203 RTUUID Uuid;
9204 if (!pUuid)
9205 {
9206 RTUuidCreate(&Uuid);
9207 pUuid = &Uuid;
9208 }
9209 rc = pImage->Backend->pfnSetUuid(pImage->pBackendData, pUuid);
9210 } while (0);
9211
9212 if (RT_UNLIKELY(fLockWrite))
9213 {
9214 rc2 = vdThreadFinishWrite(pDisk);
9215 AssertRC(rc2);
9216 }
9217
9218 LogFlowFunc(("returns %Rrc\n", rc));
9219 return rc;
9220}
9221
9222/**
9223 * Get last modification UUID of image in HDD container.
9224 *
9225 * @returns VBox status code.
9226 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9227 * @param pDisk Pointer to HDD container.
9228 * @param nImage Image number, counts from 0. 0 is always base image of container.
9229 * @param pUuid Where to store the image modification UUID.
9230 */
9231VBOXDDU_DECL(int) VDGetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9232{
9233 int rc = VINF_SUCCESS;
9234 int rc2;
9235 bool fLockRead = false;
9236
9237 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9238 do
9239 {
9240 /* sanity check */
9241 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9242 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9243
9244 /* Check arguments. */
9245 AssertMsgBreakStmt(VALID_PTR(pUuid),
9246 ("pUuid=%#p\n", pUuid),
9247 rc = VERR_INVALID_PARAMETER);
9248
9249 rc2 = vdThreadStartRead(pDisk);
9250 AssertRC(rc2);
9251 fLockRead = true;
9252
9253 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9254 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9255
9256 rc = pImage->Backend->pfnGetModificationUuid(pImage->pBackendData,
9257 pUuid);
9258 } while (0);
9259
9260 if (RT_UNLIKELY(fLockRead))
9261 {
9262 rc2 = vdThreadFinishRead(pDisk);
9263 AssertRC(rc2);
9264 }
9265
9266 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9267 return rc;
9268}
9269
9270/**
9271 * Set the image's last modification UUID. Should not be used by normal applications.
9272 *
9273 * @returns VBox status code.
9274 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9275 * @param pDisk Pointer to HDD container.
9276 * @param nImage Image number, counts from 0. 0 is always base image of container.
9277 * @param pUuid New modification UUID of the image. If NULL, a new UUID is created.
9278 */
9279VBOXDDU_DECL(int) VDSetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9280{
9281 int rc;
9282 int rc2;
9283 bool fLockWrite = false;
9284
9285 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9286 pDisk, nImage, pUuid, pUuid));
9287 do
9288 {
9289 /* sanity check */
9290 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9291 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9292
9293 /* Check arguments. */
9294 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9295 ("pUuid=%#p\n", pUuid),
9296 rc = VERR_INVALID_PARAMETER);
9297
9298 rc2 = vdThreadStartWrite(pDisk);
9299 AssertRC(rc2);
9300 fLockWrite = true;
9301
9302 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9303 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9304
9305 RTUUID Uuid;
9306 if (!pUuid)
9307 {
9308 RTUuidCreate(&Uuid);
9309 pUuid = &Uuid;
9310 }
9311 rc = pImage->Backend->pfnSetModificationUuid(pImage->pBackendData,
9312 pUuid);
9313 } while (0);
9314
9315 if (RT_UNLIKELY(fLockWrite))
9316 {
9317 rc2 = vdThreadFinishWrite(pDisk);
9318 AssertRC(rc2);
9319 }
9320
9321 LogFlowFunc(("returns %Rrc\n", rc));
9322 return rc;
9323}
9324
9325/**
9326 * Get parent UUID of image in HDD container.
9327 *
9328 * @returns VBox status code.
9329 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9330 * @param pDisk Pointer to HDD container.
9331 * @param nImage Image number, counts from 0. 0 is always base image of container.
9332 * @param pUuid Where to store the parent image UUID.
9333 */
9334VBOXDDU_DECL(int) VDGetParentUuid(PVBOXHDD pDisk, unsigned nImage,
9335 PRTUUID pUuid)
9336{
9337 int rc = VINF_SUCCESS;
9338 int rc2;
9339 bool fLockRead = false;
9340
9341 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9342 do
9343 {
9344 /* sanity check */
9345 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9346 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9347
9348 /* Check arguments. */
9349 AssertMsgBreakStmt(VALID_PTR(pUuid),
9350 ("pUuid=%#p\n", pUuid),
9351 rc = VERR_INVALID_PARAMETER);
9352
9353 rc2 = vdThreadStartRead(pDisk);
9354 AssertRC(rc2);
9355 fLockRead = true;
9356
9357 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9358 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9359
9360 rc = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, pUuid);
9361 } while (0);
9362
9363 if (RT_UNLIKELY(fLockRead))
9364 {
9365 rc2 = vdThreadFinishRead(pDisk);
9366 AssertRC(rc2);
9367 }
9368
9369 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9370 return rc;
9371}
9372
9373/**
9374 * Set the image's parent UUID. Should not be used by normal applications.
9375 *
9376 * @returns VBox status code.
9377 * @param pDisk Pointer to HDD container.
9378 * @param nImage Image number, counts from 0. 0 is always base image of container.
9379 * @param pUuid New parent UUID of the image. If NULL, a new UUID is created.
9380 */
9381VBOXDDU_DECL(int) VDSetParentUuid(PVBOXHDD pDisk, unsigned nImage,
9382 PCRTUUID pUuid)
9383{
9384 int rc;
9385 int rc2;
9386 bool fLockWrite = false;
9387
9388 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9389 pDisk, nImage, pUuid, pUuid));
9390 do
9391 {
9392 /* sanity check */
9393 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9394 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9395
9396 /* Check arguments. */
9397 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9398 ("pUuid=%#p\n", pUuid),
9399 rc = VERR_INVALID_PARAMETER);
9400
9401 rc2 = vdThreadStartWrite(pDisk);
9402 AssertRC(rc2);
9403 fLockWrite = true;
9404
9405 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9406 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9407
9408 RTUUID Uuid;
9409 if (!pUuid)
9410 {
9411 RTUuidCreate(&Uuid);
9412 pUuid = &Uuid;
9413 }
9414 rc = pImage->Backend->pfnSetParentUuid(pImage->pBackendData, pUuid);
9415 } while (0);
9416
9417 if (RT_UNLIKELY(fLockWrite))
9418 {
9419 rc2 = vdThreadFinishWrite(pDisk);
9420 AssertRC(rc2);
9421 }
9422
9423 LogFlowFunc(("returns %Rrc\n", rc));
9424 return rc;
9425}
9426
9427
9428/**
9429 * Debug helper - dumps all opened images in HDD container into the log file.
9430 *
9431 * @param pDisk Pointer to HDD container.
9432 */
9433VBOXDDU_DECL(void) VDDumpImages(PVBOXHDD pDisk)
9434{
9435 int rc2;
9436 bool fLockRead = false;
9437
9438 do
9439 {
9440 /* sanity check */
9441 AssertPtrBreak(pDisk);
9442 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9443
9444 if (!pDisk->pInterfaceError || !VALID_PTR(pDisk->pInterfaceError->pfnMessage))
9445 pDisk->pInterfaceError->pfnMessage = vdLogMessage;
9446
9447 rc2 = vdThreadStartRead(pDisk);
9448 AssertRC(rc2);
9449 fLockRead = true;
9450
9451 vdMessageWrapper(pDisk, "--- Dumping VD Disk, Images=%u\n", pDisk->cImages);
9452 for (PVDIMAGE pImage = pDisk->pBase; pImage; pImage = pImage->pNext)
9453 {
9454 vdMessageWrapper(pDisk, "Dumping VD image \"%s\" (Backend=%s)\n",
9455 pImage->pszFilename, pImage->Backend->pszBackendName);
9456 pImage->Backend->pfnDump(pImage->pBackendData);
9457 }
9458 } while (0);
9459
9460 if (RT_UNLIKELY(fLockRead))
9461 {
9462 rc2 = vdThreadFinishRead(pDisk);
9463 AssertRC(rc2);
9464 }
9465}
9466
9467
9468VBOXDDU_DECL(int) VDDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges)
9469{
9470 int rc;
9471 int rc2;
9472 bool fLockWrite = false;
9473
9474 LogFlowFunc(("pDisk=%#p paRanges=%#p cRanges=%u\n",
9475 pDisk, paRanges, cRanges));
9476 do
9477 {
9478 /* sanity check */
9479 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9480 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9481
9482 /* Check arguments. */
9483 AssertMsgBreakStmt(cRanges,
9484 ("cRanges=%u\n", cRanges),
9485 rc = VERR_INVALID_PARAMETER);
9486 AssertMsgBreakStmt(VALID_PTR(paRanges),
9487 ("paRanges=%#p\n", paRanges),
9488 rc = VERR_INVALID_PARAMETER);
9489
9490 rc2 = vdThreadStartWrite(pDisk);
9491 AssertRC(rc2);
9492 fLockWrite = true;
9493
9494 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9495
9496 AssertMsgBreakStmt(pDisk->pLast->uOpenFlags & VD_OPEN_FLAGS_DISCARD,
9497 ("Discarding not supported\n"),
9498 rc = VERR_NOT_SUPPORTED);
9499
9500 PVDIOCTX pIoCtx = vdIoCtxDiscardAlloc(pDisk, paRanges, cRanges,
9501 vdIoCtxSyncComplete, pDisk, NULL, NULL,
9502 vdDiscardHelperAsync,
9503 VDIOCTX_FLAGS_SYNC);
9504 if (!pIoCtx)
9505 {
9506 rc = VERR_NO_MEMORY;
9507 break;
9508 }
9509
9510 rc = vdIoCtxProcessSync(pIoCtx);
9511 } while (0);
9512
9513 if (RT_UNLIKELY(fLockWrite))
9514 {
9515 rc2 = vdThreadFinishWrite(pDisk);
9516 AssertRC(rc2);
9517 }
9518
9519 LogFlowFunc(("returns %Rrc\n", rc));
9520 return rc;
9521}
9522
9523
9524VBOXDDU_DECL(int) VDAsyncRead(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRead,
9525 PCRTSGBUF pcSgBuf,
9526 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9527 void *pvUser1, void *pvUser2)
9528{
9529 int rc = VERR_VD_BLOCK_FREE;
9530 int rc2;
9531 bool fLockRead = false;
9532 PVDIOCTX pIoCtx = NULL;
9533
9534 LogFlowFunc(("pDisk=%#p uOffset=%llu pcSgBuf=%#p cbRead=%zu pvUser1=%#p pvUser2=%#p\n",
9535 pDisk, uOffset, pcSgBuf, cbRead, pvUser1, pvUser2));
9536
9537 do
9538 {
9539 /* sanity check */
9540 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9541 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9542
9543 /* Check arguments. */
9544 AssertMsgBreakStmt(cbRead,
9545 ("cbRead=%zu\n", cbRead),
9546 rc = VERR_INVALID_PARAMETER);
9547 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
9548 ("pcSgBuf=%#p\n", pcSgBuf),
9549 rc = VERR_INVALID_PARAMETER);
9550
9551 rc2 = vdThreadStartRead(pDisk);
9552 AssertRC(rc2);
9553 fLockRead = true;
9554
9555 AssertMsgBreakStmt(uOffset + cbRead <= pDisk->cbSize,
9556 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
9557 uOffset, cbRead, pDisk->cbSize),
9558 rc = VERR_INVALID_PARAMETER);
9559 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9560
9561 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_READ, uOffset,
9562 cbRead, pDisk->pLast, pcSgBuf,
9563 pfnComplete, pvUser1, pvUser2,
9564 NULL, vdReadHelperAsync,
9565 VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
9566 if (!pIoCtx)
9567 {
9568 rc = VERR_NO_MEMORY;
9569 break;
9570 }
9571
9572 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
9573 if (rc == VINF_VD_ASYNC_IO_FINISHED)
9574 {
9575 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
9576 vdIoCtxFree(pDisk, pIoCtx);
9577 else
9578 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
9579 }
9580 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
9581 vdIoCtxFree(pDisk, pIoCtx);
9582
9583 } while (0);
9584
9585 if (RT_UNLIKELY(fLockRead) && ( rc == VINF_VD_ASYNC_IO_FINISHED
9586 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
9587 {
9588 rc2 = vdThreadFinishRead(pDisk);
9589 AssertRC(rc2);
9590 }
9591
9592 LogFlowFunc(("returns %Rrc\n", rc));
9593 return rc;
9594}
9595
9596
9597VBOXDDU_DECL(int) VDAsyncWrite(PVBOXHDD pDisk, uint64_t uOffset, size_t cbWrite,
9598 PCRTSGBUF pcSgBuf,
9599 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9600 void *pvUser1, void *pvUser2)
9601{
9602 int rc;
9603 int rc2;
9604 bool fLockWrite = false;
9605 PVDIOCTX pIoCtx = NULL;
9606
9607 LogFlowFunc(("pDisk=%#p uOffset=%llu cSgBuf=%#p cbWrite=%zu pvUser1=%#p pvUser2=%#p\n",
9608 pDisk, uOffset, pcSgBuf, cbWrite, pvUser1, pvUser2));
9609 do
9610 {
9611 /* sanity check */
9612 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9613 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9614
9615 /* Check arguments. */
9616 AssertMsgBreakStmt(cbWrite,
9617 ("cbWrite=%zu\n", cbWrite),
9618 rc = VERR_INVALID_PARAMETER);
9619 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
9620 ("pcSgBuf=%#p\n", pcSgBuf),
9621 rc = VERR_INVALID_PARAMETER);
9622
9623 rc2 = vdThreadStartWrite(pDisk);
9624 AssertRC(rc2);
9625 fLockWrite = true;
9626
9627 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
9628 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
9629 uOffset, cbWrite, pDisk->cbSize),
9630 rc = VERR_INVALID_PARAMETER);
9631 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9632
9633 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_WRITE, uOffset,
9634 cbWrite, pDisk->pLast, pcSgBuf,
9635 pfnComplete, pvUser1, pvUser2,
9636 NULL, vdWriteHelperAsync,
9637 VDIOCTX_FLAGS_DEFAULT);
9638 if (!pIoCtx)
9639 {
9640 rc = VERR_NO_MEMORY;
9641 break;
9642 }
9643
9644 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
9645 if (rc == VINF_VD_ASYNC_IO_FINISHED)
9646 {
9647 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
9648 vdIoCtxFree(pDisk, pIoCtx);
9649 else
9650 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
9651 }
9652 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
9653 vdIoCtxFree(pDisk, pIoCtx);
9654 } while (0);
9655
9656 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
9657 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
9658 {
9659 rc2 = vdThreadFinishWrite(pDisk);
9660 AssertRC(rc2);
9661 }
9662
9663 LogFlowFunc(("returns %Rrc\n", rc));
9664 return rc;
9665}
9666
9667
9668VBOXDDU_DECL(int) VDAsyncFlush(PVBOXHDD pDisk, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9669 void *pvUser1, void *pvUser2)
9670{
9671 int rc;
9672 int rc2;
9673 bool fLockWrite = false;
9674 PVDIOCTX pIoCtx = NULL;
9675
9676 LogFlowFunc(("pDisk=%#p\n", pDisk));
9677
9678 do
9679 {
9680 /* sanity check */
9681 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9682 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9683
9684 rc2 = vdThreadStartWrite(pDisk);
9685 AssertRC(rc2);
9686 fLockWrite = true;
9687
9688 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9689
9690 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_FLUSH, 0,
9691 0, pDisk->pLast, NULL,
9692 pfnComplete, pvUser1, pvUser2,
9693 NULL, vdFlushHelperAsync,
9694 VDIOCTX_FLAGS_DEFAULT);
9695 if (!pIoCtx)
9696 {
9697 rc = VERR_NO_MEMORY;
9698 break;
9699 }
9700
9701 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
9702 if (rc == VINF_VD_ASYNC_IO_FINISHED)
9703 {
9704 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
9705 vdIoCtxFree(pDisk, pIoCtx);
9706 else
9707 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
9708 }
9709 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
9710 vdIoCtxFree(pDisk, pIoCtx);
9711 } while (0);
9712
9713 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
9714 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
9715 {
9716 rc2 = vdThreadFinishWrite(pDisk);
9717 AssertRC(rc2);
9718 }
9719
9720 LogFlowFunc(("returns %Rrc\n", rc));
9721 return rc;
9722}
9723
9724VBOXDDU_DECL(int) VDAsyncDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges,
9725 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9726 void *pvUser1, void *pvUser2)
9727{
9728 int rc;
9729 int rc2;
9730 bool fLockWrite = false;
9731 PVDIOCTX pIoCtx = NULL;
9732
9733 LogFlowFunc(("pDisk=%#p\n", pDisk));
9734
9735 do
9736 {
9737 /* sanity check */
9738 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9739 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9740
9741 rc2 = vdThreadStartWrite(pDisk);
9742 AssertRC(rc2);
9743 fLockWrite = true;
9744
9745 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9746
9747 pIoCtx = vdIoCtxDiscardAlloc(pDisk, paRanges, cRanges,
9748 pfnComplete, pvUser1, pvUser2, NULL,
9749 vdDiscardHelperAsync,
9750 VDIOCTX_FLAGS_DEFAULT);
9751 if (!pIoCtx)
9752 {
9753 rc = VERR_NO_MEMORY;
9754 break;
9755 }
9756
9757 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
9758 if (rc == VINF_VD_ASYNC_IO_FINISHED)
9759 {
9760 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
9761 vdIoCtxFree(pDisk, pIoCtx);
9762 else
9763 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
9764 }
9765 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
9766 vdIoCtxFree(pDisk, pIoCtx);
9767 } while (0);
9768
9769 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
9770 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
9771 {
9772 rc2 = vdThreadFinishWrite(pDisk);
9773 AssertRC(rc2);
9774 }
9775
9776 LogFlowFunc(("returns %Rrc\n", rc));
9777 return rc;
9778}
9779
9780VBOXDDU_DECL(int) VDRepair(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
9781 const char *pszFilename, const char *pszBackend,
9782 uint32_t fFlags)
9783{
9784 int rc = VERR_NOT_SUPPORTED;
9785 PCVBOXHDDBACKEND pBackend = NULL;
9786 VDINTERFACEIOINT VDIfIoInt;
9787 VDINTERFACEIO VDIfIoFallback;
9788 PVDINTERFACEIO pInterfaceIo;
9789
9790 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
9791 /* Check arguments. */
9792 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
9793 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
9794 VERR_INVALID_PARAMETER);
9795 AssertMsgReturn(VALID_PTR(pszBackend),
9796 ("pszBackend=%#p\n", pszBackend),
9797 VERR_INVALID_PARAMETER);
9798 AssertMsgReturn((fFlags & ~VD_REPAIR_FLAGS_MASK) == 0,
9799 ("fFlags=%#x\n", fFlags),
9800 VERR_INVALID_PARAMETER);
9801
9802 pInterfaceIo = VDIfIoGet(pVDIfsImage);
9803 if (!pInterfaceIo)
9804 {
9805 /*
9806 * Caller doesn't provide an I/O interface, create our own using the
9807 * native file API.
9808 */
9809 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
9810 pInterfaceIo = &VDIfIoFallback;
9811 }
9812
9813 /* Set up the internal I/O interface. */
9814 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
9815 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
9816 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
9817 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
9818 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
9819 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
9820 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
9821 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
9822 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
9823 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
9824 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
9825 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
9826 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
9827 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
9828 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
9829 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
9830 AssertRC(rc);
9831
9832 rc = vdFindBackend(pszBackend, &pBackend);
9833 if (RT_SUCCESS(rc))
9834 {
9835 if (pBackend->pfnRepair)
9836 rc = pBackend->pfnRepair(pszFilename, pVDIfsDisk, pVDIfsImage, fFlags);
9837 else
9838 rc = VERR_VD_IMAGE_REPAIR_NOT_SUPPORTED;
9839 }
9840
9841 LogFlowFunc(("returns %Rrc\n", rc));
9842 return rc;
9843}
9844
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette