VirtualBox

source: vbox/trunk/src/VBox/Storage/VD.cpp@ 50991

Last change on this file since 50991 was 50991, checked in by vboxsync, 11 years ago

Storage: Add support for filter plugins

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 359.1 KB
Line 
1/* $Id: VD.cpp 50991 2014-04-08 10:45:31Z vboxsync $ */
2/** @file
3 * VBoxHDD - VBox HDD Container implementation.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18/*******************************************************************************
19* Header Files *
20*******************************************************************************/
21#define LOG_GROUP LOG_GROUP_VD
22#include <VBox/vd.h>
23#include <VBox/err.h>
24#include <VBox/sup.h>
25#include <VBox/log.h>
26
27#include <iprt/alloc.h>
28#include <iprt/assert.h>
29#include <iprt/uuid.h>
30#include <iprt/file.h>
31#include <iprt/string.h>
32#include <iprt/asm.h>
33#include <iprt/ldr.h>
34#include <iprt/dir.h>
35#include <iprt/path.h>
36#include <iprt/param.h>
37#include <iprt/memcache.h>
38#include <iprt/sg.h>
39#include <iprt/list.h>
40#include <iprt/avl.h>
41#include <iprt/semaphore.h>
42
43#include <VBox/vd-plugin.h>
44
45#include "VDBackends.h"
46
47/** Disable dynamic backends on non x86 architectures. This feature
48 * requires the SUPR3 library which is not available there.
49 */
50#if !defined(VBOX_HDD_NO_DYNAMIC_BACKENDS) && !defined(RT_ARCH_X86) && !defined(RT_ARCH_AMD64)
51# define VBOX_HDD_NO_DYNAMIC_BACKENDS
52#endif
53
54#define VBOXHDDDISK_SIGNATURE 0x6f0e2a7d
55
56/** Buffer size used for merging images. */
57#define VD_MERGE_BUFFER_SIZE (16 * _1M)
58
59/** Maximum number of segments in one I/O task. */
60#define VD_IO_TASK_SEGMENTS_MAX 64
61
62/** Threshold after not recently used blocks are removed from the list. */
63#define VD_DISCARD_REMOVE_THRESHOLD (10 * _1M) /** @todo: experiment */
64
65/**
66 * VD async I/O interface storage descriptor.
67 */
68typedef struct VDIIOFALLBACKSTORAGE
69{
70 /** File handle. */
71 RTFILE File;
72 /** Completion callback. */
73 PFNVDCOMPLETED pfnCompleted;
74 /** Thread for async access. */
75 RTTHREAD ThreadAsync;
76} VDIIOFALLBACKSTORAGE, *PVDIIOFALLBACKSTORAGE;
77
78/**
79 * Structure containing everything I/O related
80 * for the image and cache descriptors.
81 */
82typedef struct VDIO
83{
84 /** I/O interface to the upper layer. */
85 PVDINTERFACEIO pInterfaceIo;
86
87 /** Per image internal I/O interface. */
88 VDINTERFACEIOINT VDIfIoInt;
89
90 /** Fallback I/O interface, only used if the caller doesn't provide it. */
91 VDINTERFACEIO VDIfIo;
92
93 /** Opaque backend data. */
94 void *pBackendData;
95 /** Disk this image is part of */
96 PVBOXHDD pDisk;
97 /** Flag whether to ignore flush requests. */
98 bool fIgnoreFlush;
99} VDIO, *PVDIO;
100
101/** Forward declaration of an I/O task */
102typedef struct VDIOTASK *PVDIOTASK;
103
104/**
105 * VBox HDD Container image descriptor.
106 */
107typedef struct VDIMAGE
108{
109 /** Link to parent image descriptor, if any. */
110 struct VDIMAGE *pPrev;
111 /** Link to child image descriptor, if any. */
112 struct VDIMAGE *pNext;
113 /** Container base filename. (UTF-8) */
114 char *pszFilename;
115 /** Data managed by the backend which keeps the actual info. */
116 void *pBackendData;
117 /** Cached sanitized image flags. */
118 unsigned uImageFlags;
119 /** Image open flags (only those handled generically in this code and which
120 * the backends will never ever see). */
121 unsigned uOpenFlags;
122
123 /** Function pointers for the various backend methods. */
124 PCVBOXHDDBACKEND Backend;
125 /** Pointer to list of VD interfaces, per-image. */
126 PVDINTERFACE pVDIfsImage;
127 /** I/O related things. */
128 VDIO VDIo;
129} VDIMAGE, *PVDIMAGE;
130
131/**
132 * uModified bit flags.
133 */
134#define VD_IMAGE_MODIFIED_FLAG RT_BIT(0)
135#define VD_IMAGE_MODIFIED_FIRST RT_BIT(1)
136#define VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE RT_BIT(2)
137
138
139/**
140 * VBox HDD Cache image descriptor.
141 */
142typedef struct VDCACHE
143{
144 /** Cache base filename. (UTF-8) */
145 char *pszFilename;
146 /** Data managed by the backend which keeps the actual info. */
147 void *pBackendData;
148 /** Cached sanitized image flags. */
149 unsigned uImageFlags;
150 /** Image open flags (only those handled generically in this code and which
151 * the backends will never ever see). */
152 unsigned uOpenFlags;
153
154 /** Function pointers for the various backend methods. */
155 PCVDCACHEBACKEND Backend;
156
157 /** Pointer to list of VD interfaces, per-cache. */
158 PVDINTERFACE pVDIfsCache;
159 /** I/O related things. */
160 VDIO VDIo;
161} VDCACHE, *PVDCACHE;
162
163/**
164 * A block waiting for a discard.
165 */
166typedef struct VDDISCARDBLOCK
167{
168 /** AVL core. */
169 AVLRU64NODECORE Core;
170 /** LRU list node. */
171 RTLISTNODE NodeLru;
172 /** Number of bytes to discard. */
173 size_t cbDiscard;
174 /** Bitmap of allocated sectors. */
175 void *pbmAllocated;
176} VDDISCARDBLOCK, *PVDDISCARDBLOCK;
177
178/**
179 * VD discard state.
180 */
181typedef struct VDDISCARDSTATE
182{
183 /** Number of bytes waiting for a discard. */
184 size_t cbDiscarding;
185 /** AVL tree with blocks waiting for a discard.
186 * The uOffset + cbDiscard range is the search key. */
187 PAVLRU64TREE pTreeBlocks;
188 /** LRU list of the least frequently discarded blocks.
189 * If there are to many blocks waiting the least frequently used
190 * will be removed and the range will be set to 0.
191 */
192 RTLISTNODE ListLru;
193} VDDISCARDSTATE, *PVDDISCARDSTATE;
194
195/**
196 * VD filter instance.
197 */
198typedef struct VDFILTER
199{
200 /** Pointer to the previous filter. */
201 struct VDFILTER *pPrev;
202 /** Pointer to the next filter. */
203 struct VDFILTER *pNext;
204 /** Opaque VD filter backend instance data. */
205 void *pvBackendData;
206 /** Pointer to the filter backend interface. */
207 PCVDFILTERBACKEND pBackend;
208} VDFILTER;
209/** Pointer to a VD filter instance. */
210typedef VDFILTER *PVDFILTER;
211
212/**
213 * VBox HDD Container main structure, private part.
214 */
215struct VBOXHDD
216{
217 /** Structure signature (VBOXHDDDISK_SIGNATURE). */
218 uint32_t u32Signature;
219
220 /** Image type. */
221 VDTYPE enmType;
222
223 /** Number of opened images. */
224 unsigned cImages;
225
226 /** Base image. */
227 PVDIMAGE pBase;
228
229 /** Last opened image in the chain.
230 * The same as pBase if only one image is used. */
231 PVDIMAGE pLast;
232
233 /** If a merge to one of the parents is running this may be non-NULL
234 * to indicate to what image the writes should be additionally relayed. */
235 PVDIMAGE pImageRelay;
236
237 /** Flags representing the modification state. */
238 unsigned uModified;
239
240 /** Cached size of this disk. */
241 uint64_t cbSize;
242 /** Cached PCHS geometry for this disk. */
243 VDGEOMETRY PCHSGeometry;
244 /** Cached LCHS geometry for this disk. */
245 VDGEOMETRY LCHSGeometry;
246
247 /** Pointer to list of VD interfaces, per-disk. */
248 PVDINTERFACE pVDIfsDisk;
249 /** Pointer to the common interface structure for error reporting. */
250 PVDINTERFACEERROR pInterfaceError;
251 /** Pointer to the optional thread synchronization callbacks. */
252 PVDINTERFACETHREADSYNC pInterfaceThreadSync;
253
254 /** Memory cache for I/O contexts */
255 RTMEMCACHE hMemCacheIoCtx;
256 /** Memory cache for I/O tasks. */
257 RTMEMCACHE hMemCacheIoTask;
258 /** An I/O context is currently using the disk structures
259 * Every I/O context must be placed on one of the lists below. */
260 volatile bool fLocked;
261 /** Head of pending I/O tasks waiting for completion - LIFO order. */
262 volatile PVDIOTASK pIoTasksPendingHead;
263 /** Head of newly queued I/O contexts - LIFO order. */
264 volatile PVDIOCTX pIoCtxHead;
265 /** Head of halted I/O contexts which are given back to generic
266 * disk framework by the backend. - LIFO order. */
267 volatile PVDIOCTX pIoCtxHaltedHead;
268
269 /** Head of blocked I/O contexts, processed only
270 * after pIoCtxLockOwner was freed - LIFO order. */
271 volatile PVDIOCTX pIoCtxBlockedHead;
272 /** I/O context which locked the disk for a growing write or flush request.
273 * Other flush or growing write requests need to wait until
274 * the current one completes. - NIL_VDIOCTX if unlocked. */
275 volatile PVDIOCTX pIoCtxLockOwner;
276
277 /** Pointer to the L2 disk cache if any. */
278 PVDCACHE pCache;
279 /** Pointer to the discard state if any. */
280 PVDDISCARDSTATE pDiscard;
281
282 /** Pointer to the first filter in the chain. */
283 PVDFILTER pFilterHead;
284 /** Pointer to the last filter in the chain. */
285 PVDFILTER pFilterTail;
286};
287
288# define VD_IS_LOCKED(a_pDisk) \
289 do \
290 { \
291 AssertMsg(a_pDisk->fLocked, \
292 ("Lock not held\n"));\
293 } while(0)
294
295/**
296 * VBox parent read descriptor, used internally for compaction.
297 */
298typedef struct VDPARENTSTATEDESC
299{
300 /** Pointer to disk descriptor. */
301 PVBOXHDD pDisk;
302 /** Pointer to image descriptor. */
303 PVDIMAGE pImage;
304} VDPARENTSTATEDESC, *PVDPARENTSTATEDESC;
305
306/**
307 * Transfer direction.
308 */
309typedef enum VDIOCTXTXDIR
310{
311 /** Read */
312 VDIOCTXTXDIR_READ = 0,
313 /** Write */
314 VDIOCTXTXDIR_WRITE,
315 /** Flush */
316 VDIOCTXTXDIR_FLUSH,
317 /** Discard */
318 VDIOCTXTXDIR_DISCARD,
319 /** 32bit hack */
320 VDIOCTXTXDIR_32BIT_HACK = 0x7fffffff
321} VDIOCTXTXDIR, *PVDIOCTXTXDIR;
322
323/** Transfer function */
324typedef DECLCALLBACK(int) FNVDIOCTXTRANSFER (PVDIOCTX pIoCtx);
325/** Pointer to a transfer function. */
326typedef FNVDIOCTXTRANSFER *PFNVDIOCTXTRANSFER;
327
328/**
329 * I/O context
330 */
331typedef struct VDIOCTX
332{
333 /** Pointer to the next I/O context. */
334 struct VDIOCTX * volatile pIoCtxNext;
335 /** Disk this is request is for. */
336 PVBOXHDD pDisk;
337 /** Return code. */
338 int rcReq;
339 /** Various flags for the I/O context. */
340 uint32_t fFlags;
341 /** Number of data transfers currently pending. */
342 volatile uint32_t cDataTransfersPending;
343 /** How many meta data transfers are pending. */
344 volatile uint32_t cMetaTransfersPending;
345 /** Flag whether the request finished */
346 volatile bool fComplete;
347 /** Temporary allocated memory which is freed
348 * when the context completes. */
349 void *pvAllocation;
350 /** Transfer function. */
351 PFNVDIOCTXTRANSFER pfnIoCtxTransfer;
352 /** Next transfer part after the current one completed. */
353 PFNVDIOCTXTRANSFER pfnIoCtxTransferNext;
354 /** Transfer direction */
355 VDIOCTXTXDIR enmTxDir;
356 /** Request type dependent data. */
357 union
358 {
359 /** I/O request (read/write). */
360 struct
361 {
362 /** Number of bytes left until this context completes. */
363 volatile uint32_t cbTransferLeft;
364 /** Current offset */
365 volatile uint64_t uOffset;
366 /** Number of bytes to transfer */
367 volatile size_t cbTransfer;
368 /** Current image in the chain. */
369 PVDIMAGE pImageCur;
370 /** Start image to read from. pImageCur is reset to this
371 * value after it reached the first image in the chain. */
372 PVDIMAGE pImageStart;
373 /** S/G buffer */
374 RTSGBUF SgBuf;
375 /** Number of bytes to clear in the buffer before the current read. */
376 size_t cbBufClear;
377 /** Number of images to read. */
378 unsigned cImagesRead;
379 /** Override for the parent image to start reading from. */
380 PVDIMAGE pImageParentOverride;
381 /** Original offset of the transfer - required for filtering read requests. */
382 uint64_t uOffsetXferOrig;
383 /** Original size of the transfer - required for fitlering read requests. */
384 size_t cbXferOrig;
385 } Io;
386 /** Discard requests. */
387 struct
388 {
389 /** Pointer to the range descriptor array. */
390 PCRTRANGE paRanges;
391 /** Number of ranges in the array. */
392 unsigned cRanges;
393 /** Range descriptor index which is processed. */
394 unsigned idxRange;
395 /** Start offset to discard currently. */
396 uint64_t offCur;
397 /** How many bytes left to discard in the current range. */
398 size_t cbDiscardLeft;
399 /** How many bytes to discard in the current block (<= cbDiscardLeft). */
400 size_t cbThisDiscard;
401 /** Discard block handled currently. */
402 PVDDISCARDBLOCK pBlock;
403 } Discard;
404 } Req;
405 /** Parent I/O context if any. Sets the type of the context (root/child) */
406 PVDIOCTX pIoCtxParent;
407 /** Type dependent data (root/child) */
408 union
409 {
410 /** Root data */
411 struct
412 {
413 /** Completion callback */
414 PFNVDASYNCTRANSFERCOMPLETE pfnComplete;
415 /** User argument 1 passed on completion. */
416 void *pvUser1;
417 /** User argument 2 passed on completion. */
418 void *pvUser2;
419 } Root;
420 /** Child data */
421 struct
422 {
423 /** Saved start offset */
424 uint64_t uOffsetSaved;
425 /** Saved transfer size */
426 size_t cbTransferLeftSaved;
427 /** Number of bytes transferred from the parent if this context completes. */
428 size_t cbTransferParent;
429 /** Number of bytes to pre read */
430 size_t cbPreRead;
431 /** Number of bytes to post read. */
432 size_t cbPostRead;
433 /** Number of bytes to write left in the parent. */
434 size_t cbWriteParent;
435 /** Write type dependent data. */
436 union
437 {
438 /** Optimized */
439 struct
440 {
441 /** Bytes to fill to satisfy the block size. Not part of the virtual disk. */
442 size_t cbFill;
443 /** Bytes to copy instead of reading from the parent */
444 size_t cbWriteCopy;
445 /** Bytes to read from the image. */
446 size_t cbReadImage;
447 } Optimized;
448 } Write;
449 } Child;
450 } Type;
451} VDIOCTX;
452
453/** Default flags for an I/O context, i.e. unblocked and async. */
454#define VDIOCTX_FLAGS_DEFAULT (0)
455/** Flag whether the context is blocked. */
456#define VDIOCTX_FLAGS_BLOCKED RT_BIT_32(0)
457/** Flag whether the I/O context is using synchronous I/O. */
458#define VDIOCTX_FLAGS_SYNC RT_BIT_32(1)
459/** Flag whether the read should update the cache. */
460#define VDIOCTX_FLAGS_READ_UPDATE_CACHE RT_BIT_32(2)
461/** Flag whether free blocks should be zeroed.
462 * If false and no image has data for sepcified
463 * range VERR_VD_BLOCK_FREE is returned for the I/O context.
464 * Note that unallocated blocks are still zeroed
465 * if at least one image has valid data for a part
466 * of the range.
467 */
468#define VDIOCTX_FLAGS_ZERO_FREE_BLOCKS RT_BIT_32(3)
469/** Don't free the I/O context when complete because
470 * it was alloacted elsewhere (stack, ...). */
471#define VDIOCTX_FLAGS_DONT_FREE RT_BIT_32(4)
472/* Don't set the modified flag for this I/O context when writing. */
473#define VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG RT_BIT_32(5)
474
475/** NIL I/O context pointer value. */
476#define NIL_VDIOCTX ((PVDIOCTX)0)
477
478/**
479 * List node for deferred I/O contexts.
480 */
481typedef struct VDIOCTXDEFERRED
482{
483 /** Node in the list of deferred requests.
484 * A request can be deferred if the image is growing
485 * and the request accesses the same range or if
486 * the backend needs to read or write metadata from the disk
487 * before it can continue. */
488 RTLISTNODE NodeDeferred;
489 /** I/O context this entry points to. */
490 PVDIOCTX pIoCtx;
491} VDIOCTXDEFERRED, *PVDIOCTXDEFERRED;
492
493/**
494 * I/O task.
495 */
496typedef struct VDIOTASK
497{
498 /** Next I/O task waiting in the list. */
499 struct VDIOTASK * volatile pNext;
500 /** Storage this task belongs to. */
501 PVDIOSTORAGE pIoStorage;
502 /** Optional completion callback. */
503 PFNVDXFERCOMPLETED pfnComplete;
504 /** Opaque user data. */
505 void *pvUser;
506 /** Completion status code for the task. */
507 int rcReq;
508 /** Flag whether this is a meta data transfer. */
509 bool fMeta;
510 /** Type dependent data. */
511 union
512 {
513 /** User data transfer. */
514 struct
515 {
516 /** Number of bytes this task transferred. */
517 uint32_t cbTransfer;
518 /** Pointer to the I/O context the task belongs. */
519 PVDIOCTX pIoCtx;
520 } User;
521 /** Meta data transfer. */
522 struct
523 {
524 /** Meta transfer this task is for. */
525 PVDMETAXFER pMetaXfer;
526 } Meta;
527 } Type;
528} VDIOTASK;
529
530/**
531 * Storage handle.
532 */
533typedef struct VDIOSTORAGE
534{
535 /** Image I/O state this storage handle belongs to. */
536 PVDIO pVDIo;
537 /** AVL tree for pending async metadata transfers. */
538 PAVLRFOFFTREE pTreeMetaXfers;
539 /** Storage handle */
540 void *pStorage;
541} VDIOSTORAGE;
542
543/**
544 * Metadata transfer.
545 *
546 * @note This entry can't be freed if either the list is not empty or
547 * the reference counter is not 0.
548 * The assumption is that the backends don't need to read huge amounts of
549 * metadata to complete a transfer so the additional memory overhead should
550 * be relatively small.
551 */
552typedef struct VDMETAXFER
553{
554 /** AVL core for fast search (the file offset is the key) */
555 AVLRFOFFNODECORE Core;
556 /** I/O storage for this transfer. */
557 PVDIOSTORAGE pIoStorage;
558 /** Flags. */
559 uint32_t fFlags;
560 /** List of I/O contexts waiting for this metadata transfer to complete. */
561 RTLISTNODE ListIoCtxWaiting;
562 /** Number of references to this entry. */
563 unsigned cRefs;
564 /** Size of the data stored with this entry. */
565 size_t cbMeta;
566 /** Data stored - variable size. */
567 uint8_t abData[1];
568} VDMETAXFER;
569
570/**
571 * The transfer direction for the metadata.
572 */
573#define VDMETAXFER_TXDIR_MASK 0x3
574#define VDMETAXFER_TXDIR_NONE 0x0
575#define VDMETAXFER_TXDIR_WRITE 0x1
576#define VDMETAXFER_TXDIR_READ 0x2
577#define VDMETAXFER_TXDIR_FLUSH 0x3
578#define VDMETAXFER_TXDIR_GET(flags) ((flags) & VDMETAXFER_TXDIR_MASK)
579#define VDMETAXFER_TXDIR_SET(flags, dir) ((flags) = (flags & ~VDMETAXFER_TXDIR_MASK) | (dir))
580
581/**
582 * Plugin structure.
583 */
584typedef struct VDPLUGIN
585{
586 /** Pointer to the next plugin structure. */
587 RTLISTNODE NodePlugin;
588 /** Handle of loaded plugin library. */
589 RTLDRMOD hPlugin;
590} VDPLUGIN;
591/** Pointer to a plugin structure. */
592typedef VDPLUGIN *PVDPLUGIN;
593
594/** Head of loaded plugin list. */
595static RTLISTANCHOR g_ListPluginsLoaded;
596
597/** Number of image backends supported. */
598static unsigned g_cBackends = 0;
599/** Array of pointers to the image backends. */
600static PCVBOXHDDBACKEND *g_apBackends = NULL;
601/** Builtin image backends. */
602static PCVBOXHDDBACKEND aStaticBackends[] =
603{
604 &g_VmdkBackend,
605 &g_VDIBackend,
606 &g_VhdBackend,
607 &g_ParallelsBackend,
608 &g_DmgBackend,
609 &g_QedBackend,
610 &g_QCowBackend,
611 &g_VhdxBackend,
612 &g_RawBackend,
613 &g_ISCSIBackend
614};
615
616/** Number of supported cache backends. */
617static unsigned g_cCacheBackends = 0;
618/** Array of pointers to the cache backends. */
619static PCVDCACHEBACKEND *g_apCacheBackends = NULL;
620/** Builtin cache backends. */
621static PCVDCACHEBACKEND aStaticCacheBackends[] =
622{
623 &g_VciCacheBackend
624};
625
626/** Number of supported filter backends. */
627static unsigned g_cFilterBackends = 0;
628/** Array of pointers to the filters backends. */
629static PCVDFILTERBACKEND *g_apFilterBackends = NULL;
630
631/** Forward declaration of the async discard helper. */
632static int vdDiscardHelperAsync(PVDIOCTX pIoCtx);
633static int vdWriteHelperAsync(PVDIOCTX pIoCtx);
634static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk);
635static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc);
636static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq);
637
638/**
639 * internal: add several backends.
640 */
641static int vdAddBackends(PCVBOXHDDBACKEND *ppBackends, unsigned cBackends)
642{
643 PCVBOXHDDBACKEND *pTmp = (PCVBOXHDDBACKEND*)RTMemRealloc(g_apBackends,
644 (g_cBackends + cBackends) * sizeof(PCVBOXHDDBACKEND));
645 if (RT_UNLIKELY(!pTmp))
646 return VERR_NO_MEMORY;
647 g_apBackends = pTmp;
648 memcpy(&g_apBackends[g_cBackends], ppBackends, cBackends * sizeof(PCVBOXHDDBACKEND));
649 g_cBackends += cBackends;
650 return VINF_SUCCESS;
651}
652
653/**
654 * internal: add single backend.
655 */
656DECLINLINE(int) vdAddBackend(PCVBOXHDDBACKEND pBackend)
657{
658 return vdAddBackends(&pBackend, 1);
659}
660
661/**
662 * internal: add several cache backends.
663 */
664static int vdAddCacheBackends(PCVDCACHEBACKEND *ppBackends, unsigned cBackends)
665{
666 PCVDCACHEBACKEND *pTmp = (PCVDCACHEBACKEND*)RTMemRealloc(g_apCacheBackends,
667 (g_cCacheBackends + cBackends) * sizeof(PCVDCACHEBACKEND));
668 if (RT_UNLIKELY(!pTmp))
669 return VERR_NO_MEMORY;
670 g_apCacheBackends = pTmp;
671 memcpy(&g_apCacheBackends[g_cCacheBackends], ppBackends, cBackends * sizeof(PCVDCACHEBACKEND));
672 g_cCacheBackends += cBackends;
673 return VINF_SUCCESS;
674}
675
676/**
677 * internal: add single cache backend.
678 */
679DECLINLINE(int) vdAddCacheBackend(PCVDCACHEBACKEND pBackend)
680{
681 return vdAddCacheBackends(&pBackend, 1);
682}
683
684/**
685 * Add several filter bakends.
686 *
687 * @returns VBox status code.
688 * @param ppBackends Array of filter backends to add.
689 * @param cBackends Number of backends to add.
690 */
691static int vdAddFilterBackends(PCVDFILTERBACKEND *ppBackends, unsigned cBackends)
692{
693 PCVDFILTERBACKEND *pTmp = (PCVDFILTERBACKEND *)RTMemRealloc(g_apFilterBackends,
694 (g_cFilterBackends + cBackends) * sizeof(PCVDFILTERBACKEND));
695 if (RT_UNLIKELY(!pTmp))
696 return VERR_NO_MEMORY;
697 g_apFilterBackends = pTmp;
698 memcpy(&g_apFilterBackends[g_cFilterBackends], ppBackends, cBackends * sizeof(PCVDFILTERBACKEND));
699 g_cFilterBackends += cBackends;
700 return VINF_SUCCESS;
701}
702
703/**
704 * Add a single filter backend to the list of supported filters.
705 *
706 * @returns VBox status code.
707 * @param pBackend The backend to add.
708 */
709DECLINLINE(int) vdAddFilterBackend(PCVDFILTERBACKEND pBackend)
710{
711 return vdAddFilterBackends(&pBackend, 1);
712}
713
714/**
715 * internal: issue error message.
716 */
717static int vdError(PVBOXHDD pDisk, int rc, RT_SRC_POS_DECL,
718 const char *pszFormat, ...)
719{
720 va_list va;
721 va_start(va, pszFormat);
722 if (pDisk->pInterfaceError)
723 pDisk->pInterfaceError->pfnError(pDisk->pInterfaceError->Core.pvUser, rc, RT_SRC_POS_ARGS, pszFormat, va);
724 va_end(va);
725 return rc;
726}
727
728/**
729 * internal: thread synchronization, start read.
730 */
731DECLINLINE(int) vdThreadStartRead(PVBOXHDD pDisk)
732{
733 int rc = VINF_SUCCESS;
734 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
735 rc = pDisk->pInterfaceThreadSync->pfnStartRead(pDisk->pInterfaceThreadSync->Core.pvUser);
736 return rc;
737}
738
739/**
740 * internal: thread synchronization, finish read.
741 */
742DECLINLINE(int) vdThreadFinishRead(PVBOXHDD pDisk)
743{
744 int rc = VINF_SUCCESS;
745 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
746 rc = pDisk->pInterfaceThreadSync->pfnFinishRead(pDisk->pInterfaceThreadSync->Core.pvUser);
747 return rc;
748}
749
750/**
751 * internal: thread synchronization, start write.
752 */
753DECLINLINE(int) vdThreadStartWrite(PVBOXHDD pDisk)
754{
755 int rc = VINF_SUCCESS;
756 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
757 rc = pDisk->pInterfaceThreadSync->pfnStartWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
758 return rc;
759}
760
761/**
762 * internal: thread synchronization, finish write.
763 */
764DECLINLINE(int) vdThreadFinishWrite(PVBOXHDD pDisk)
765{
766 int rc = VINF_SUCCESS;
767 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
768 rc = pDisk->pInterfaceThreadSync->pfnFinishWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
769 return rc;
770}
771
772/**
773 * internal: find image format backend.
774 */
775static int vdFindBackend(const char *pszBackend, PCVBOXHDDBACKEND *ppBackend)
776{
777 int rc = VINF_SUCCESS;
778 PCVBOXHDDBACKEND pBackend = NULL;
779
780 if (!g_apBackends)
781 VDInit();
782
783 for (unsigned i = 0; i < g_cBackends; i++)
784 {
785 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
786 {
787 pBackend = g_apBackends[i];
788 break;
789 }
790 }
791 *ppBackend = pBackend;
792 return rc;
793}
794
795/**
796 * internal: find cache format backend.
797 */
798static int vdFindCacheBackend(const char *pszBackend, PCVDCACHEBACKEND *ppBackend)
799{
800 int rc = VINF_SUCCESS;
801 PCVDCACHEBACKEND pBackend = NULL;
802
803 if (!g_apCacheBackends)
804 VDInit();
805
806 for (unsigned i = 0; i < g_cCacheBackends; i++)
807 {
808 if (!RTStrICmp(pszBackend, g_apCacheBackends[i]->pszBackendName))
809 {
810 pBackend = g_apCacheBackends[i];
811 break;
812 }
813 }
814 *ppBackend = pBackend;
815 return rc;
816}
817
818/**
819 * internal: find filter backend.
820 */
821static int vdFindFilterBackend(const char *pszFilter, PCVDFILTERBACKEND *ppBackend)
822{
823 int rc = VINF_SUCCESS;
824 PCVDFILTERBACKEND pBackend = NULL;
825
826 for (unsigned i = 0; i < g_cFilterBackends; i++)
827 {
828 if (!RTStrICmp(pszFilter, g_apFilterBackends[i]->pszBackendName))
829 {
830 pBackend = g_apFilterBackends[i];
831 break;
832 }
833 }
834 *ppBackend = pBackend;
835 return rc;
836}
837
838
839/**
840 * internal: add image structure to the end of images list.
841 */
842static void vdAddImageToList(PVBOXHDD pDisk, PVDIMAGE pImage)
843{
844 pImage->pPrev = NULL;
845 pImage->pNext = NULL;
846
847 if (pDisk->pBase)
848 {
849 Assert(pDisk->cImages > 0);
850 pImage->pPrev = pDisk->pLast;
851 pDisk->pLast->pNext = pImage;
852 pDisk->pLast = pImage;
853 }
854 else
855 {
856 Assert(pDisk->cImages == 0);
857 pDisk->pBase = pImage;
858 pDisk->pLast = pImage;
859 }
860
861 pDisk->cImages++;
862}
863
864/**
865 * internal: remove image structure from the images list.
866 */
867static void vdRemoveImageFromList(PVBOXHDD pDisk, PVDIMAGE pImage)
868{
869 Assert(pDisk->cImages > 0);
870
871 if (pImage->pPrev)
872 pImage->pPrev->pNext = pImage->pNext;
873 else
874 pDisk->pBase = pImage->pNext;
875
876 if (pImage->pNext)
877 pImage->pNext->pPrev = pImage->pPrev;
878 else
879 pDisk->pLast = pImage->pPrev;
880
881 pImage->pPrev = NULL;
882 pImage->pNext = NULL;
883
884 pDisk->cImages--;
885}
886
887/**
888 * internal: add filter structure to the end of filter list.
889 */
890static void vdAddFilterToList(PVBOXHDD pDisk, PVDFILTER pFilter)
891{
892 pFilter->pPrev = NULL;
893 pFilter->pNext = NULL;
894
895 if (pDisk->pFilterHead)
896 {
897 pFilter->pPrev = pDisk->pFilterTail;
898 pDisk->pFilterTail->pNext = pFilter;
899 pDisk->pFilterTail = pFilter;
900 }
901 else
902 {
903 pDisk->pFilterHead = pFilter;
904 pDisk->pFilterTail = pFilter;
905 }
906}
907
908/**
909 * internal: Remove last filter structure from the filter list.
910 */
911static void vdRemoveFilterFromList(PVBOXHDD pDisk, PVDFILTER pFilter)
912{
913 Assert(pDisk->pFilterHead != NULL && pDisk->pFilterTail != NULL);
914
915 if (pFilter->pPrev)
916 pFilter->pPrev->pNext = pFilter->pNext;
917 else
918 pDisk->pFilterHead = pFilter->pNext;
919
920 if (pFilter->pNext)
921 pFilter->pNext->pPrev = pFilter->pPrev;
922 else
923 pDisk->pFilterTail = pFilter->pPrev;
924
925 pFilter->pPrev = NULL;
926 pFilter->pNext = NULL;
927}
928
929/**
930 * internal: find image by index into the images list.
931 */
932static PVDIMAGE vdGetImageByNumber(PVBOXHDD pDisk, unsigned nImage)
933{
934 PVDIMAGE pImage = pDisk->pBase;
935 if (nImage == VD_LAST_IMAGE)
936 return pDisk->pLast;
937 while (pImage && nImage)
938 {
939 pImage = pImage->pNext;
940 nImage--;
941 }
942 return pImage;
943}
944
945/**
946 * Applies the filter chain to the given write request.
947 *
948 * @returns VBox status code.
949 * @param pDisk The HDD container.
950 * @param uOffset The start offset of the write.
951 * @param cbWrite Number of bytes to write.
952 * @param pIoCtx The I/O context associated with the request.
953 */
954static int vdFilterChainApplyWrite(PVBOXHDD pDisk, uint64_t uOffset, size_t cbWrite,
955 PVDIOCTX pIoCtx)
956{
957 int rc = VINF_SUCCESS;
958
959 if (pDisk->pFilterHead)
960 {
961 PVDFILTER pFilterCurr = pDisk->pFilterHead;
962
963 do
964 {
965 rc = pFilterCurr->pBackend->pfnFilterWrite(pFilterCurr->pvBackendData, uOffset, cbWrite, pIoCtx);
966 /* Reset S/G buffer for the next filter. */
967 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
968
969 pFilterCurr = pFilterCurr->pNext;
970 } while ( RT_SUCCESS(rc)
971 && pFilterCurr);
972 }
973
974 return rc;
975}
976
977/**
978 * Applies the filter chain to the given read request.
979 *
980 * @returns VBox status code.
981 * @param pDisk The HDD container.
982 * @param uOffset The start offset of the read.
983 * @param cbRead Number of bytes read.
984 * @param pIoCtx The I/O context associated with the request.
985 */
986static int vdFilterChainApplyRead(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRead,
987 PVDIOCTX pIoCtx)
988{
989 int rc = VINF_SUCCESS;
990
991 if (pDisk->pFilterHead)
992 {
993 PVDFILTER pFilterCurr = pDisk->pFilterHead;
994
995 do
996 {
997 rc = pFilterCurr->pBackend->pfnFilterRead(pFilterCurr->pvBackendData, uOffset, cbRead, pIoCtx);
998 /* Reset S/G buffer for the next filter. */
999 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1000
1001 pFilterCurr = pFilterCurr->pNext;
1002 } while ( RT_SUCCESS(rc)
1003 && pFilterCurr);
1004 }
1005
1006 return rc;
1007}
1008
1009DECLINLINE(void) vdIoCtxRootComplete(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1010{
1011 if ( RT_SUCCESS(pIoCtx->rcReq)
1012 && pIoCtx->enmTxDir == VDIOCTXTXDIR_READ)
1013 pIoCtx->rcReq = vdFilterChainApplyRead(pDisk, pIoCtx->Req.Io.uOffsetXferOrig,
1014 pIoCtx->Req.Io.cbXferOrig, pIoCtx);
1015
1016 pIoCtx->Type.Root.pfnComplete(pIoCtx->Type.Root.pvUser1,
1017 pIoCtx->Type.Root.pvUser2,
1018 pIoCtx->rcReq);
1019}
1020
1021/**
1022 * Initialize the structure members of a given I/O context.
1023 */
1024DECLINLINE(void) vdIoCtxInit(PVDIOCTX pIoCtx, PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1025 uint64_t uOffset, size_t cbTransfer, PVDIMAGE pImageStart,
1026 PCRTSGBUF pcSgBuf, void *pvAllocation,
1027 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
1028{
1029 pIoCtx->pDisk = pDisk;
1030 pIoCtx->enmTxDir = enmTxDir;
1031 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTransfer; Assert((uint32_t)cbTransfer == cbTransfer);
1032 pIoCtx->Req.Io.uOffset = uOffset;
1033 pIoCtx->Req.Io.cbTransfer = cbTransfer;
1034 pIoCtx->Req.Io.pImageStart = pImageStart;
1035 pIoCtx->Req.Io.pImageCur = pImageStart;
1036 pIoCtx->Req.Io.cbBufClear = 0;
1037 pIoCtx->Req.Io.pImageParentOverride = NULL;
1038 pIoCtx->Req.Io.uOffsetXferOrig = uOffset;
1039 pIoCtx->Req.Io.cbXferOrig = cbTransfer;
1040 pIoCtx->cDataTransfersPending = 0;
1041 pIoCtx->cMetaTransfersPending = 0;
1042 pIoCtx->fComplete = false;
1043 pIoCtx->fFlags = fFlags;
1044 pIoCtx->pvAllocation = pvAllocation;
1045 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1046 pIoCtx->pfnIoCtxTransferNext = NULL;
1047 pIoCtx->rcReq = VINF_SUCCESS;
1048 pIoCtx->pIoCtxParent = NULL;
1049
1050 /* There is no S/G list for a flush request. */
1051 if ( enmTxDir != VDIOCTXTXDIR_FLUSH
1052 && enmTxDir != VDIOCTXTXDIR_DISCARD)
1053 RTSgBufClone(&pIoCtx->Req.Io.SgBuf, pcSgBuf);
1054 else
1055 memset(&pIoCtx->Req.Io.SgBuf, 0, sizeof(RTSGBUF));
1056}
1057
1058/**
1059 * Internal: Tries to read the desired range from the given cache.
1060 *
1061 * @returns VBox status code.
1062 * @retval VERR_VD_BLOCK_FREE if the block is not in the cache.
1063 * pcbRead will be set to the number of bytes not in the cache.
1064 * Everything thereafter might be in the cache.
1065 * @param pCache The cache to read from.
1066 * @param uOffset Offset of the virtual disk to read.
1067 * @param cbRead How much to read.
1068 * @param pIoCtx The I/O context to read into.
1069 * @param pcbRead Where to store the number of bytes actually read.
1070 * On success this indicates the number of bytes read from the cache.
1071 * If VERR_VD_BLOCK_FREE is returned this gives the number of bytes
1072 * which are not in the cache.
1073 * In both cases everything beyond this value
1074 * might or might not be in the cache.
1075 */
1076static int vdCacheReadHelper(PVDCACHE pCache, uint64_t uOffset,
1077 size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbRead)
1078{
1079 int rc = VINF_SUCCESS;
1080
1081 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbRead=%zu pcbRead=%#p\n",
1082 pCache, uOffset, pIoCtx, cbRead, pcbRead));
1083
1084 AssertPtr(pCache);
1085 AssertPtr(pcbRead);
1086
1087 rc = pCache->Backend->pfnRead(pCache->pBackendData, uOffset, cbRead,
1088 pIoCtx, pcbRead);
1089
1090 LogFlowFunc(("returns rc=%Rrc pcbRead=%zu\n", rc, *pcbRead));
1091 return rc;
1092}
1093
1094/**
1095 * Internal: Writes data for the given block into the cache.
1096 *
1097 * @returns VBox status code.
1098 * @param pCache The cache to write to.
1099 * @param uOffset Offset of the virtual disk to write to the cache.
1100 * @param cbWrite How much to write.
1101 * @param pIoCtx The I/O context to ẃrite from.
1102 * @param pcbWritten How much data could be written, optional.
1103 */
1104static int vdCacheWriteHelper(PVDCACHE pCache, uint64_t uOffset, size_t cbWrite,
1105 PVDIOCTX pIoCtx, size_t *pcbWritten)
1106{
1107 int rc = VINF_SUCCESS;
1108
1109 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbWrite=%zu pcbWritten=%#p\n",
1110 pCache, uOffset, pIoCtx, cbWrite, pcbWritten));
1111
1112 AssertPtr(pCache);
1113 AssertPtr(pIoCtx);
1114 Assert(cbWrite > 0);
1115
1116 if (pcbWritten)
1117 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
1118 pIoCtx, pcbWritten);
1119 else
1120 {
1121 size_t cbWritten = 0;
1122
1123 do
1124 {
1125 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
1126 pIoCtx, &cbWritten);
1127 uOffset += cbWritten;
1128 cbWrite -= cbWritten;
1129 } while ( cbWrite
1130 && ( RT_SUCCESS(rc)
1131 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
1132 }
1133
1134 LogFlowFunc(("returns rc=%Rrc pcbWritten=%zu\n",
1135 rc, pcbWritten ? *pcbWritten : cbWrite));
1136 return rc;
1137}
1138
1139/**
1140 * Creates a new empty discard state.
1141 *
1142 * @returns Pointer to the new discard state or NULL if out of memory.
1143 */
1144static PVDDISCARDSTATE vdDiscardStateCreate(void)
1145{
1146 PVDDISCARDSTATE pDiscard = (PVDDISCARDSTATE)RTMemAllocZ(sizeof(VDDISCARDSTATE));
1147
1148 if (pDiscard)
1149 {
1150 RTListInit(&pDiscard->ListLru);
1151 pDiscard->pTreeBlocks = (PAVLRU64TREE)RTMemAllocZ(sizeof(AVLRU64TREE));
1152 if (!pDiscard->pTreeBlocks)
1153 {
1154 RTMemFree(pDiscard);
1155 pDiscard = NULL;
1156 }
1157 }
1158
1159 return pDiscard;
1160}
1161
1162/**
1163 * Removes the least recently used blocks from the waiting list until
1164 * the new value is reached.
1165 *
1166 * @returns VBox status code.
1167 * @param pDisk VD disk container.
1168 * @param pDiscard The discard state.
1169 * @param cbDiscardingNew How many bytes should be waiting on success.
1170 * The number of bytes waiting can be less.
1171 */
1172static int vdDiscardRemoveBlocks(PVBOXHDD pDisk, PVDDISCARDSTATE pDiscard, size_t cbDiscardingNew)
1173{
1174 int rc = VINF_SUCCESS;
1175
1176 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
1177 pDisk, pDiscard, cbDiscardingNew));
1178
1179 while (pDiscard->cbDiscarding > cbDiscardingNew)
1180 {
1181 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
1182
1183 Assert(!RTListIsEmpty(&pDiscard->ListLru));
1184
1185 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
1186 uint64_t offStart = pBlock->Core.Key;
1187 uint32_t idxStart = 0;
1188 size_t cbLeft = pBlock->cbDiscard;
1189 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
1190 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
1191
1192 while (cbLeft > 0)
1193 {
1194 int32_t idxEnd;
1195 size_t cbThis = cbLeft;
1196
1197 if (fAllocated)
1198 {
1199 /* Check for the first unallocated bit. */
1200 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
1201 if (idxEnd != -1)
1202 {
1203 cbThis = (idxEnd - idxStart) * 512;
1204 fAllocated = false;
1205 }
1206 }
1207 else
1208 {
1209 /* Mark as unused and check for the first set bit. */
1210 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
1211 if (idxEnd != -1)
1212 cbThis = (idxEnd - idxStart) * 512;
1213
1214
1215 VDIOCTX IoCtx;
1216 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_DISCARD, 0, 0, NULL,
1217 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
1218 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData,
1219 &IoCtx, offStart, cbThis, NULL,
1220 NULL, &cbThis, NULL,
1221 VD_DISCARD_MARK_UNUSED);
1222 if (RT_FAILURE(rc))
1223 break;
1224
1225 fAllocated = true;
1226 }
1227
1228 idxStart = idxEnd;
1229 offStart += cbThis;
1230 cbLeft -= cbThis;
1231 }
1232
1233 if (RT_FAILURE(rc))
1234 break;
1235
1236 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
1237 Assert(pBlockRemove == pBlock);
1238 RTListNodeRemove(&pBlock->NodeLru);
1239
1240 pDiscard->cbDiscarding -= pBlock->cbDiscard;
1241 RTMemFree(pBlock->pbmAllocated);
1242 RTMemFree(pBlock);
1243 }
1244
1245 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
1246
1247 LogFlowFunc(("returns rc=%Rrc\n", rc));
1248 return rc;
1249}
1250
1251/**
1252 * Destroys the current discard state, writing any waiting blocks to the image.
1253 *
1254 * @returns VBox status code.
1255 * @param pDisk VD disk container.
1256 */
1257static int vdDiscardStateDestroy(PVBOXHDD pDisk)
1258{
1259 int rc = VINF_SUCCESS;
1260
1261 if (pDisk->pDiscard)
1262 {
1263 rc = vdDiscardRemoveBlocks(pDisk, pDisk->pDiscard, 0 /* Remove all blocks. */);
1264 AssertRC(rc);
1265 RTMemFree(pDisk->pDiscard->pTreeBlocks);
1266 RTMemFree(pDisk->pDiscard);
1267 pDisk->pDiscard = NULL;
1268 }
1269
1270 return rc;
1271}
1272
1273/**
1274 * Marks the given range as allocated in the image.
1275 * Required if there are discards in progress and a write to a block which can get discarded
1276 * is written to.
1277 *
1278 * @returns VBox status code.
1279 * @param pDisk VD container data.
1280 * @param uOffset First byte to mark as allocated.
1281 * @param cbRange Number of bytes to mark as allocated.
1282 */
1283static int vdDiscardSetRangeAllocated(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRange)
1284{
1285 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
1286 int rc = VINF_SUCCESS;
1287
1288 if (pDiscard)
1289 {
1290 do
1291 {
1292 size_t cbThisRange = cbRange;
1293 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64RangeGet(pDiscard->pTreeBlocks, uOffset);
1294
1295 if (pBlock)
1296 {
1297 int32_t idxStart, idxEnd;
1298
1299 Assert(!(cbThisRange % 512));
1300 Assert(!((uOffset - pBlock->Core.Key) % 512));
1301
1302 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.KeyLast - uOffset + 1);
1303
1304 idxStart = (uOffset - pBlock->Core.Key) / 512;
1305 idxEnd = idxStart + (int32_t)(cbThisRange / 512);
1306 ASMBitSetRange(pBlock->pbmAllocated, idxStart, idxEnd);
1307 }
1308 else
1309 {
1310 pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, uOffset, true);
1311 if (pBlock)
1312 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.Key - uOffset);
1313 }
1314
1315 Assert(cbRange >= cbThisRange);
1316
1317 uOffset += cbThisRange;
1318 cbRange -= cbThisRange;
1319 } while (cbRange != 0);
1320 }
1321
1322 return rc;
1323}
1324
1325DECLINLINE(PVDIOCTX) vdIoCtxAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1326 uint64_t uOffset, size_t cbTransfer,
1327 PVDIMAGE pImageStart,PCRTSGBUF pcSgBuf,
1328 void *pvAllocation, PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1329 uint32_t fFlags)
1330{
1331 PVDIOCTX pIoCtx = NULL;
1332
1333 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1334 if (RT_LIKELY(pIoCtx))
1335 {
1336 vdIoCtxInit(pIoCtx, pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1337 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1338 }
1339
1340 return pIoCtx;
1341}
1342
1343DECLINLINE(PVDIOCTX) vdIoCtxRootAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1344 uint64_t uOffset, size_t cbTransfer,
1345 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1346 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1347 void *pvUser1, void *pvUser2,
1348 void *pvAllocation,
1349 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1350 uint32_t fFlags)
1351{
1352 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1353 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1354
1355 if (RT_LIKELY(pIoCtx))
1356 {
1357 pIoCtx->pIoCtxParent = NULL;
1358 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1359 pIoCtx->Type.Root.pvUser1 = pvUser1;
1360 pIoCtx->Type.Root.pvUser2 = pvUser2;
1361 }
1362
1363 LogFlow(("Allocated root I/O context %#p\n", pIoCtx));
1364 return pIoCtx;
1365}
1366
1367DECLINLINE(void) vdIoCtxDiscardInit(PVDIOCTX pIoCtx, PVBOXHDD pDisk, PCRTRANGE paRanges,
1368 unsigned cRanges, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1369 void *pvUser1, void *pvUser2, void *pvAllocation,
1370 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
1371{
1372 pIoCtx->pIoCtxNext = NULL;
1373 pIoCtx->pDisk = pDisk;
1374 pIoCtx->enmTxDir = VDIOCTXTXDIR_DISCARD;
1375 pIoCtx->cDataTransfersPending = 0;
1376 pIoCtx->cMetaTransfersPending = 0;
1377 pIoCtx->fComplete = false;
1378 pIoCtx->fFlags = fFlags;
1379 pIoCtx->pvAllocation = pvAllocation;
1380 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1381 pIoCtx->pfnIoCtxTransferNext = NULL;
1382 pIoCtx->rcReq = VINF_SUCCESS;
1383 pIoCtx->Req.Discard.paRanges = paRanges;
1384 pIoCtx->Req.Discard.cRanges = cRanges;
1385 pIoCtx->Req.Discard.idxRange = 0;
1386 pIoCtx->Req.Discard.cbDiscardLeft = 0;
1387 pIoCtx->Req.Discard.offCur = 0;
1388 pIoCtx->Req.Discard.cbThisDiscard = 0;
1389
1390 pIoCtx->pIoCtxParent = NULL;
1391 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1392 pIoCtx->Type.Root.pvUser1 = pvUser1;
1393 pIoCtx->Type.Root.pvUser2 = pvUser2;
1394}
1395
1396DECLINLINE(PVDIOCTX) vdIoCtxDiscardAlloc(PVBOXHDD pDisk, PCRTRANGE paRanges,
1397 unsigned cRanges,
1398 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1399 void *pvUser1, void *pvUser2,
1400 void *pvAllocation,
1401 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1402 uint32_t fFlags)
1403{
1404 PVDIOCTX pIoCtx = NULL;
1405
1406 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1407 if (RT_LIKELY(pIoCtx))
1408 {
1409 vdIoCtxDiscardInit(pIoCtx, pDisk, paRanges, cRanges, pfnComplete, pvUser1,
1410 pvUser2, pvAllocation, pfnIoCtxTransfer, fFlags);
1411 }
1412
1413 LogFlow(("Allocated discard I/O context %#p\n", pIoCtx));
1414 return pIoCtx;
1415}
1416
1417DECLINLINE(PVDIOCTX) vdIoCtxChildAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1418 uint64_t uOffset, size_t cbTransfer,
1419 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1420 PVDIOCTX pIoCtxParent, size_t cbTransferParent,
1421 size_t cbWriteParent, void *pvAllocation,
1422 PFNVDIOCTXTRANSFER pfnIoCtxTransfer)
1423{
1424 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1425 pcSgBuf, pvAllocation, pfnIoCtxTransfer, pIoCtxParent->fFlags & ~VDIOCTX_FLAGS_DONT_FREE);
1426
1427 AssertPtr(pIoCtxParent);
1428 Assert(!pIoCtxParent->pIoCtxParent);
1429
1430 if (RT_LIKELY(pIoCtx))
1431 {
1432 pIoCtx->pIoCtxParent = pIoCtxParent;
1433 pIoCtx->Type.Child.uOffsetSaved = uOffset;
1434 pIoCtx->Type.Child.cbTransferLeftSaved = cbTransfer;
1435 pIoCtx->Type.Child.cbTransferParent = cbTransferParent;
1436 pIoCtx->Type.Child.cbWriteParent = cbWriteParent;
1437 }
1438
1439 LogFlow(("Allocated child I/O context %#p\n", pIoCtx));
1440 return pIoCtx;
1441}
1442
1443DECLINLINE(PVDIOTASK) vdIoTaskUserAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDIOCTX pIoCtx, uint32_t cbTransfer)
1444{
1445 PVDIOTASK pIoTask = NULL;
1446
1447 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1448 if (pIoTask)
1449 {
1450 pIoTask->pIoStorage = pIoStorage;
1451 pIoTask->pfnComplete = pfnComplete;
1452 pIoTask->pvUser = pvUser;
1453 pIoTask->fMeta = false;
1454 pIoTask->Type.User.cbTransfer = cbTransfer;
1455 pIoTask->Type.User.pIoCtx = pIoCtx;
1456 }
1457
1458 return pIoTask;
1459}
1460
1461DECLINLINE(PVDIOTASK) vdIoTaskMetaAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDMETAXFER pMetaXfer)
1462{
1463 PVDIOTASK pIoTask = NULL;
1464
1465 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1466 if (pIoTask)
1467 {
1468 pIoTask->pIoStorage = pIoStorage;
1469 pIoTask->pfnComplete = pfnComplete;
1470 pIoTask->pvUser = pvUser;
1471 pIoTask->fMeta = true;
1472 pIoTask->Type.Meta.pMetaXfer = pMetaXfer;
1473 }
1474
1475 return pIoTask;
1476}
1477
1478DECLINLINE(void) vdIoCtxFree(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1479{
1480 Log(("Freeing I/O context %#p\n", pIoCtx));
1481
1482 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_FREE))
1483 {
1484 if (pIoCtx->pvAllocation)
1485 RTMemFree(pIoCtx->pvAllocation);
1486#ifdef DEBUG
1487 memset(&pIoCtx->pDisk, 0xff, sizeof(void *));
1488#endif
1489 RTMemCacheFree(pDisk->hMemCacheIoCtx, pIoCtx);
1490 }
1491}
1492
1493DECLINLINE(void) vdIoTaskFree(PVBOXHDD pDisk, PVDIOTASK pIoTask)
1494{
1495#ifdef DEBUG
1496 memset(pIoTask, 0xff, sizeof(VDIOTASK));
1497#endif
1498 RTMemCacheFree(pDisk->hMemCacheIoTask, pIoTask);
1499}
1500
1501DECLINLINE(void) vdIoCtxChildReset(PVDIOCTX pIoCtx)
1502{
1503 AssertPtr(pIoCtx->pIoCtxParent);
1504
1505 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1506 pIoCtx->Req.Io.uOffset = pIoCtx->Type.Child.uOffsetSaved;
1507 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved;
1508 Assert((uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved == pIoCtx->Type.Child.cbTransferLeftSaved);
1509}
1510
1511DECLINLINE(PVDMETAXFER) vdMetaXferAlloc(PVDIOSTORAGE pIoStorage, uint64_t uOffset, size_t cb)
1512{
1513 PVDMETAXFER pMetaXfer = (PVDMETAXFER)RTMemAlloc(RT_OFFSETOF(VDMETAXFER, abData[cb]));
1514
1515 if (RT_LIKELY(pMetaXfer))
1516 {
1517 pMetaXfer->Core.Key = uOffset;
1518 pMetaXfer->Core.KeyLast = uOffset + cb - 1;
1519 pMetaXfer->fFlags = VDMETAXFER_TXDIR_NONE;
1520 pMetaXfer->cbMeta = cb;
1521 pMetaXfer->pIoStorage = pIoStorage;
1522 pMetaXfer->cRefs = 0;
1523 RTListInit(&pMetaXfer->ListIoCtxWaiting);
1524 }
1525 return pMetaXfer;
1526}
1527
1528DECLINLINE(void) vdIoCtxAddToWaitingList(volatile PVDIOCTX *ppList, PVDIOCTX pIoCtx)
1529{
1530 /* Put it on the waiting list. */
1531 PVDIOCTX pNext = ASMAtomicUoReadPtrT(ppList, PVDIOCTX);
1532 PVDIOCTX pHeadOld;
1533 pIoCtx->pIoCtxNext = pNext;
1534 while (!ASMAtomicCmpXchgExPtr(ppList, pIoCtx, pNext, &pHeadOld))
1535 {
1536 pNext = pHeadOld;
1537 Assert(pNext != pIoCtx);
1538 pIoCtx->pIoCtxNext = pNext;
1539 ASMNopPause();
1540 }
1541}
1542
1543DECLINLINE(void) vdIoCtxDefer(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1544{
1545 LogFlowFunc(("Deferring write pIoCtx=%#p\n", pIoCtx));
1546
1547 Assert(!pIoCtx->pIoCtxParent && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED));
1548 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1549 vdIoCtxAddToWaitingList(&pDisk->pIoCtxBlockedHead, pIoCtx);
1550}
1551
1552static size_t vdIoCtxCopy(PVDIOCTX pIoCtxDst, PVDIOCTX pIoCtxSrc, size_t cbData)
1553{
1554 return RTSgBufCopy(&pIoCtxDst->Req.Io.SgBuf, &pIoCtxSrc->Req.Io.SgBuf, cbData);
1555}
1556
1557static int vdIoCtxCmp(PVDIOCTX pIoCtx1, PVDIOCTX pIoCtx2, size_t cbData)
1558{
1559 return RTSgBufCmp(&pIoCtx1->Req.Io.SgBuf, &pIoCtx2->Req.Io.SgBuf, cbData);
1560}
1561
1562static size_t vdIoCtxCopyTo(PVDIOCTX pIoCtx, const uint8_t *pbData, size_t cbData)
1563{
1564 return RTSgBufCopyFromBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1565}
1566
1567static size_t vdIoCtxCopyFrom(PVDIOCTX pIoCtx, uint8_t *pbData, size_t cbData)
1568{
1569 return RTSgBufCopyToBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1570}
1571
1572static size_t vdIoCtxSet(PVDIOCTX pIoCtx, uint8_t ch, size_t cbData)
1573{
1574 return RTSgBufSet(&pIoCtx->Req.Io.SgBuf, ch, cbData);
1575}
1576
1577/**
1578 * Process the I/O context, core method which assumes that the I/O context
1579 * acquired the lock.
1580 *
1581 * @returns VBox status code.
1582 * @param pIoCtx I/O context to process.
1583 */
1584static int vdIoCtxProcessLocked(PVDIOCTX pIoCtx)
1585{
1586 int rc = VINF_SUCCESS;
1587
1588 VD_IS_LOCKED(pIoCtx->pDisk);
1589
1590 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
1591
1592 if ( !pIoCtx->cMetaTransfersPending
1593 && !pIoCtx->cDataTransfersPending
1594 && !pIoCtx->pfnIoCtxTransfer)
1595 {
1596 rc = VINF_VD_ASYNC_IO_FINISHED;
1597 goto out;
1598 }
1599
1600 /*
1601 * We complete the I/O context in case of an error
1602 * if there is no I/O task pending.
1603 */
1604 if ( RT_FAILURE(pIoCtx->rcReq)
1605 && !pIoCtx->cMetaTransfersPending
1606 && !pIoCtx->cDataTransfersPending)
1607 {
1608 rc = VINF_VD_ASYNC_IO_FINISHED;
1609 goto out;
1610 }
1611
1612 /* Don't change anything if there is a metadata transfer pending or we are blocked. */
1613 if ( pIoCtx->cMetaTransfersPending
1614 || (pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1615 {
1616 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1617 goto out;
1618 }
1619
1620 if (pIoCtx->pfnIoCtxTransfer)
1621 {
1622 /* Call the transfer function advancing to the next while there is no error. */
1623 while ( pIoCtx->pfnIoCtxTransfer
1624 && !pIoCtx->cMetaTransfersPending
1625 && RT_SUCCESS(rc))
1626 {
1627 LogFlowFunc(("calling transfer function %#p\n", pIoCtx->pfnIoCtxTransfer));
1628 rc = pIoCtx->pfnIoCtxTransfer(pIoCtx);
1629
1630 /* Advance to the next part of the transfer if the current one succeeded. */
1631 if (RT_SUCCESS(rc))
1632 {
1633 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
1634 pIoCtx->pfnIoCtxTransferNext = NULL;
1635 }
1636 }
1637 }
1638
1639 if ( RT_SUCCESS(rc)
1640 && !pIoCtx->cMetaTransfersPending
1641 && !pIoCtx->cDataTransfersPending)
1642 rc = VINF_VD_ASYNC_IO_FINISHED;
1643 else if ( RT_SUCCESS(rc)
1644 || rc == VERR_VD_NOT_ENOUGH_METADATA
1645 || rc == VERR_VD_IOCTX_HALT)
1646 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1647 else if ( RT_FAILURE(rc)
1648 && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
1649 {
1650 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rc, VINF_SUCCESS);
1651
1652 /*
1653 * The I/O context completed if we have an error and there is no data
1654 * or meta data transfer pending.
1655 */
1656 if ( !pIoCtx->cMetaTransfersPending
1657 && !pIoCtx->cDataTransfersPending)
1658 rc = VINF_VD_ASYNC_IO_FINISHED;
1659 else
1660 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1661 }
1662
1663out:
1664 LogFlowFunc(("pIoCtx=%#p rc=%Rrc cDataTransfersPending=%u cMetaTransfersPending=%u fComplete=%RTbool\n",
1665 pIoCtx, rc, pIoCtx->cDataTransfersPending, pIoCtx->cMetaTransfersPending,
1666 pIoCtx->fComplete));
1667
1668 return rc;
1669}
1670
1671/**
1672 * Processes the list of waiting I/O contexts.
1673 *
1674 * @returns VBox status code, only valid if pIoCtxRc is not NULL, treat as void
1675 * function otherwise.
1676 * @param pDisk The disk structure.
1677 * @param pIoCtxRc An I/O context handle which waits on the list. When processed
1678 * The status code is returned. NULL if there is no I/O context
1679 * to return the status code for.
1680 */
1681static int vdDiskProcessWaitingIoCtx(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
1682{
1683 int rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1684
1685 LogFlowFunc(("pDisk=%#p pIoCtxRc=%#p\n", pDisk, pIoCtxRc));
1686
1687 VD_IS_LOCKED(pDisk);
1688
1689 /* Get the waiting list and process it in FIFO order. */
1690 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHead, NULL, PVDIOCTX);
1691
1692 /* Reverse it. */
1693 PVDIOCTX pCur = pIoCtxHead;
1694 pIoCtxHead = NULL;
1695 while (pCur)
1696 {
1697 PVDIOCTX pInsert = pCur;
1698 pCur = pCur->pIoCtxNext;
1699 pInsert->pIoCtxNext = pIoCtxHead;
1700 pIoCtxHead = pInsert;
1701 }
1702
1703 /* Process now. */
1704 pCur = pIoCtxHead;
1705 while (pCur)
1706 {
1707 int rcTmp;
1708 PVDIOCTX pTmp = pCur;
1709
1710 pCur = pCur->pIoCtxNext;
1711 pTmp->pIoCtxNext = NULL;
1712
1713 /*
1714 * Need to clear the sync flag here if there is a new I/O context
1715 * with it set and the context is not given in pIoCtxRc.
1716 * This happens most likely on a different thread and that one shouldn't
1717 * process the context synchronously.
1718 *
1719 * The thread who issued the context will wait on the event semaphore
1720 * anyway which is signalled when the completion handler is called.
1721 */
1722 if ( pTmp->fFlags & VDIOCTX_FLAGS_SYNC
1723 && pTmp != pIoCtxRc)
1724 pTmp->fFlags &= ~VDIOCTX_FLAGS_SYNC;
1725
1726 rcTmp = vdIoCtxProcessLocked(pTmp);
1727 if (pTmp == pIoCtxRc)
1728 {
1729 /* The given I/O context was processed, pass the return code to the caller. */
1730 if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1731 && (pTmp->fFlags & VDIOCTX_FLAGS_SYNC))
1732 rc = pTmp->rcReq;
1733 else
1734 rc = rcTmp;
1735 }
1736 else if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1737 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1738 {
1739 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1740 vdThreadFinishWrite(pDisk);
1741 vdIoCtxRootComplete(pDisk, pTmp);
1742 vdIoCtxFree(pDisk, pTmp);
1743 }
1744 }
1745
1746 LogFlowFunc(("returns rc=%Rrc\n", rc));
1747 return rc;
1748}
1749
1750/**
1751 * Processes the list of blocked I/O contexts.
1752 *
1753 * @returns nothing.
1754 * @param pDisk The disk structure.
1755 */
1756static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk)
1757{
1758 LogFlowFunc(("pDisk=%#p\n", pDisk));
1759
1760 VD_IS_LOCKED(pDisk);
1761
1762 /* Get the waiting list and process it in FIFO order. */
1763 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxBlockedHead, NULL, PVDIOCTX);
1764
1765 /* Reverse it. */
1766 PVDIOCTX pCur = pIoCtxHead;
1767 pIoCtxHead = NULL;
1768 while (pCur)
1769 {
1770 PVDIOCTX pInsert = pCur;
1771 pCur = pCur->pIoCtxNext;
1772 pInsert->pIoCtxNext = pIoCtxHead;
1773 pIoCtxHead = pInsert;
1774 }
1775
1776 /* Process now. */
1777 pCur = pIoCtxHead;
1778 while (pCur)
1779 {
1780 int rc;
1781 PVDIOCTX pTmp = pCur;
1782
1783 pCur = pCur->pIoCtxNext;
1784 pTmp->pIoCtxNext = NULL;
1785
1786 Assert(!pTmp->pIoCtxParent);
1787 Assert(pTmp->fFlags & VDIOCTX_FLAGS_BLOCKED);
1788 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
1789
1790 rc = vdIoCtxProcessLocked(pTmp);
1791 if ( rc == VINF_VD_ASYNC_IO_FINISHED
1792 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1793 {
1794 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1795 vdThreadFinishWrite(pDisk);
1796 vdIoCtxRootComplete(pDisk, pTmp);
1797 vdIoCtxFree(pDisk, pTmp);
1798 }
1799 }
1800
1801 LogFlowFunc(("returns\n"));
1802}
1803
1804/**
1805 * Processes the I/O context trying to lock the criticial section.
1806 * The context is deferred if the critical section is busy.
1807 *
1808 * @returns VBox status code.
1809 * @param pIoCtx The I/O context to process.
1810 */
1811static int vdIoCtxProcessTryLockDefer(PVDIOCTX pIoCtx)
1812{
1813 int rc = VINF_SUCCESS;
1814 PVBOXHDD pDisk = pIoCtx->pDisk;
1815
1816 Log(("Defer pIoCtx=%#p\n", pIoCtx));
1817
1818 /* Put it on the waiting list first. */
1819 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHead, pIoCtx);
1820
1821 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
1822 {
1823 /* Leave it again, the context will be processed just before leaving the lock. */
1824 LogFlowFunc(("Successfully acquired the lock\n"));
1825 rc = vdDiskUnlock(pDisk, pIoCtx);
1826 }
1827 else
1828 {
1829 LogFlowFunc(("Lock is held\n"));
1830 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1831 }
1832
1833 return rc;
1834}
1835
1836/**
1837 * Process the I/O context in a synchronous manner, waiting
1838 * for it to complete.
1839 *
1840 * @returns VBox status code of the completed request.
1841 * @param pIoCtx The sync I/O context.
1842 * @param hEventComplete Event sempahore to wait on for completion.
1843 */
1844static int vdIoCtxProcessSync(PVDIOCTX pIoCtx, RTSEMEVENT hEventComplete)
1845{
1846 int rc = VINF_SUCCESS;
1847 PVBOXHDD pDisk = pIoCtx->pDisk;
1848
1849 LogFlowFunc(("pIoCtx=%p\n", pIoCtx));
1850
1851 AssertMsg(pIoCtx->fFlags & (VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE),
1852 ("I/O context is not marked as synchronous\n"));
1853
1854 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
1855 if (rc == VINF_VD_ASYNC_IO_FINISHED)
1856 rc = VINF_SUCCESS;
1857
1858 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1859 {
1860 rc = RTSemEventWait(hEventComplete, RT_INDEFINITE_WAIT);
1861 AssertRC(rc);
1862 }
1863
1864 rc = pIoCtx->rcReq;
1865 vdIoCtxFree(pDisk, pIoCtx);
1866
1867 return rc;
1868}
1869
1870DECLINLINE(bool) vdIoCtxIsDiskLockOwner(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1871{
1872 return pDisk->pIoCtxLockOwner == pIoCtx;
1873}
1874
1875static int vdIoCtxLockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1876{
1877 int rc = VINF_SUCCESS;
1878
1879 VD_IS_LOCKED(pDisk);
1880
1881 LogFlowFunc(("pDisk=%#p pIoCtx=%#p\n", pDisk, pIoCtx));
1882
1883 if (!ASMAtomicCmpXchgPtr(&pDisk->pIoCtxLockOwner, pIoCtx, NIL_VDIOCTX))
1884 {
1885 Assert(pDisk->pIoCtxLockOwner != pIoCtx); /* No nesting allowed. */
1886 vdIoCtxDefer(pDisk, pIoCtx);
1887 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1888 }
1889
1890 LogFlowFunc(("returns -> %Rrc\n", rc));
1891 return rc;
1892}
1893
1894static void vdIoCtxUnlockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx, bool fProcessBlockedReqs)
1895{
1896 LogFlowFunc(("pDisk=%#p pIoCtx=%#p fProcessBlockedReqs=%RTbool\n",
1897 pDisk, pIoCtx, fProcessBlockedReqs));
1898
1899 VD_IS_LOCKED(pDisk);
1900
1901 LogFlow(("Unlocking disk lock owner is %#p\n", pDisk->pIoCtxLockOwner));
1902 Assert(pDisk->pIoCtxLockOwner == pIoCtx);
1903 ASMAtomicXchgPtrT(&pDisk->pIoCtxLockOwner, NIL_VDIOCTX, PVDIOCTX);
1904
1905 if (fProcessBlockedReqs)
1906 {
1907 /* Process any blocked writes if the current request didn't caused another growing. */
1908 vdDiskProcessBlockedIoCtx(pDisk);
1909 }
1910
1911 LogFlowFunc(("returns\n"));
1912}
1913
1914/**
1915 * Internal: Reads a given amount of data from the image chain of the disk.
1916 **/
1917static int vdDiskReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1918 uint64_t uOffset, size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbThisRead)
1919{
1920 int rc = VINF_SUCCESS;
1921 size_t cbThisRead = cbRead;
1922
1923 AssertPtr(pcbThisRead);
1924
1925 *pcbThisRead = 0;
1926
1927 /*
1928 * Try to read from the given image.
1929 * If the block is not allocated read from override chain if present.
1930 */
1931 rc = pImage->Backend->pfnRead(pImage->pBackendData,
1932 uOffset, cbThisRead, pIoCtx,
1933 &cbThisRead);
1934
1935 if (rc == VERR_VD_BLOCK_FREE)
1936 {
1937 for (PVDIMAGE pCurrImage = pImageParentOverride ? pImageParentOverride : pImage->pPrev;
1938 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
1939 pCurrImage = pCurrImage->pPrev)
1940 {
1941 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1942 uOffset, cbThisRead, pIoCtx,
1943 &cbThisRead);
1944 }
1945 }
1946
1947 if (RT_SUCCESS(rc) || rc == VERR_VD_BLOCK_FREE)
1948 *pcbThisRead = cbThisRead;
1949
1950 return rc;
1951}
1952
1953/**
1954 * internal: read the specified amount of data in whatever blocks the backend
1955 * will give us - async version.
1956 */
1957static int vdReadHelperAsync(PVDIOCTX pIoCtx)
1958{
1959 int rc;
1960 PVBOXHDD pDisk = pIoCtx->pDisk;
1961 size_t cbToRead = pIoCtx->Req.Io.cbTransfer;
1962 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
1963 PVDIMAGE pCurrImage = pIoCtx->Req.Io.pImageCur;
1964 PVDIMAGE pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
1965 unsigned cImagesRead = pIoCtx->Req.Io.cImagesRead;
1966 size_t cbThisRead;
1967
1968 /* Loop until all reads started or we have a backend which needs to read metadata. */
1969 do
1970 {
1971 /* Search for image with allocated block. Do not attempt to read more
1972 * than the previous reads marked as valid. Otherwise this would return
1973 * stale data when different block sizes are used for the images. */
1974 cbThisRead = cbToRead;
1975
1976 if ( pDisk->pCache
1977 && !pImageParentOverride)
1978 {
1979 rc = vdCacheReadHelper(pDisk->pCache, uOffset, cbThisRead,
1980 pIoCtx, &cbThisRead);
1981 if (rc == VERR_VD_BLOCK_FREE)
1982 {
1983 rc = vdDiskReadHelper(pDisk, pCurrImage, NULL, uOffset, cbThisRead,
1984 pIoCtx, &cbThisRead);
1985
1986 /* If the read was successful, write the data back into the cache. */
1987 if ( RT_SUCCESS(rc)
1988 && pIoCtx->fFlags & VDIOCTX_FLAGS_READ_UPDATE_CACHE)
1989 {
1990 rc = vdCacheWriteHelper(pDisk->pCache, uOffset, cbThisRead,
1991 pIoCtx, NULL);
1992 }
1993 }
1994 }
1995 else
1996 {
1997
1998 /*
1999 * Try to read from the given image.
2000 * If the block is not allocated read from override chain if present.
2001 */
2002 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2003 uOffset, cbThisRead, pIoCtx,
2004 &cbThisRead);
2005
2006 if ( rc == VERR_VD_BLOCK_FREE
2007 && cImagesRead != 1)
2008 {
2009 unsigned cImagesToProcess = cImagesRead;
2010
2011 pCurrImage = pImageParentOverride ? pImageParentOverride : pCurrImage->pPrev;
2012 pIoCtx->Req.Io.pImageParentOverride = NULL;
2013
2014 while (pCurrImage && rc == VERR_VD_BLOCK_FREE)
2015 {
2016 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2017 uOffset, cbThisRead,
2018 pIoCtx, &cbThisRead);
2019 if (cImagesToProcess == 1)
2020 break;
2021 else if (cImagesToProcess > 0)
2022 cImagesToProcess--;
2023
2024 if (rc == VERR_VD_BLOCK_FREE)
2025 pCurrImage = pCurrImage->pPrev;
2026 }
2027 }
2028 }
2029
2030 /* The task state will be updated on success already, don't do it here!. */
2031 if (rc == VERR_VD_BLOCK_FREE)
2032 {
2033 /* No image in the chain contains the data for the block. */
2034 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisRead); Assert(cbThisRead == (uint32_t)cbThisRead);
2035
2036 /* Fill the free space with 0 if we are told to do so
2037 * or a previous read returned valid data. */
2038 if (pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS)
2039 vdIoCtxSet(pIoCtx, '\0', cbThisRead);
2040 else
2041 pIoCtx->Req.Io.cbBufClear += cbThisRead;
2042
2043 if (pIoCtx->Req.Io.pImageCur->uOpenFlags & VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS)
2044 rc = VINF_VD_NEW_ZEROED_BLOCK;
2045 else
2046 rc = VINF_SUCCESS;
2047 }
2048 else if (rc == VERR_VD_IOCTX_HALT)
2049 {
2050 uOffset += cbThisRead;
2051 cbToRead -= cbThisRead;
2052 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2053 }
2054 else if ( RT_SUCCESS(rc)
2055 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2056 {
2057 /* First not free block, fill the space before with 0. */
2058 if ( pIoCtx->Req.Io.cbBufClear
2059 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
2060 {
2061 RTSGBUF SgBuf;
2062 RTSgBufClone(&SgBuf, &pIoCtx->Req.Io.SgBuf);
2063 RTSgBufReset(&SgBuf);
2064 RTSgBufSet(&SgBuf, 0, pIoCtx->Req.Io.cbBufClear);
2065 pIoCtx->Req.Io.cbBufClear = 0;
2066 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2067 }
2068 rc = VINF_SUCCESS;
2069 }
2070
2071 if (RT_FAILURE(rc))
2072 break;
2073
2074 cbToRead -= cbThisRead;
2075 uOffset += cbThisRead;
2076 pCurrImage = pIoCtx->Req.Io.pImageStart; /* Start with the highest image in the chain. */
2077 } while (cbToRead != 0 && RT_SUCCESS(rc));
2078
2079 if ( rc == VERR_VD_NOT_ENOUGH_METADATA
2080 || rc == VERR_VD_IOCTX_HALT)
2081 {
2082 /* Save the current state. */
2083 pIoCtx->Req.Io.uOffset = uOffset;
2084 pIoCtx->Req.Io.cbTransfer = cbToRead;
2085 pIoCtx->Req.Io.pImageCur = pCurrImage ? pCurrImage : pIoCtx->Req.Io.pImageStart;
2086 }
2087
2088 return (!(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
2089 ? VERR_VD_BLOCK_FREE
2090 : rc;
2091}
2092
2093/**
2094 * internal: parent image read wrapper for compacting.
2095 */
2096static int vdParentRead(void *pvUser, uint64_t uOffset, void *pvBuf,
2097 size_t cbRead)
2098{
2099 PVDPARENTSTATEDESC pParentState = (PVDPARENTSTATEDESC)pvUser;
2100
2101 /** @todo
2102 * Only used for compaction so far which is not possible to mix with async I/O.
2103 * Needs to be changed if we want to support online compaction of images.
2104 */
2105 bool fLocked = ASMAtomicXchgBool(&pParentState->pDisk->fLocked, true);
2106 AssertMsgReturn(!fLocked,
2107 ("Calling synchronous parent read while another thread holds the disk lock\n"),
2108 VERR_VD_INVALID_STATE);
2109
2110 /* Fake an I/O context. */
2111 RTSGSEG Segment;
2112 RTSGBUF SgBuf;
2113 VDIOCTX IoCtx;
2114
2115 Segment.pvSeg = pvBuf;
2116 Segment.cbSeg = cbRead;
2117 RTSgBufInit(&SgBuf, &Segment, 1);
2118 vdIoCtxInit(&IoCtx, pParentState->pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pParentState->pImage,
2119 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
2120 int rc = vdReadHelperAsync(&IoCtx);
2121 ASMAtomicXchgBool(&pParentState->pDisk->fLocked, false);
2122 return rc;
2123}
2124
2125/**
2126 * Extended version of vdReadHelper(), implementing certain optimizations
2127 * for image cloning.
2128 *
2129 * @returns VBox status code.
2130 * @param pDisk The disk to read from.
2131 * @param pImage The image to start reading from.
2132 * @param pImageParentOverride The parent image to read from
2133 * if the starting image returns a free block.
2134 * If NULL is passed the real parent of the image
2135 * in the chain is used.
2136 * @param uOffset Offset in the disk to start reading from.
2137 * @param pvBuf Where to store the read data.
2138 * @param cbRead How much to read.
2139 * @param fZeroFreeBlocks Flag whether free blocks should be zeroed.
2140 * If false and no image has data for sepcified
2141 * range VERR_VD_BLOCK_FREE is returned.
2142 * Note that unallocated blocks are still zeroed
2143 * if at least one image has valid data for a part
2144 * of the range.
2145 * @param fUpdateCache Flag whether to update the attached cache if
2146 * available.
2147 * @param cImagesRead Number of images in the chain to read until
2148 * the read is cut off. A value of 0 disables the cut off.
2149 */
2150static int vdReadHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
2151 uint64_t uOffset, void *pvBuf, size_t cbRead,
2152 bool fZeroFreeBlocks, bool fUpdateCache, unsigned cImagesRead)
2153{
2154 int rc = VINF_SUCCESS;
2155 uint32_t fFlags = VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2156 RTSGSEG Segment;
2157 RTSGBUF SgBuf;
2158 VDIOCTX IoCtx;
2159 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
2160
2161 rc = RTSemEventCreate(&hEventComplete);
2162 if (RT_FAILURE(rc))
2163 return rc;
2164
2165 if (fZeroFreeBlocks)
2166 fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2167 if (fUpdateCache)
2168 fFlags |= VDIOCTX_FLAGS_READ_UPDATE_CACHE;
2169
2170 Segment.pvSeg = pvBuf;
2171 Segment.cbSeg = cbRead;
2172 RTSgBufInit(&SgBuf, &Segment, 1);
2173 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pImage, &SgBuf,
2174 NULL, vdReadHelperAsync, fFlags);
2175
2176 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2177 IoCtx.Req.Io.cImagesRead = cImagesRead;
2178 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2179 IoCtx.Type.Root.pvUser1 = pDisk;
2180 IoCtx.Type.Root.pvUser2 = hEventComplete;
2181 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
2182 if (RT_SUCCESS(rc))
2183 rc = vdFilterChainApplyRead(pDisk, uOffset, cbRead, &IoCtx);
2184
2185 RTSemEventDestroy(hEventComplete);
2186 return rc;
2187}
2188
2189/**
2190 * internal: read the specified amount of data in whatever blocks the backend
2191 * will give us.
2192 */
2193static int vdReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
2194 void *pvBuf, size_t cbRead, bool fUpdateCache)
2195{
2196 return vdReadHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbRead,
2197 true /* fZeroFreeBlocks */, fUpdateCache, 0);
2198}
2199
2200/**
2201 * internal: mark the disk as not modified.
2202 */
2203static void vdResetModifiedFlag(PVBOXHDD pDisk)
2204{
2205 if (pDisk->uModified & VD_IMAGE_MODIFIED_FLAG)
2206 {
2207 /* generate new last-modified uuid */
2208 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2209 {
2210 RTUUID Uuid;
2211
2212 RTUuidCreate(&Uuid);
2213 pDisk->pLast->Backend->pfnSetModificationUuid(pDisk->pLast->pBackendData,
2214 &Uuid);
2215
2216 if (pDisk->pCache)
2217 pDisk->pCache->Backend->pfnSetModificationUuid(pDisk->pCache->pBackendData,
2218 &Uuid);
2219 }
2220
2221 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FLAG;
2222 }
2223}
2224
2225/**
2226 * internal: mark the disk as modified.
2227 */
2228static void vdSetModifiedFlag(PVBOXHDD pDisk)
2229{
2230 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2231 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2232 {
2233 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2234
2235 /* First modify, so create a UUID and ensure it's written to disk. */
2236 vdResetModifiedFlag(pDisk);
2237
2238 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2239 {
2240 VDIOCTX IoCtx;
2241 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, NULL,
2242 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2243 pDisk->pLast->Backend->pfnFlush(pDisk->pLast->pBackendData, &IoCtx);
2244 }
2245 }
2246}
2247
2248/**
2249 * internal: write buffer to the image, taking care of block boundaries and
2250 * write optimizations.
2251 */
2252static int vdWriteHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage,
2253 PVDIMAGE pImageParentOverride, uint64_t uOffset,
2254 const void *pvBuf, size_t cbWrite,
2255 uint32_t fFlags, unsigned cImagesRead)
2256{
2257 int rc = VINF_SUCCESS;
2258 RTSGSEG Segment;
2259 RTSGBUF SgBuf;
2260 VDIOCTX IoCtx;
2261 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
2262
2263 rc = RTSemEventCreate(&hEventComplete);
2264 if (RT_FAILURE(rc))
2265 return rc;
2266
2267 fFlags |= VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2268
2269 Segment.pvSeg = (void *)pvBuf;
2270 Segment.cbSeg = cbWrite;
2271 RTSgBufInit(&SgBuf, &Segment, 1);
2272 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_WRITE, uOffset, cbWrite, pImage, &SgBuf,
2273 NULL, vdWriteHelperAsync, fFlags);
2274
2275 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2276 IoCtx.Req.Io.cImagesRead = cImagesRead;
2277 IoCtx.pIoCtxParent = NULL;
2278 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2279 IoCtx.Type.Root.pvUser1 = pDisk;
2280 IoCtx.Type.Root.pvUser2 = hEventComplete;
2281 /* Apply write filter chain here. */
2282 rc = vdFilterChainApplyWrite(pDisk, uOffset, cbWrite, &IoCtx);
2283 if (RT_SUCCESS(rc))
2284 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
2285
2286 RTSemEventDestroy(hEventComplete);
2287 return rc;
2288}
2289
2290/**
2291 * internal: write buffer to the image, taking care of block boundaries and
2292 * write optimizations.
2293 */
2294static int vdWriteHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
2295 const void *pvBuf, size_t cbWrite, uint32_t fFlags)
2296{
2297 return vdWriteHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbWrite,
2298 fFlags, 0);
2299}
2300
2301/**
2302 * Internal: Copies the content of one disk to another one applying optimizations
2303 * to speed up the copy process if possible.
2304 */
2305static int vdCopyHelper(PVBOXHDD pDiskFrom, PVDIMAGE pImageFrom, PVBOXHDD pDiskTo,
2306 uint64_t cbSize, unsigned cImagesFromRead, unsigned cImagesToRead,
2307 bool fSuppressRedundantIo, PVDINTERFACEPROGRESS pIfProgress,
2308 PVDINTERFACEPROGRESS pDstIfProgress)
2309{
2310 int rc = VINF_SUCCESS;
2311 int rc2;
2312 uint64_t uOffset = 0;
2313 uint64_t cbRemaining = cbSize;
2314 void *pvBuf = NULL;
2315 bool fLockReadFrom = false;
2316 bool fLockWriteTo = false;
2317 bool fBlockwiseCopy = fSuppressRedundantIo || (cImagesFromRead > 0);
2318 unsigned uProgressOld = 0;
2319
2320 LogFlowFunc(("pDiskFrom=%#p pImageFrom=%#p pDiskTo=%#p cbSize=%llu cImagesFromRead=%u cImagesToRead=%u fSuppressRedundantIo=%RTbool pIfProgress=%#p pDstIfProgress=%#p\n",
2321 pDiskFrom, pImageFrom, pDiskTo, cbSize, cImagesFromRead, cImagesToRead, fSuppressRedundantIo, pDstIfProgress, pDstIfProgress));
2322
2323 /* Allocate tmp buffer. */
2324 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
2325 if (!pvBuf)
2326 return rc;
2327
2328 do
2329 {
2330 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
2331
2332 /* Note that we don't attempt to synchronize cross-disk accesses.
2333 * It wouldn't be very difficult to do, just the lock order would
2334 * need to be defined somehow to prevent deadlocks. Postpone such
2335 * magic as there is no use case for this. */
2336
2337 rc2 = vdThreadStartRead(pDiskFrom);
2338 AssertRC(rc2);
2339 fLockReadFrom = true;
2340
2341 if (fBlockwiseCopy)
2342 {
2343 RTSGSEG SegmentBuf;
2344 RTSGBUF SgBuf;
2345 VDIOCTX IoCtx;
2346
2347 SegmentBuf.pvSeg = pvBuf;
2348 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
2349 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
2350 vdIoCtxInit(&IoCtx, pDiskFrom, VDIOCTXTXDIR_READ, 0, 0, NULL,
2351 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2352
2353 /* Read the source data. */
2354 rc = pImageFrom->Backend->pfnRead(pImageFrom->pBackendData,
2355 uOffset, cbThisRead, &IoCtx,
2356 &cbThisRead);
2357
2358 if ( rc == VERR_VD_BLOCK_FREE
2359 && cImagesFromRead != 1)
2360 {
2361 unsigned cImagesToProcess = cImagesFromRead;
2362
2363 for (PVDIMAGE pCurrImage = pImageFrom->pPrev;
2364 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
2365 pCurrImage = pCurrImage->pPrev)
2366 {
2367 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2368 uOffset, cbThisRead,
2369 &IoCtx, &cbThisRead);
2370 if (cImagesToProcess == 1)
2371 break;
2372 else if (cImagesToProcess > 0)
2373 cImagesToProcess--;
2374 }
2375 }
2376 }
2377 else
2378 rc = vdReadHelper(pDiskFrom, pImageFrom, uOffset, pvBuf, cbThisRead,
2379 false /* fUpdateCache */);
2380
2381 if (RT_FAILURE(rc) && rc != VERR_VD_BLOCK_FREE)
2382 break;
2383
2384 rc2 = vdThreadFinishRead(pDiskFrom);
2385 AssertRC(rc2);
2386 fLockReadFrom = false;
2387
2388 if (rc != VERR_VD_BLOCK_FREE)
2389 {
2390 rc2 = vdThreadStartWrite(pDiskTo);
2391 AssertRC(rc2);
2392 fLockWriteTo = true;
2393
2394 /* Only do collapsed I/O if we are copying the data blockwise. */
2395 rc = vdWriteHelperEx(pDiskTo, pDiskTo->pLast, NULL, uOffset, pvBuf,
2396 cbThisRead, VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG /* fFlags */,
2397 fBlockwiseCopy ? cImagesToRead : 0);
2398 if (RT_FAILURE(rc))
2399 break;
2400
2401 rc2 = vdThreadFinishWrite(pDiskTo);
2402 AssertRC(rc2);
2403 fLockWriteTo = false;
2404 }
2405 else /* Don't propagate the error to the outside */
2406 rc = VINF_SUCCESS;
2407
2408 uOffset += cbThisRead;
2409 cbRemaining -= cbThisRead;
2410
2411 unsigned uProgressNew = uOffset * 99 / cbSize;
2412 if (uProgressNew != uProgressOld)
2413 {
2414 uProgressOld = uProgressNew;
2415
2416 if (pIfProgress && pIfProgress->pfnProgress)
2417 {
2418 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
2419 uProgressOld);
2420 if (RT_FAILURE(rc))
2421 break;
2422 }
2423 if (pDstIfProgress && pDstIfProgress->pfnProgress)
2424 {
2425 rc = pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser,
2426 uProgressOld);
2427 if (RT_FAILURE(rc))
2428 break;
2429 }
2430 }
2431 } while (uOffset < cbSize);
2432
2433 RTMemFree(pvBuf);
2434
2435 if (fLockReadFrom)
2436 {
2437 rc2 = vdThreadFinishRead(pDiskFrom);
2438 AssertRC(rc2);
2439 }
2440
2441 if (fLockWriteTo)
2442 {
2443 rc2 = vdThreadFinishWrite(pDiskTo);
2444 AssertRC(rc2);
2445 }
2446
2447 LogFlowFunc(("returns rc=%Rrc\n", rc));
2448 return rc;
2449}
2450
2451/**
2452 * Flush helper async version.
2453 */
2454static int vdSetModifiedHelperAsync(PVDIOCTX pIoCtx)
2455{
2456 int rc = VINF_SUCCESS;
2457 PVBOXHDD pDisk = pIoCtx->pDisk;
2458 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2459
2460 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2461 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2462 rc = VINF_SUCCESS;
2463
2464 return rc;
2465}
2466
2467/**
2468 * internal: mark the disk as modified - async version.
2469 */
2470static int vdSetModifiedFlagAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
2471{
2472 int rc = VINF_SUCCESS;
2473
2474 VD_IS_LOCKED(pDisk);
2475
2476 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2477 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2478 {
2479 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2480 if (RT_SUCCESS(rc))
2481 {
2482 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2483
2484 /* First modify, so create a UUID and ensure it's written to disk. */
2485 vdResetModifiedFlag(pDisk);
2486
2487 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2488 {
2489 PVDIOCTX pIoCtxFlush = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_FLUSH,
2490 0, 0, pDisk->pLast,
2491 NULL, pIoCtx, 0, 0, NULL,
2492 vdSetModifiedHelperAsync);
2493
2494 if (pIoCtxFlush)
2495 {
2496 rc = vdIoCtxProcessLocked(pIoCtxFlush);
2497 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2498 {
2499 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs */);
2500 vdIoCtxFree(pDisk, pIoCtxFlush);
2501 }
2502 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2503 {
2504 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2505 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2506 }
2507 else /* Another error */
2508 vdIoCtxFree(pDisk, pIoCtxFlush);
2509 }
2510 else
2511 rc = VERR_NO_MEMORY;
2512 }
2513 }
2514 }
2515
2516 return rc;
2517}
2518
2519static int vdWriteHelperCommitAsync(PVDIOCTX pIoCtx)
2520{
2521 int rc = VINF_SUCCESS;
2522 PVDIMAGE pImage = pIoCtx->Req.Io.pImageStart;
2523 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2524 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2525 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2526
2527 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2528 rc = pImage->Backend->pfnWrite(pImage->pBackendData,
2529 pIoCtx->Req.Io.uOffset - cbPreRead,
2530 cbPreRead + cbThisWrite + cbPostRead,
2531 pIoCtx, NULL, &cbPreRead, &cbPostRead, 0);
2532 Assert(rc != VERR_VD_BLOCK_FREE);
2533 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPreRead == 0);
2534 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPostRead == 0);
2535 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2536 rc = VINF_SUCCESS;
2537 else if (rc == VERR_VD_IOCTX_HALT)
2538 {
2539 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2540 rc = VINF_SUCCESS;
2541 }
2542
2543 LogFlowFunc(("returns rc=%Rrc\n", rc));
2544 return rc;
2545}
2546
2547static int vdWriteHelperOptimizedCmpAndWriteAsync(PVDIOCTX pIoCtx)
2548{
2549 int rc = VINF_SUCCESS;
2550 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2551 size_t cbThisWrite = 0;
2552 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2553 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2554 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2555 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2556 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2557 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2558
2559 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2560
2561 AssertPtr(pIoCtxParent);
2562 Assert(!pIoCtxParent->pIoCtxParent);
2563 Assert(!pIoCtx->Req.Io.cbTransferLeft && !pIoCtx->cMetaTransfersPending);
2564
2565 vdIoCtxChildReset(pIoCtx);
2566 cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2567 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2568
2569 /* Check if the write would modify anything in this block. */
2570 if (!RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &pIoCtxParent->Req.Io.SgBuf, cbThisWrite))
2571 {
2572 RTSGBUF SgBufSrcTmp;
2573
2574 RTSgBufClone(&SgBufSrcTmp, &pIoCtxParent->Req.Io.SgBuf);
2575 RTSgBufAdvance(&SgBufSrcTmp, cbThisWrite);
2576 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbThisWrite);
2577
2578 if (!cbWriteCopy || !RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &SgBufSrcTmp, cbWriteCopy))
2579 {
2580 /* Block is completely unchanged, so no need to write anything. */
2581 LogFlowFunc(("Block didn't changed\n"));
2582 ASMAtomicWriteU32(&pIoCtx->Req.Io.cbTransferLeft, 0);
2583 RTSgBufAdvance(&pIoCtxParent->Req.Io.SgBuf, cbThisWrite);
2584 return VINF_VD_ASYNC_IO_FINISHED;
2585 }
2586 }
2587
2588 /* Copy the data to the right place in the buffer. */
2589 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2590 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2591 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2592
2593 /* Handle the data that goes after the write to fill the block. */
2594 if (cbPostRead)
2595 {
2596 /* Now assemble the remaining data. */
2597 if (cbWriteCopy)
2598 {
2599 /*
2600 * The S/G buffer of the parent needs to be cloned because
2601 * it is not allowed to modify the state.
2602 */
2603 RTSGBUF SgBufParentTmp;
2604
2605 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2606 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2607 }
2608
2609 /* Zero out the remainder of this block. Will never be visible, as this
2610 * is beyond the limit of the image. */
2611 if (cbFill)
2612 {
2613 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbReadImage);
2614 vdIoCtxSet(pIoCtx, '\0', cbFill);
2615 }
2616 }
2617
2618 /* Write the full block to the virtual disk. */
2619 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2620 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2621
2622 return rc;
2623}
2624
2625static int vdWriteHelperOptimizedPreReadAsync(PVDIOCTX pIoCtx)
2626{
2627 int rc = VINF_SUCCESS;
2628
2629 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2630
2631 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2632
2633 if ( pIoCtx->Req.Io.cbTransferLeft
2634 && !pIoCtx->cDataTransfersPending)
2635 rc = vdReadHelperAsync(pIoCtx);
2636
2637 if ( RT_SUCCESS(rc)
2638 && ( pIoCtx->Req.Io.cbTransferLeft
2639 || pIoCtx->cMetaTransfersPending))
2640 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2641 else
2642 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedCmpAndWriteAsync;
2643
2644 return rc;
2645}
2646
2647/**
2648 * internal: write a complete block (only used for diff images), taking the
2649 * remaining data from parent images. This implementation optimizes out writes
2650 * that do not change the data relative to the state as of the parent images.
2651 * All backends which support differential/growing images support this - async version.
2652 */
2653static int vdWriteHelperOptimizedAsync(PVDIOCTX pIoCtx)
2654{
2655 PVBOXHDD pDisk = pIoCtx->pDisk;
2656 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2657 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2658 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2659 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2660 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2661 size_t cbFill = 0;
2662 size_t cbWriteCopy = 0;
2663 size_t cbReadImage = 0;
2664
2665 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2666
2667 AssertPtr(pIoCtx->pIoCtxParent);
2668 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2669
2670 if (cbPostRead)
2671 {
2672 /* Figure out how much we cannot read from the image, because
2673 * the last block to write might exceed the nominal size of the
2674 * image for technical reasons. */
2675 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2676 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2677
2678 /* If we have data to be written, use that instead of reading
2679 * data from the image. */
2680 if (cbWrite > cbThisWrite)
2681 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2682
2683 /* The rest must be read from the image. */
2684 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2685 }
2686
2687 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2688 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2689 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2690
2691 /* Read the entire data of the block so that we can compare whether it will
2692 * be modified by the write or not. */
2693 size_t cbTmp = cbPreRead + cbThisWrite + cbPostRead - cbFill; Assert(cbTmp == (uint32_t)cbTmp);
2694 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTmp;
2695 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2696 pIoCtx->Req.Io.uOffset -= cbPreRead;
2697
2698 /* Next step */
2699 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedPreReadAsync;
2700 return VINF_SUCCESS;
2701}
2702
2703static int vdWriteHelperStandardReadImageAsync(PVDIOCTX pIoCtx)
2704{
2705 int rc = VINF_SUCCESS;
2706
2707 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2708
2709 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2710
2711 if ( pIoCtx->Req.Io.cbTransferLeft
2712 && !pIoCtx->cDataTransfersPending)
2713 rc = vdReadHelperAsync(pIoCtx);
2714
2715 if ( RT_SUCCESS(rc)
2716 && ( pIoCtx->Req.Io.cbTransferLeft
2717 || pIoCtx->cMetaTransfersPending))
2718 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2719 else
2720 {
2721 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2722
2723 /* Zero out the remainder of this block. Will never be visible, as this
2724 * is beyond the limit of the image. */
2725 if (cbFill)
2726 vdIoCtxSet(pIoCtx, '\0', cbFill);
2727
2728 /* Write the full block to the virtual disk. */
2729 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2730
2731 vdIoCtxChildReset(pIoCtx);
2732 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2733 }
2734
2735 return rc;
2736}
2737
2738static int vdWriteHelperStandardAssemble(PVDIOCTX pIoCtx)
2739{
2740 int rc = VINF_SUCCESS;
2741 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2742 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2743 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2744
2745 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2746
2747 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2748 if (cbPostRead)
2749 {
2750 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2751 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2752 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2753
2754 /* Now assemble the remaining data. */
2755 if (cbWriteCopy)
2756 {
2757 /*
2758 * The S/G buffer of the parent needs to be cloned because
2759 * it is not allowed to modify the state.
2760 */
2761 RTSGBUF SgBufParentTmp;
2762
2763 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2764 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2765 }
2766
2767 if (cbReadImage)
2768 {
2769 /* Read remaining data. */
2770 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardReadImageAsync;
2771
2772 /* Read the data that goes before the write to fill the block. */
2773 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbReadImage; Assert(cbReadImage == (uint32_t)cbReadImage);
2774 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2775 pIoCtx->Req.Io.uOffset += cbWriteCopy;
2776 }
2777 else
2778 {
2779 /* Zero out the remainder of this block. Will never be visible, as this
2780 * is beyond the limit of the image. */
2781 if (cbFill)
2782 vdIoCtxSet(pIoCtx, '\0', cbFill);
2783
2784 /* Write the full block to the virtual disk. */
2785 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2786 vdIoCtxChildReset(pIoCtx);
2787 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2788 }
2789 }
2790 else
2791 {
2792 /* Write the full block to the virtual disk. */
2793 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2794 vdIoCtxChildReset(pIoCtx);
2795 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2796 }
2797
2798 return rc;
2799}
2800
2801static int vdWriteHelperStandardPreReadAsync(PVDIOCTX pIoCtx)
2802{
2803 int rc = VINF_SUCCESS;
2804
2805 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2806
2807 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2808
2809 if ( pIoCtx->Req.Io.cbTransferLeft
2810 && !pIoCtx->cDataTransfersPending)
2811 rc = vdReadHelperAsync(pIoCtx);
2812
2813 if ( RT_SUCCESS(rc)
2814 && ( pIoCtx->Req.Io.cbTransferLeft
2815 || pIoCtx->cMetaTransfersPending))
2816 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2817 else
2818 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2819
2820 return rc;
2821}
2822
2823static int vdWriteHelperStandardAsync(PVDIOCTX pIoCtx)
2824{
2825 PVBOXHDD pDisk = pIoCtx->pDisk;
2826 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2827 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2828 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2829 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2830 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2831 size_t cbFill = 0;
2832 size_t cbWriteCopy = 0;
2833 size_t cbReadImage = 0;
2834
2835 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2836
2837 AssertPtr(pIoCtx->pIoCtxParent);
2838 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2839
2840 /* Calculate the amount of data to read that goes after the write to fill the block. */
2841 if (cbPostRead)
2842 {
2843 /* If we have data to be written, use that instead of reading
2844 * data from the image. */
2845 if (cbWrite > cbThisWrite)
2846 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2847 else
2848 cbWriteCopy = 0;
2849
2850 /* Figure out how much we cannot read from the image, because
2851 * the last block to write might exceed the nominal size of the
2852 * image for technical reasons. */
2853 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2854 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2855
2856 /* The rest must be read from the image. */
2857 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2858 }
2859
2860 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2861 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2862 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2863
2864 /* Next step */
2865 if (cbPreRead)
2866 {
2867 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardPreReadAsync;
2868
2869 /* Read the data that goes before the write to fill the block. */
2870 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbPreRead; Assert(cbPreRead == (uint32_t)cbPreRead);
2871 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2872 pIoCtx->Req.Io.uOffset -= cbPreRead;
2873 }
2874 else
2875 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2876
2877 return VINF_SUCCESS;
2878}
2879
2880/**
2881 * internal: write buffer to the image, taking care of block boundaries and
2882 * write optimizations - async version.
2883 */
2884static int vdWriteHelperAsync(PVDIOCTX pIoCtx)
2885{
2886 int rc;
2887 size_t cbWrite = pIoCtx->Req.Io.cbTransfer;
2888 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
2889 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2890 PVBOXHDD pDisk = pIoCtx->pDisk;
2891 unsigned fWrite;
2892 size_t cbThisWrite;
2893 size_t cbPreRead, cbPostRead;
2894
2895 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG))
2896 {
2897 rc = vdSetModifiedFlagAsync(pDisk, pIoCtx);
2898 if (RT_FAILURE(rc)) /* Includes I/O in progress. */
2899 return rc;
2900 }
2901
2902 rc = vdDiscardSetRangeAllocated(pDisk, uOffset, cbWrite);
2903 if (RT_FAILURE(rc))
2904 return rc;
2905
2906 /* Loop until all written. */
2907 do
2908 {
2909 /* Try to write the possibly partial block to the last opened image.
2910 * This works when the block is already allocated in this image or
2911 * if it is a full-block write (and allocation isn't suppressed below).
2912 * For image formats which don't support zero blocks, it's beneficial
2913 * to avoid unnecessarily allocating unchanged blocks. This prevents
2914 * unwanted expanding of images. VMDK is an example. */
2915 cbThisWrite = cbWrite;
2916 fWrite = (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2917 ? 0 : VD_WRITE_NO_ALLOC;
2918 rc = pImage->Backend->pfnWrite(pImage->pBackendData, uOffset,
2919 cbThisWrite, pIoCtx,
2920 &cbThisWrite, &cbPreRead,
2921 &cbPostRead, fWrite);
2922 if (rc == VERR_VD_BLOCK_FREE)
2923 {
2924 /* Lock the disk .*/
2925 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2926 if (RT_SUCCESS(rc))
2927 {
2928 /*
2929 * Allocate segment and buffer in one go.
2930 * A bit hackish but avoids the need to allocate memory twice.
2931 */
2932 PRTSGBUF pTmp = (PRTSGBUF)RTMemAlloc(cbPreRead + cbThisWrite + cbPostRead + sizeof(RTSGSEG) + sizeof(RTSGBUF));
2933 AssertBreakStmt(VALID_PTR(pTmp), rc = VERR_NO_MEMORY);
2934 PRTSGSEG pSeg = (PRTSGSEG)(pTmp + 1);
2935
2936 pSeg->pvSeg = pSeg + 1;
2937 pSeg->cbSeg = cbPreRead + cbThisWrite + cbPostRead;
2938 RTSgBufInit(pTmp, pSeg, 1);
2939
2940 PVDIOCTX pIoCtxWrite = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_WRITE,
2941 uOffset, pSeg->cbSeg, pImage,
2942 pTmp,
2943 pIoCtx, cbThisWrite,
2944 cbWrite,
2945 pTmp,
2946 (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2947 ? vdWriteHelperStandardAsync
2948 : vdWriteHelperOptimizedAsync);
2949 if (!VALID_PTR(pIoCtxWrite))
2950 {
2951 RTMemTmpFree(pTmp);
2952 rc = VERR_NO_MEMORY;
2953 break;
2954 }
2955
2956 LogFlowFunc(("Disk is growing because of pIoCtx=%#p pIoCtxWrite=%#p\n",
2957 pIoCtx, pIoCtxWrite));
2958
2959 pIoCtxWrite->Type.Child.cbPreRead = cbPreRead;
2960 pIoCtxWrite->Type.Child.cbPostRead = cbPostRead;
2961 pIoCtxWrite->Req.Io.pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
2962
2963 /* Process the write request */
2964 rc = vdIoCtxProcessLocked(pIoCtxWrite);
2965
2966 if (RT_FAILURE(rc) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
2967 {
2968 vdIoCtxFree(pDisk, pIoCtxWrite);
2969 break;
2970 }
2971 else if ( rc == VINF_VD_ASYNC_IO_FINISHED
2972 && ASMAtomicCmpXchgBool(&pIoCtxWrite->fComplete, true, false))
2973 {
2974 LogFlow(("Child write request completed\n"));
2975 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbThisWrite);
2976 Assert(cbThisWrite == (uint32_t)cbThisWrite);
2977 rc = pIoCtxWrite->rcReq;
2978 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisWrite);
2979 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs*/ );
2980 vdIoCtxFree(pDisk, pIoCtxWrite);
2981 }
2982 else
2983 {
2984 LogFlow(("Child write pending\n"));
2985 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2986 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2987 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2988 cbWrite -= cbThisWrite;
2989 uOffset += cbThisWrite;
2990 break;
2991 }
2992 }
2993 else
2994 {
2995 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2996 break;
2997 }
2998 }
2999
3000 if (rc == VERR_VD_IOCTX_HALT)
3001 {
3002 cbWrite -= cbThisWrite;
3003 uOffset += cbThisWrite;
3004 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
3005 break;
3006 }
3007 else if (rc == VERR_VD_NOT_ENOUGH_METADATA)
3008 break;
3009
3010 cbWrite -= cbThisWrite;
3011 uOffset += cbThisWrite;
3012 } while (cbWrite != 0 && (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
3013
3014 if ( rc == VERR_VD_ASYNC_IO_IN_PROGRESS
3015 || rc == VERR_VD_NOT_ENOUGH_METADATA
3016 || rc == VERR_VD_IOCTX_HALT)
3017 {
3018 /*
3019 * Tell the caller that we don't need to go back here because all
3020 * writes are initiated.
3021 */
3022 if ( !cbWrite
3023 && rc != VERR_VD_IOCTX_HALT)
3024 rc = VINF_SUCCESS;
3025
3026 pIoCtx->Req.Io.uOffset = uOffset;
3027 pIoCtx->Req.Io.cbTransfer = cbWrite;
3028 }
3029
3030 return rc;
3031}
3032
3033/**
3034 * Flush helper async version.
3035 */
3036static int vdFlushHelperAsync(PVDIOCTX pIoCtx)
3037{
3038 int rc = VINF_SUCCESS;
3039 PVBOXHDD pDisk = pIoCtx->pDisk;
3040 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
3041
3042 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3043 if (RT_SUCCESS(rc))
3044 {
3045 vdResetModifiedFlag(pDisk);
3046 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
3047 if ( ( RT_SUCCESS(rc)
3048 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS
3049 || rc == VERR_VD_IOCTX_HALT)
3050 && pDisk->pCache)
3051 {
3052 rc = pDisk->pCache->Backend->pfnFlush(pDisk->pCache->pBackendData, pIoCtx);
3053 if ( RT_SUCCESS(rc)
3054 || ( rc != VERR_VD_ASYNC_IO_IN_PROGRESS
3055 && rc != VERR_VD_IOCTX_HALT))
3056 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
3057 else if (rc != VERR_VD_IOCTX_HALT)
3058 rc = VINF_SUCCESS;
3059 }
3060 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3061 rc = VINF_SUCCESS;
3062 else if (rc != VERR_VD_IOCTX_HALT)/* Some other error. */
3063 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
3064 }
3065
3066 return rc;
3067}
3068
3069/**
3070 * Async discard helper - discards a whole block which is recorded in the block
3071 * tree.
3072 *
3073 * @returns VBox status code.
3074 * @param pIoCtx The I/O context to operate on.
3075 */
3076static int vdDiscardWholeBlockAsync(PVDIOCTX pIoCtx)
3077{
3078 int rc = VINF_SUCCESS;
3079 PVBOXHDD pDisk = pIoCtx->pDisk;
3080 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3081 PVDDISCARDBLOCK pBlock = pIoCtx->Req.Discard.pBlock;
3082 size_t cbPreAllocated, cbPostAllocated, cbActuallyDiscarded;
3083
3084 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3085
3086 AssertPtr(pBlock);
3087
3088 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3089 pBlock->Core.Key, pBlock->cbDiscard,
3090 &cbPreAllocated, &cbPostAllocated,
3091 &cbActuallyDiscarded, NULL, 0);
3092 Assert(rc != VERR_VD_DISCARD_ALIGNMENT_NOT_MET);
3093 Assert(!cbPreAllocated);
3094 Assert(!cbPostAllocated);
3095 Assert(cbActuallyDiscarded == pBlock->cbDiscard || RT_FAILURE(rc));
3096
3097 /* Remove the block on success. */
3098 if ( RT_SUCCESS(rc)
3099 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3100 {
3101 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
3102 Assert(pBlockRemove == pBlock);
3103
3104 pDiscard->cbDiscarding -= pBlock->cbDiscard;
3105 RTListNodeRemove(&pBlock->NodeLru);
3106 RTMemFree(pBlock->pbmAllocated);
3107 RTMemFree(pBlock);
3108 pIoCtx->Req.Discard.pBlock = NULL;/* Safety precaution. */
3109 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
3110 rc = VINF_SUCCESS;
3111 }
3112
3113 LogFlowFunc(("returns rc=%Rrc\n", rc));
3114 return rc;
3115}
3116
3117/**
3118 * Removes the least recently used blocks from the waiting list until
3119 * the new value is reached - version for async I/O.
3120 *
3121 * @returns VBox status code.
3122 * @param pDisk VD disk container.
3123 * @param pDiscard The discard state.
3124 * @param cbDiscardingNew How many bytes should be waiting on success.
3125 * The number of bytes waiting can be less.
3126 */
3127static int vdDiscardRemoveBlocksAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx, size_t cbDiscardingNew)
3128{
3129 int rc = VINF_SUCCESS;
3130 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3131
3132 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
3133 pDisk, pDiscard, cbDiscardingNew));
3134
3135 while (pDiscard->cbDiscarding > cbDiscardingNew)
3136 {
3137 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
3138
3139 Assert(!RTListIsEmpty(&pDiscard->ListLru));
3140
3141 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
3142 uint64_t offStart = pBlock->Core.Key;
3143 uint32_t idxStart = 0;
3144 size_t cbLeft = pBlock->cbDiscard;
3145 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
3146 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
3147
3148 while (cbLeft > 0)
3149 {
3150 int32_t idxEnd;
3151 size_t cbThis = cbLeft;
3152
3153 if (fAllocated)
3154 {
3155 /* Check for the first unallocated bit. */
3156 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
3157 if (idxEnd != -1)
3158 {
3159 cbThis = (idxEnd - idxStart) * 512;
3160 fAllocated = false;
3161 }
3162 }
3163 else
3164 {
3165 /* Mark as unused and check for the first set bit. */
3166 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
3167 if (idxEnd != -1)
3168 cbThis = (idxEnd - idxStart) * 512;
3169
3170 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3171 offStart, cbThis, NULL, NULL, &cbThis,
3172 NULL, VD_DISCARD_MARK_UNUSED);
3173 if ( RT_FAILURE(rc)
3174 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
3175 break;
3176
3177 fAllocated = true;
3178 }
3179
3180 idxStart = idxEnd;
3181 offStart += cbThis;
3182 cbLeft -= cbThis;
3183 }
3184
3185 if ( RT_FAILURE(rc)
3186 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
3187 break;
3188
3189 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
3190 Assert(pBlockRemove == pBlock);
3191 RTListNodeRemove(&pBlock->NodeLru);
3192
3193 pDiscard->cbDiscarding -= pBlock->cbDiscard;
3194 RTMemFree(pBlock->pbmAllocated);
3195 RTMemFree(pBlock);
3196 }
3197
3198 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3199 rc = VINF_SUCCESS;
3200
3201 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
3202
3203 LogFlowFunc(("returns rc=%Rrc\n", rc));
3204 return rc;
3205}
3206
3207/**
3208 * Async discard helper - discards the current range if there is no matching
3209 * block in the tree.
3210 *
3211 * @returns VBox status code.
3212 * @param pIoCtx The I/O context to operate on.
3213 */
3214static int vdDiscardCurrentRangeAsync(PVDIOCTX pIoCtx)
3215{
3216 PVBOXHDD pDisk = pIoCtx->pDisk;
3217 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3218 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3219 size_t cbThisDiscard = pIoCtx->Req.Discard.cbThisDiscard;
3220 void *pbmAllocated = NULL;
3221 size_t cbPreAllocated, cbPostAllocated;
3222 int rc = VINF_SUCCESS;
3223
3224 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3225
3226 /* No block found, try to discard using the backend first. */
3227 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3228 offStart, cbThisDiscard, &cbPreAllocated,
3229 &cbPostAllocated, &cbThisDiscard,
3230 &pbmAllocated, 0);
3231 if (rc == VERR_VD_DISCARD_ALIGNMENT_NOT_MET)
3232 {
3233 /* Create new discard block. */
3234 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTMemAllocZ(sizeof(VDDISCARDBLOCK));
3235 if (pBlock)
3236 {
3237 pBlock->Core.Key = offStart - cbPreAllocated;
3238 pBlock->Core.KeyLast = offStart + cbThisDiscard + cbPostAllocated - 1;
3239 pBlock->cbDiscard = cbPreAllocated + cbThisDiscard + cbPostAllocated;
3240 pBlock->pbmAllocated = pbmAllocated;
3241 bool fInserted = RTAvlrU64Insert(pDiscard->pTreeBlocks, &pBlock->Core);
3242 Assert(fInserted);
3243
3244 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3245 pDiscard->cbDiscarding += pBlock->cbDiscard;
3246
3247 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3248 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3249 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3250 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3251
3252 if (pDiscard->cbDiscarding > VD_DISCARD_REMOVE_THRESHOLD)
3253 rc = vdDiscardRemoveBlocksAsync(pDisk, pIoCtx, VD_DISCARD_REMOVE_THRESHOLD);
3254 else
3255 rc = VINF_SUCCESS;
3256
3257 if (RT_SUCCESS(rc))
3258 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
3259 }
3260 else
3261 {
3262 RTMemFree(pbmAllocated);
3263 rc = VERR_NO_MEMORY;
3264 }
3265 }
3266 else if ( RT_SUCCESS(rc)
3267 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS) /* Save state and andvance to next range. */
3268 {
3269 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3270 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3271 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3272 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3273 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3274 rc = VINF_SUCCESS;
3275 }
3276
3277 LogFlowFunc(("returns rc=%Rrc\n", rc));
3278 return rc;
3279}
3280
3281/**
3282 * Async discard helper - entry point.
3283 *
3284 * @returns VBox status code.
3285 * @param pIoCtx The I/O context to operate on.
3286 */
3287static int vdDiscardHelperAsync(PVDIOCTX pIoCtx)
3288{
3289 int rc = VINF_SUCCESS;
3290 PVBOXHDD pDisk = pIoCtx->pDisk;
3291 PCRTRANGE paRanges = pIoCtx->Req.Discard.paRanges;
3292 unsigned cRanges = pIoCtx->Req.Discard.cRanges;
3293 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3294
3295 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3296
3297 /* Check if the I/O context processed all ranges. */
3298 if ( pIoCtx->Req.Discard.idxRange == cRanges
3299 && !pIoCtx->Req.Discard.cbDiscardLeft)
3300 {
3301 LogFlowFunc(("All ranges discarded, completing\n"));
3302 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDeferredReqs*/);
3303 return VINF_SUCCESS;
3304 }
3305
3306 if (pDisk->pIoCtxLockOwner != pIoCtx)
3307 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3308
3309 if (RT_SUCCESS(rc))
3310 {
3311 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3312 size_t cbDiscardLeft = pIoCtx->Req.Discard.cbDiscardLeft;
3313 size_t cbThisDiscard;
3314
3315 if (RT_UNLIKELY(!pDiscard))
3316 {
3317 pDiscard = vdDiscardStateCreate();
3318 if (!pDiscard)
3319 return VERR_NO_MEMORY;
3320
3321 pDisk->pDiscard = pDiscard;
3322 }
3323
3324 if (!pIoCtx->Req.Discard.cbDiscardLeft)
3325 {
3326 offStart = paRanges[pIoCtx->Req.Discard.idxRange].offStart;
3327 cbDiscardLeft = paRanges[pIoCtx->Req.Discard.idxRange].cbRange;
3328 LogFlowFunc(("New range descriptor loaded (%u) offStart=%llu cbDiscard=%zu\n",
3329 pIoCtx->Req.Discard.idxRange, offStart, cbDiscardLeft));
3330 pIoCtx->Req.Discard.idxRange++;
3331 }
3332
3333 /* Look for a matching block in the AVL tree first. */
3334 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, false);
3335 if (!pBlock || pBlock->Core.KeyLast < offStart)
3336 {
3337 PVDDISCARDBLOCK pBlockAbove = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, true);
3338
3339 /* Clip range to remain in the current block. */
3340 if (pBlockAbove)
3341 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlockAbove->Core.KeyLast - offStart + 1);
3342 else
3343 cbThisDiscard = cbDiscardLeft;
3344
3345 Assert(!(cbThisDiscard % 512));
3346 pIoCtx->Req.Discard.pBlock = NULL;
3347 pIoCtx->pfnIoCtxTransferNext = vdDiscardCurrentRangeAsync;
3348 }
3349 else
3350 {
3351 /* Range lies partly in the block, update allocation bitmap. */
3352 int32_t idxStart, idxEnd;
3353
3354 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlock->Core.KeyLast - offStart + 1);
3355
3356 AssertPtr(pBlock);
3357
3358 Assert(!(cbThisDiscard % 512));
3359 Assert(!((offStart - pBlock->Core.Key) % 512));
3360
3361 idxStart = (offStart - pBlock->Core.Key) / 512;
3362 idxEnd = idxStart + (int32_t)(cbThisDiscard / 512);
3363
3364 ASMBitClearRange(pBlock->pbmAllocated, idxStart, idxEnd);
3365
3366 cbDiscardLeft -= cbThisDiscard;
3367 offStart += cbThisDiscard;
3368
3369 /* Call the backend to discard the block if it is completely unallocated now. */
3370 if (ASMBitFirstSet((volatile void *)pBlock->pbmAllocated, (uint32_t)(pBlock->cbDiscard / 512)) == -1)
3371 {
3372 pIoCtx->Req.Discard.pBlock = pBlock;
3373 pIoCtx->pfnIoCtxTransferNext = vdDiscardWholeBlockAsync;
3374 rc = VINF_SUCCESS;
3375 }
3376 else
3377 {
3378 RTListNodeRemove(&pBlock->NodeLru);
3379 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3380
3381 /* Start with next range. */
3382 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3383 rc = VINF_SUCCESS;
3384 }
3385 }
3386
3387 /* Save state in the context. */
3388 pIoCtx->Req.Discard.offCur = offStart;
3389 pIoCtx->Req.Discard.cbDiscardLeft = cbDiscardLeft;
3390 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3391 }
3392
3393 LogFlowFunc(("returns rc=%Rrc\n", rc));
3394 return rc;
3395}
3396
3397#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3398/**
3399 * @copydoc VDPLUGIN::pfnRegisterImage
3400 */
3401static DECLCALLBACK(int) vdPluginRegisterImage(void *pvUser, PCVBOXHDDBACKEND pBackend)
3402{
3403 int rc = VINF_SUCCESS;
3404
3405 if (pBackend->cbSize == sizeof(VBOXHDDBACKEND))
3406 vdAddBackend(pBackend);
3407 else
3408 {
3409 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3410 rc = VERR_IGNORED;
3411 }
3412
3413 return rc;
3414}
3415
3416/**
3417 * @copydoc VDPLUGIN::pfnRegisterCache
3418 */
3419static DECLCALLBACK(int) vdPluginRegisterCache(void *pvUser, PCVDCACHEBACKEND pBackend)
3420{
3421 int rc = VINF_SUCCESS;
3422
3423 if (pBackend->cbSize == sizeof(VDCACHEBACKEND))
3424 vdAddCacheBackend(pBackend);
3425 else
3426 {
3427 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3428 rc = VERR_IGNORED;
3429 }
3430
3431 return rc;
3432}
3433
3434/**
3435 * @copydoc VDPLUGIN::pfnRegisterFilter
3436 */
3437static DECLCALLBACK(int) vdPluginRegisterFilter(void *pvUser, PCVDFILTERBACKEND pBackend)
3438{
3439 int rc = VINF_SUCCESS;
3440
3441 if (pBackend->cbSize == sizeof(VDFILTERBACKEND))
3442 vdAddFilterBackend(pBackend);
3443 else
3444 {
3445 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3446 rc = VERR_IGNORED;
3447 }
3448
3449 return rc;
3450}
3451
3452/**
3453 * Adds a plugin to the list of loaded plugins.
3454 *
3455 * @returns VBox status code.
3456 * @param hPlugin PLugin handle to add.
3457 */
3458static int vdAddPlugin(RTLDRMOD hPlugin)
3459{
3460 int rc = VINF_SUCCESS;
3461 PVDPLUGIN pPlugin = (PVDPLUGIN)RTMemAllocZ(sizeof(VDPLUGIN));
3462
3463 if (pPlugin)
3464 {
3465 pPlugin->hPlugin = hPlugin;
3466 RTListAppend(&g_ListPluginsLoaded, &pPlugin->NodePlugin);
3467 }
3468 else
3469 rc = VERR_NO_MEMORY;
3470
3471 return rc;
3472}
3473#endif
3474
3475/**
3476 * internal: scans plugin directory and loads found plugins.
3477 */
3478static int vdLoadDynamicBackends()
3479{
3480#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3481 int rc = VINF_SUCCESS;
3482 PRTDIR pPluginDir = NULL;
3483
3484 /* Enumerate plugin backends. */
3485 char szPath[RTPATH_MAX];
3486 rc = RTPathAppPrivateArch(szPath, sizeof(szPath));
3487 if (RT_FAILURE(rc))
3488 return rc;
3489
3490 /* To get all entries with VBoxHDD as prefix. */
3491 char *pszPluginFilter = RTPathJoinA(szPath, VD_PLUGIN_PREFIX "*");
3492 if (!pszPluginFilter)
3493 return VERR_NO_STR_MEMORY;
3494
3495 PRTDIRENTRYEX pPluginDirEntry = NULL;
3496 size_t cbPluginDirEntry = sizeof(RTDIRENTRYEX);
3497 /* The plugins are in the same directory as the other shared libs. */
3498 rc = RTDirOpenFiltered(&pPluginDir, pszPluginFilter, RTDIRFILTER_WINNT, 0);
3499 if (RT_FAILURE(rc))
3500 {
3501 /* On Windows the above immediately signals that there are no
3502 * files matching, while on other platforms enumerating the
3503 * files below fails. Either way: no plugins. */
3504 goto out;
3505 }
3506
3507 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(sizeof(RTDIRENTRYEX));
3508 if (!pPluginDirEntry)
3509 {
3510 rc = VERR_NO_MEMORY;
3511 goto out;
3512 }
3513
3514 while ((rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK)) != VERR_NO_MORE_FILES)
3515 {
3516 RTLDRMOD hPlugin = NIL_RTLDRMOD;
3517 char *pszPluginPath = NULL;
3518
3519 if (rc == VERR_BUFFER_OVERFLOW)
3520 {
3521 /* allocate new buffer. */
3522 RTMemFree(pPluginDirEntry);
3523 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(cbPluginDirEntry);
3524 if (!pPluginDirEntry)
3525 {
3526 rc = VERR_NO_MEMORY;
3527 break;
3528 }
3529 /* Retry. */
3530 rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK);
3531 if (RT_FAILURE(rc))
3532 break;
3533 }
3534 else if (RT_FAILURE(rc))
3535 break;
3536
3537 /* We got the new entry. */
3538 if (!RTFS_IS_FILE(pPluginDirEntry->Info.Attr.fMode))
3539 continue;
3540
3541 /* Prepend the path to the libraries. */
3542 pszPluginPath = RTPathJoinA(szPath, pPluginDirEntry->szName);
3543 if (!pszPluginPath)
3544 {
3545 rc = VERR_NO_STR_MEMORY;
3546 break;
3547 }
3548
3549 rc = SUPR3HardenedLdrLoadPlugIn(pszPluginPath, &hPlugin, NULL);
3550 if (RT_SUCCESS(rc))
3551 {
3552 VDBACKENDREGISTER BackendRegister;
3553 PFNVDPLUGINLOAD pfnVDPluginLoad = NULL;
3554
3555 BackendRegister.pfnRegisterImage = vdPluginRegisterImage;
3556 BackendRegister.pfnRegisterCache = vdPluginRegisterCache;
3557 BackendRegister.pfnRegisterFilter = vdPluginRegisterFilter;
3558
3559 rc = RTLdrGetSymbol(hPlugin, VD_PLUGIN_LOAD_NAME, (void**)&pfnVDPluginLoad);
3560 if (RT_FAILURE(rc) || !pfnVDPluginLoad)
3561 {
3562 LogFunc(("error resolving the entry point %s in plugin %s, rc=%Rrc, pfnVDPluginLoad=%#p\n",
3563 VD_PLUGIN_LOAD_NAME, pPluginDirEntry->szName, rc, pfnVDPluginLoad));
3564 if (RT_SUCCESS(rc))
3565 rc = VERR_SYMBOL_NOT_FOUND;
3566 }
3567
3568 if (RT_SUCCESS(rc))
3569 {
3570 /* Get the function table. */
3571 rc = pfnVDPluginLoad(NULL, &BackendRegister);
3572 }
3573 else
3574 LogFunc(("ignored plugin '%s': rc=%Rrc\n", pszPluginPath, rc));
3575
3576 /* Create a plugin entry on success. */
3577 if (RT_SUCCESS(rc))
3578 vdAddPlugin(hPlugin);
3579 else
3580 RTLdrClose(hPlugin);
3581 }
3582 RTStrFree(pszPluginPath);
3583 }
3584out:
3585 if (rc == VERR_NO_MORE_FILES)
3586 rc = VINF_SUCCESS;
3587 RTStrFree(pszPluginFilter);
3588 if (pPluginDirEntry)
3589 RTMemFree(pPluginDirEntry);
3590 if (pPluginDir)
3591 RTDirClose(pPluginDir);
3592 return rc;
3593#else
3594 return VINF_SUCCESS;
3595#endif
3596}
3597
3598/**
3599 * VD async I/O interface open callback.
3600 */
3601static int vdIOOpenFallback(void *pvUser, const char *pszLocation,
3602 uint32_t fOpen, PFNVDCOMPLETED pfnCompleted,
3603 void **ppStorage)
3604{
3605 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)RTMemAllocZ(sizeof(VDIIOFALLBACKSTORAGE));
3606
3607 if (!pStorage)
3608 return VERR_NO_MEMORY;
3609
3610 pStorage->pfnCompleted = pfnCompleted;
3611
3612 /* Open the file. */
3613 int rc = RTFileOpen(&pStorage->File, pszLocation, fOpen);
3614 if (RT_SUCCESS(rc))
3615 {
3616 *ppStorage = pStorage;
3617 return VINF_SUCCESS;
3618 }
3619
3620 RTMemFree(pStorage);
3621 return rc;
3622}
3623
3624/**
3625 * VD async I/O interface close callback.
3626 */
3627static int vdIOCloseFallback(void *pvUser, void *pvStorage)
3628{
3629 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3630
3631 RTFileClose(pStorage->File);
3632 RTMemFree(pStorage);
3633 return VINF_SUCCESS;
3634}
3635
3636static int vdIODeleteFallback(void *pvUser, const char *pcszFilename)
3637{
3638 return RTFileDelete(pcszFilename);
3639}
3640
3641static int vdIOMoveFallback(void *pvUser, const char *pcszSrc, const char *pcszDst, unsigned fMove)
3642{
3643 return RTFileMove(pcszSrc, pcszDst, fMove);
3644}
3645
3646static int vdIOGetFreeSpaceFallback(void *pvUser, const char *pcszFilename, int64_t *pcbFreeSpace)
3647{
3648 return RTFsQuerySizes(pcszFilename, NULL, pcbFreeSpace, NULL, NULL);
3649}
3650
3651static int vdIOGetModificationTimeFallback(void *pvUser, const char *pcszFilename, PRTTIMESPEC pModificationTime)
3652{
3653 RTFSOBJINFO info;
3654 int rc = RTPathQueryInfo(pcszFilename, &info, RTFSOBJATTRADD_NOTHING);
3655 if (RT_SUCCESS(rc))
3656 *pModificationTime = info.ModificationTime;
3657 return rc;
3658}
3659
3660/**
3661 * VD async I/O interface callback for retrieving the file size.
3662 */
3663static int vdIOGetSizeFallback(void *pvUser, void *pvStorage, uint64_t *pcbSize)
3664{
3665 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3666
3667 return RTFileGetSize(pStorage->File, pcbSize);
3668}
3669
3670/**
3671 * VD async I/O interface callback for setting the file size.
3672 */
3673static int vdIOSetSizeFallback(void *pvUser, void *pvStorage, uint64_t cbSize)
3674{
3675 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3676
3677 return RTFileSetSize(pStorage->File, cbSize);
3678}
3679
3680/**
3681 * VD async I/O interface callback for a synchronous write to the file.
3682 */
3683static int vdIOWriteSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3684 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
3685{
3686 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3687
3688 return RTFileWriteAt(pStorage->File, uOffset, pvBuf, cbWrite, pcbWritten);
3689}
3690
3691/**
3692 * VD async I/O interface callback for a synchronous read from the file.
3693 */
3694static int vdIOReadSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3695 void *pvBuf, size_t cbRead, size_t *pcbRead)
3696{
3697 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3698
3699 return RTFileReadAt(pStorage->File, uOffset, pvBuf, cbRead, pcbRead);
3700}
3701
3702/**
3703 * VD async I/O interface callback for a synchronous flush of the file data.
3704 */
3705static int vdIOFlushSyncFallback(void *pvUser, void *pvStorage)
3706{
3707 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3708
3709 return RTFileFlush(pStorage->File);
3710}
3711
3712/**
3713 * VD async I/O interface callback for a asynchronous read from the file.
3714 */
3715static int vdIOReadAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3716 PCRTSGSEG paSegments, size_t cSegments,
3717 size_t cbRead, void *pvCompletion,
3718 void **ppTask)
3719{
3720 return VERR_NOT_IMPLEMENTED;
3721}
3722
3723/**
3724 * VD async I/O interface callback for a asynchronous write to the file.
3725 */
3726static int vdIOWriteAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3727 PCRTSGSEG paSegments, size_t cSegments,
3728 size_t cbWrite, void *pvCompletion,
3729 void **ppTask)
3730{
3731 return VERR_NOT_IMPLEMENTED;
3732}
3733
3734/**
3735 * VD async I/O interface callback for a asynchronous flush of the file data.
3736 */
3737static int vdIOFlushAsyncFallback(void *pvUser, void *pStorage,
3738 void *pvCompletion, void **ppTask)
3739{
3740 return VERR_NOT_IMPLEMENTED;
3741}
3742
3743/**
3744 * Internal - Continues an I/O context after
3745 * it was halted because of an active transfer.
3746 */
3747static int vdIoCtxContinue(PVDIOCTX pIoCtx, int rcReq)
3748{
3749 PVBOXHDD pDisk = pIoCtx->pDisk;
3750 int rc = VINF_SUCCESS;
3751
3752 VD_IS_LOCKED(pDisk);
3753
3754 if (RT_FAILURE(rcReq))
3755 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
3756
3757 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
3758 {
3759 /* Continue the transfer */
3760 rc = vdIoCtxProcessLocked(pIoCtx);
3761
3762 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3763 && ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
3764 {
3765 LogFlowFunc(("I/O context completed pIoCtx=%#p\n", pIoCtx));
3766 if (pIoCtx->pIoCtxParent)
3767 {
3768 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
3769
3770 Assert(!pIoCtxParent->pIoCtxParent);
3771 if (RT_FAILURE(pIoCtx->rcReq))
3772 ASMAtomicCmpXchgS32(&pIoCtxParent->rcReq, pIoCtx->rcReq, VINF_SUCCESS);
3773
3774 ASMAtomicDecU32(&pIoCtxParent->cDataTransfersPending);
3775
3776 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE)
3777 {
3778 LogFlowFunc(("I/O context transferred %u bytes for the parent pIoCtxParent=%p\n",
3779 pIoCtx->Type.Child.cbTransferParent, pIoCtxParent));
3780
3781 /* Update the parent state. */
3782 Assert(pIoCtxParent->Req.Io.cbTransferLeft >= pIoCtx->Type.Child.cbTransferParent);
3783 ASMAtomicSubU32(&pIoCtxParent->Req.Io.cbTransferLeft, (uint32_t)pIoCtx->Type.Child.cbTransferParent);
3784 }
3785 else
3786 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH);
3787
3788 /*
3789 * A completed child write means that we finished growing the image.
3790 * We have to process any pending writes now.
3791 */
3792 vdIoCtxUnlockDisk(pDisk, pIoCtxParent, false /* fProcessDeferredReqs */);
3793
3794 /* Unblock the parent */
3795 pIoCtxParent->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3796
3797 rc = vdIoCtxProcessLocked(pIoCtxParent);
3798
3799 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3800 && ASMAtomicCmpXchgBool(&pIoCtxParent->fComplete, true, false))
3801 {
3802 LogFlowFunc(("Parent I/O context completed pIoCtxParent=%#p rcReq=%Rrc\n", pIoCtxParent, pIoCtxParent->rcReq));
3803 vdIoCtxRootComplete(pDisk, pIoCtxParent);
3804 vdThreadFinishWrite(pDisk);
3805 vdIoCtxFree(pDisk, pIoCtxParent);
3806 vdDiskProcessBlockedIoCtx(pDisk);
3807 }
3808 else if (!vdIoCtxIsDiskLockOwner(pDisk, pIoCtx))
3809 {
3810 /* Process any pending writes if the current request didn't caused another growing. */
3811 vdDiskProcessBlockedIoCtx(pDisk);
3812 }
3813 }
3814 else
3815 {
3816 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH)
3817 {
3818 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDerredReqs */);
3819 vdThreadFinishWrite(pDisk);
3820 }
3821 else if ( pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE
3822 || pIoCtx->enmTxDir == VDIOCTXTXDIR_DISCARD)
3823 vdThreadFinishWrite(pDisk);
3824 else
3825 {
3826 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_READ);
3827 vdThreadFinishRead(pDisk);
3828 }
3829
3830 LogFlowFunc(("I/O context completed pIoCtx=%#p rcReq=%Rrc\n", pIoCtx, pIoCtx->rcReq));
3831 vdIoCtxRootComplete(pDisk, pIoCtx);
3832 }
3833
3834 vdIoCtxFree(pDisk, pIoCtx);
3835 }
3836 }
3837
3838 return VINF_SUCCESS;
3839}
3840
3841/**
3842 * Internal - Called when user transfer completed.
3843 */
3844static int vdUserXferCompleted(PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
3845 PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3846 size_t cbTransfer, int rcReq)
3847{
3848 int rc = VINF_SUCCESS;
3849 bool fIoCtxContinue = true;
3850 PVBOXHDD pDisk = pIoCtx->pDisk;
3851
3852 LogFlowFunc(("pIoStorage=%#p pIoCtx=%#p pfnComplete=%#p pvUser=%#p cbTransfer=%zu rcReq=%Rrc\n",
3853 pIoStorage, pIoCtx, pfnComplete, pvUser, cbTransfer, rcReq));
3854
3855 VD_IS_LOCKED(pDisk);
3856
3857 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbTransfer);
3858 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTransfer); Assert(cbTransfer == (uint32_t)cbTransfer);
3859 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
3860
3861 if (pfnComplete)
3862 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3863
3864 if (RT_SUCCESS(rc))
3865 rc = vdIoCtxContinue(pIoCtx, rcReq);
3866 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3867 rc = VINF_SUCCESS;
3868
3869 return rc;
3870}
3871
3872/**
3873 * Internal - Called when a meta transfer completed.
3874 */
3875static int vdMetaXferCompleted(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3876 PVDMETAXFER pMetaXfer, int rcReq)
3877{
3878 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
3879 RTLISTNODE ListIoCtxWaiting;
3880 bool fFlush;
3881
3882 LogFlowFunc(("pIoStorage=%#p pfnComplete=%#p pvUser=%#p pMetaXfer=%#p rcReq=%Rrc\n",
3883 pIoStorage, pfnComplete, pvUser, pMetaXfer, rcReq));
3884
3885 VD_IS_LOCKED(pDisk);
3886
3887 fFlush = VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_FLUSH;
3888 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
3889
3890 if (!fFlush)
3891 {
3892 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3893
3894 if (RT_FAILURE(rcReq))
3895 {
3896 /* Remove from the AVL tree. */
3897 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3898 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3899 Assert(fRemoved);
3900 RTMemFree(pMetaXfer);
3901 }
3902 else
3903 {
3904 /* Increase the reference counter to make sure it doesn't go away before the last context is processed. */
3905 pMetaXfer->cRefs++;
3906 }
3907 }
3908 else
3909 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3910
3911 /* Go through the waiting list and continue the I/O contexts. */
3912 while (!RTListIsEmpty(&ListIoCtxWaiting))
3913 {
3914 int rc = VINF_SUCCESS;
3915 bool fContinue = true;
3916 PVDIOCTXDEFERRED pDeferred = RTListGetFirst(&ListIoCtxWaiting, VDIOCTXDEFERRED, NodeDeferred);
3917 PVDIOCTX pIoCtx = pDeferred->pIoCtx;
3918 RTListNodeRemove(&pDeferred->NodeDeferred);
3919
3920 RTMemFree(pDeferred);
3921 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
3922
3923 if (pfnComplete)
3924 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3925
3926 LogFlow(("Completion callback for I/O context %#p returned %Rrc\n", pIoCtx, rc));
3927
3928 if (RT_SUCCESS(rc))
3929 {
3930 rc = vdIoCtxContinue(pIoCtx, rcReq);
3931 AssertRC(rc);
3932 }
3933 else
3934 Assert(rc == VERR_VD_ASYNC_IO_IN_PROGRESS);
3935 }
3936
3937 /* Remove if not used anymore. */
3938 if (RT_SUCCESS(rcReq) && !fFlush)
3939 {
3940 pMetaXfer->cRefs--;
3941 if (!pMetaXfer->cRefs && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting))
3942 {
3943 /* Remove from the AVL tree. */
3944 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3945 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3946 Assert(fRemoved);
3947 RTMemFree(pMetaXfer);
3948 }
3949 }
3950 else if (fFlush)
3951 RTMemFree(pMetaXfer);
3952
3953 return VINF_SUCCESS;
3954}
3955
3956/**
3957 * Processes a list of waiting I/O tasks. The disk lock must be held by caller.
3958 *
3959 * @returns nothing.
3960 * @param pDisk The disk to process the list for.
3961 */
3962static void vdIoTaskProcessWaitingList(PVBOXHDD pDisk)
3963{
3964 LogFlowFunc(("pDisk=%#p\n", pDisk));
3965
3966 VD_IS_LOCKED(pDisk);
3967
3968 PVDIOTASK pHead = ASMAtomicXchgPtrT(&pDisk->pIoTasksPendingHead, NULL, PVDIOTASK);
3969
3970 Log(("I/O task list cleared\n"));
3971
3972 /* Reverse order. */
3973 PVDIOTASK pCur = pHead;
3974 pHead = NULL;
3975 while (pCur)
3976 {
3977 PVDIOTASK pInsert = pCur;
3978 pCur = pCur->pNext;
3979 pInsert->pNext = pHead;
3980 pHead = pInsert;
3981 }
3982
3983 while (pHead)
3984 {
3985 PVDIOSTORAGE pIoStorage = pHead->pIoStorage;
3986
3987 if (!pHead->fMeta)
3988 vdUserXferCompleted(pIoStorage, pHead->Type.User.pIoCtx,
3989 pHead->pfnComplete, pHead->pvUser,
3990 pHead->Type.User.cbTransfer, pHead->rcReq);
3991 else
3992 vdMetaXferCompleted(pIoStorage, pHead->pfnComplete, pHead->pvUser,
3993 pHead->Type.Meta.pMetaXfer, pHead->rcReq);
3994
3995 pCur = pHead;
3996 pHead = pHead->pNext;
3997 vdIoTaskFree(pDisk, pCur);
3998 }
3999}
4000
4001/**
4002 * Process any I/O context on the halted list.
4003 *
4004 * @returns nothing.
4005 * @param pDisk The disk.
4006 */
4007static void vdIoCtxProcessHaltedList(PVBOXHDD pDisk)
4008{
4009 LogFlowFunc(("pDisk=%#p\n", pDisk));
4010
4011 VD_IS_LOCKED(pDisk);
4012
4013 /* Get the waiting list and process it in FIFO order. */
4014 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHaltedHead, NULL, PVDIOCTX);
4015
4016 /* Reverse it. */
4017 PVDIOCTX pCur = pIoCtxHead;
4018 pIoCtxHead = NULL;
4019 while (pCur)
4020 {
4021 PVDIOCTX pInsert = pCur;
4022 pCur = pCur->pIoCtxNext;
4023 pInsert->pIoCtxNext = pIoCtxHead;
4024 pIoCtxHead = pInsert;
4025 }
4026
4027 /* Process now. */
4028 pCur = pIoCtxHead;
4029 while (pCur)
4030 {
4031 PVDIOCTX pTmp = pCur;
4032
4033 pCur = pCur->pIoCtxNext;
4034 pTmp->pIoCtxNext = NULL;
4035
4036 /* Continue */
4037 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
4038 vdIoCtxContinue(pTmp, pTmp->rcReq);
4039 }
4040}
4041
4042/**
4043 * Unlock the disk and process pending tasks.
4044 *
4045 * @returns VBox status code.
4046 * @param pDisk The disk to unlock.
4047 */
4048static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
4049{
4050 int rc = VINF_SUCCESS;
4051
4052 VD_IS_LOCKED(pDisk);
4053
4054 /*
4055 * Process the list of waiting I/O tasks first
4056 * because they might complete I/O contexts.
4057 * Same for the list of halted I/O contexts.
4058 * Afterwards comes the list of new I/O contexts.
4059 */
4060 vdIoTaskProcessWaitingList(pDisk);
4061 vdIoCtxProcessHaltedList(pDisk);
4062 rc = vdDiskProcessWaitingIoCtx(pDisk, pIoCtxRc);
4063 ASMAtomicXchgBool(&pDisk->fLocked, false);
4064
4065 /*
4066 * Need to check for new I/O tasks and waiting I/O contexts now
4067 * again as other threads might added them while we processed
4068 * previous lists.
4069 */
4070 while ( ASMAtomicUoReadPtrT(&pDisk->pIoCtxHead, PVDIOCTX) != NULL
4071 || ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK) != NULL
4072 || ASMAtomicUoReadPtrT(&pDisk->pIoCtxHaltedHead, PVDIOCTX) != NULL)
4073 {
4074 /* Try lock disk again. */
4075 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4076 {
4077 vdIoTaskProcessWaitingList(pDisk);
4078 vdIoCtxProcessHaltedList(pDisk);
4079 vdDiskProcessWaitingIoCtx(pDisk, NULL);
4080 ASMAtomicXchgBool(&pDisk->fLocked, false);
4081 }
4082 else /* Let the other thread everything when he unlocks the disk. */
4083 break;
4084 }
4085
4086 return rc;
4087}
4088
4089/**
4090 * Try to lock the disk to complete pressing of the I/O task.
4091 * The completion is deferred if the disk is locked already.
4092 *
4093 * @returns nothing.
4094 * @param pIoTask The I/O task to complete.
4095 */
4096static void vdXferTryLockDiskDeferIoTask(PVDIOTASK pIoTask)
4097{
4098 PVDIOSTORAGE pIoStorage = pIoTask->pIoStorage;
4099 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
4100
4101 Log(("Deferring I/O task pIoTask=%p\n", pIoTask));
4102
4103 /* Put it on the waiting list. */
4104 PVDIOTASK pNext = ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK);
4105 PVDIOTASK pHeadOld;
4106 pIoTask->pNext = pNext;
4107 while (!ASMAtomicCmpXchgExPtr(&pDisk->pIoTasksPendingHead, pIoTask, pNext, &pHeadOld))
4108 {
4109 pNext = pHeadOld;
4110 Assert(pNext != pIoTask);
4111 pIoTask->pNext = pNext;
4112 ASMNopPause();
4113 }
4114
4115 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4116 {
4117 /* Release disk lock, it will take care of processing all lists. */
4118 vdDiskUnlock(pDisk, NULL);
4119 }
4120}
4121
4122static int vdIOIntReqCompleted(void *pvUser, int rcReq)
4123{
4124 PVDIOTASK pIoTask = (PVDIOTASK)pvUser;
4125
4126 LogFlowFunc(("Task completed pIoTask=%#p\n", pIoTask));
4127
4128 pIoTask->rcReq = rcReq;
4129 vdXferTryLockDiskDeferIoTask(pIoTask);
4130 return VINF_SUCCESS;
4131}
4132
4133/**
4134 * VD I/O interface callback for opening a file.
4135 */
4136static int vdIOIntOpen(void *pvUser, const char *pszLocation,
4137 unsigned uOpenFlags, PPVDIOSTORAGE ppIoStorage)
4138{
4139 int rc = VINF_SUCCESS;
4140 PVDIO pVDIo = (PVDIO)pvUser;
4141 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
4142
4143 if (!pIoStorage)
4144 return VERR_NO_MEMORY;
4145
4146 /* Create the AVl tree. */
4147 pIoStorage->pTreeMetaXfers = (PAVLRFOFFTREE)RTMemAllocZ(sizeof(AVLRFOFFTREE));
4148 if (pIoStorage->pTreeMetaXfers)
4149 {
4150 rc = pVDIo->pInterfaceIo->pfnOpen(pVDIo->pInterfaceIo->Core.pvUser,
4151 pszLocation, uOpenFlags,
4152 vdIOIntReqCompleted,
4153 &pIoStorage->pStorage);
4154 if (RT_SUCCESS(rc))
4155 {
4156 pIoStorage->pVDIo = pVDIo;
4157 *ppIoStorage = pIoStorage;
4158 return VINF_SUCCESS;
4159 }
4160
4161 RTMemFree(pIoStorage->pTreeMetaXfers);
4162 }
4163 else
4164 rc = VERR_NO_MEMORY;
4165
4166 RTMemFree(pIoStorage);
4167 return rc;
4168}
4169
4170static int vdIOIntTreeMetaXferDestroy(PAVLRFOFFNODECORE pNode, void *pvUser)
4171{
4172 AssertMsgFailed(("Tree should be empty at this point!\n"));
4173 return VINF_SUCCESS;
4174}
4175
4176static int vdIOIntClose(void *pvUser, PVDIOSTORAGE pIoStorage)
4177{
4178 int rc = VINF_SUCCESS;
4179 PVDIO pVDIo = (PVDIO)pvUser;
4180
4181 /* We free everything here, even if closing the file failed for some reason. */
4182 rc = pVDIo->pInterfaceIo->pfnClose(pVDIo->pInterfaceIo->Core.pvUser, pIoStorage->pStorage);
4183 RTAvlrFileOffsetDestroy(pIoStorage->pTreeMetaXfers, vdIOIntTreeMetaXferDestroy, NULL);
4184 RTMemFree(pIoStorage->pTreeMetaXfers);
4185 RTMemFree(pIoStorage);
4186 return rc;
4187}
4188
4189static int vdIOIntDelete(void *pvUser, const char *pcszFilename)
4190{
4191 PVDIO pVDIo = (PVDIO)pvUser;
4192 return pVDIo->pInterfaceIo->pfnDelete(pVDIo->pInterfaceIo->Core.pvUser,
4193 pcszFilename);
4194}
4195
4196static int vdIOIntMove(void *pvUser, const char *pcszSrc, const char *pcszDst,
4197 unsigned fMove)
4198{
4199 PVDIO pVDIo = (PVDIO)pvUser;
4200 return pVDIo->pInterfaceIo->pfnMove(pVDIo->pInterfaceIo->Core.pvUser,
4201 pcszSrc, pcszDst, fMove);
4202}
4203
4204static int vdIOIntGetFreeSpace(void *pvUser, const char *pcszFilename,
4205 int64_t *pcbFreeSpace)
4206{
4207 PVDIO pVDIo = (PVDIO)pvUser;
4208 return pVDIo->pInterfaceIo->pfnGetFreeSpace(pVDIo->pInterfaceIo->Core.pvUser,
4209 pcszFilename, pcbFreeSpace);
4210}
4211
4212static int vdIOIntGetModificationTime(void *pvUser, const char *pcszFilename,
4213 PRTTIMESPEC pModificationTime)
4214{
4215 PVDIO pVDIo = (PVDIO)pvUser;
4216 return pVDIo->pInterfaceIo->pfnGetModificationTime(pVDIo->pInterfaceIo->Core.pvUser,
4217 pcszFilename, pModificationTime);
4218}
4219
4220static int vdIOIntGetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4221 uint64_t *pcbSize)
4222{
4223 PVDIO pVDIo = (PVDIO)pvUser;
4224 return pVDIo->pInterfaceIo->pfnGetSize(pVDIo->pInterfaceIo->Core.pvUser,
4225 pIoStorage->pStorage, pcbSize);
4226}
4227
4228static int vdIOIntSetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4229 uint64_t cbSize)
4230{
4231 PVDIO pVDIo = (PVDIO)pvUser;
4232 return pVDIo->pInterfaceIo->pfnSetSize(pVDIo->pInterfaceIo->Core.pvUser,
4233 pIoStorage->pStorage, cbSize);
4234}
4235
4236static int vdIOIntReadUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4237 PVDIOCTX pIoCtx, size_t cbRead)
4238{
4239 int rc = VINF_SUCCESS;
4240 PVDIO pVDIo = (PVDIO)pvUser;
4241 PVBOXHDD pDisk = pVDIo->pDisk;
4242
4243 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbRead=%u\n",
4244 pvUser, pIoStorage, uOffset, pIoCtx, cbRead));
4245
4246 /** @todo: Enable check for sync I/O later. */
4247 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4248 VD_IS_LOCKED(pDisk);
4249
4250 Assert(cbRead > 0);
4251
4252 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4253 {
4254 RTSGSEG Seg;
4255 unsigned cSegments = 1;
4256 size_t cbTaskRead = 0;
4257
4258 /* Synchronous I/O contexts only have one buffer segment. */
4259 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4260 ("Invalid number of buffer segments for synchronous I/O context"),
4261 VERR_INVALID_PARAMETER);
4262
4263 cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbRead);
4264 Assert(cbRead == cbTaskRead);
4265 Assert(cSegments == 1);
4266 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4267 pIoStorage->pStorage, uOffset,
4268 Seg.pvSeg, cbRead, NULL);
4269 if (RT_SUCCESS(rc))
4270 {
4271 Assert(cbRead == (uint32_t)cbRead);
4272 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbRead);
4273 }
4274 }
4275 else
4276 {
4277 /* Build the S/G array and spawn a new I/O task */
4278 while (cbRead)
4279 {
4280 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4281 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4282 size_t cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbRead);
4283
4284 Assert(cSegments > 0);
4285 Assert(cbTaskRead > 0);
4286 AssertMsg(cbTaskRead <= cbRead, ("Invalid number of bytes to read\n"));
4287
4288 LogFlow(("Reading %u bytes into %u segments\n", cbTaskRead, cSegments));
4289
4290#ifdef RT_STRICT
4291 for (unsigned i = 0; i < cSegments; i++)
4292 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4293 ("Segment %u is invalid\n", i));
4294#endif
4295
4296 Assert(cbTaskRead == (uint32_t)cbTaskRead);
4297 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, NULL, NULL, pIoCtx, (uint32_t)cbTaskRead);
4298
4299 if (!pIoTask)
4300 return VERR_NO_MEMORY;
4301
4302 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4303
4304 void *pvTask;
4305 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4306 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4307 pIoStorage->pStorage, uOffset,
4308 aSeg, cSegments, cbTaskRead, pIoTask,
4309 &pvTask);
4310 if (RT_SUCCESS(rc))
4311 {
4312 AssertMsg(cbTaskRead <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4313 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskRead);
4314 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4315 vdIoTaskFree(pDisk, pIoTask);
4316 }
4317 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4318 {
4319 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4320 vdIoTaskFree(pDisk, pIoTask);
4321 break;
4322 }
4323
4324 uOffset += cbTaskRead;
4325 cbRead -= cbTaskRead;
4326 }
4327 }
4328
4329 LogFlowFunc(("returns rc=%Rrc\n", rc));
4330 return rc;
4331}
4332
4333static int vdIOIntWriteUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4334 PVDIOCTX pIoCtx, size_t cbWrite, PFNVDXFERCOMPLETED pfnComplete,
4335 void *pvCompleteUser)
4336{
4337 int rc = VINF_SUCCESS;
4338 PVDIO pVDIo = (PVDIO)pvUser;
4339 PVBOXHDD pDisk = pVDIo->pDisk;
4340
4341 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbWrite=%u\n",
4342 pvUser, pIoStorage, uOffset, pIoCtx, cbWrite));
4343
4344 /** @todo: Enable check for sync I/O later. */
4345 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4346 VD_IS_LOCKED(pDisk);
4347
4348 Assert(cbWrite > 0);
4349
4350 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4351 {
4352 RTSGSEG Seg;
4353 unsigned cSegments = 1;
4354 size_t cbTaskWrite = 0;
4355
4356 /* Synchronous I/O contexts only have one buffer segment. */
4357 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4358 ("Invalid number of buffer segments for synchronous I/O context"),
4359 VERR_INVALID_PARAMETER);
4360
4361 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbWrite);
4362 Assert(cbWrite == cbTaskWrite);
4363 Assert(cSegments == 1);
4364 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4365 pIoStorage->pStorage, uOffset,
4366 Seg.pvSeg, cbWrite, NULL);
4367 if (RT_SUCCESS(rc))
4368 {
4369 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbWrite);
4370 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbWrite);
4371 }
4372 }
4373 else
4374 {
4375 /* Build the S/G array and spawn a new I/O task */
4376 while (cbWrite)
4377 {
4378 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4379 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4380 size_t cbTaskWrite = 0;
4381
4382 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbWrite);
4383
4384 Assert(cSegments > 0);
4385 Assert(cbTaskWrite > 0);
4386 AssertMsg(cbTaskWrite <= cbWrite, ("Invalid number of bytes to write\n"));
4387
4388 LogFlow(("Writing %u bytes from %u segments\n", cbTaskWrite, cSegments));
4389
4390#ifdef DEBUG
4391 for (unsigned i = 0; i < cSegments; i++)
4392 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4393 ("Segment %u is invalid\n", i));
4394#endif
4395
4396 Assert(cbTaskWrite == (uint32_t)cbTaskWrite);
4397 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, pfnComplete, pvCompleteUser, pIoCtx, (uint32_t)cbTaskWrite);
4398
4399 if (!pIoTask)
4400 return VERR_NO_MEMORY;
4401
4402 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4403
4404 void *pvTask;
4405 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4406 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4407 pIoStorage->pStorage,
4408 uOffset, aSeg, cSegments,
4409 cbTaskWrite, pIoTask, &pvTask);
4410 if (RT_SUCCESS(rc))
4411 {
4412 AssertMsg(cbTaskWrite <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4413 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskWrite);
4414 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4415 vdIoTaskFree(pDisk, pIoTask);
4416 }
4417 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4418 {
4419 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4420 vdIoTaskFree(pDisk, pIoTask);
4421 break;
4422 }
4423
4424 uOffset += cbTaskWrite;
4425 cbWrite -= cbTaskWrite;
4426 }
4427 }
4428
4429 LogFlowFunc(("returns rc=%Rrc\n", rc));
4430 return rc;
4431}
4432
4433static int vdIOIntReadMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4434 void *pvBuf, size_t cbRead, PVDIOCTX pIoCtx,
4435 PPVDMETAXFER ppMetaXfer, PFNVDXFERCOMPLETED pfnComplete,
4436 void *pvCompleteUser)
4437{
4438 PVDIO pVDIo = (PVDIO)pvUser;
4439 PVBOXHDD pDisk = pVDIo->pDisk;
4440 int rc = VINF_SUCCESS;
4441 RTSGSEG Seg;
4442 PVDIOTASK pIoTask;
4443 PVDMETAXFER pMetaXfer = NULL;
4444 void *pvTask = NULL;
4445
4446 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbRead=%u\n",
4447 pvUser, pIoStorage, uOffset, pvBuf, cbRead));
4448
4449 AssertMsgReturn( pIoCtx
4450 || (!ppMetaXfer && !pfnComplete && !pvCompleteUser),
4451 ("A synchronous metadata read is requested but the parameters are wrong\n"),
4452 VERR_INVALID_POINTER);
4453
4454 /** @todo: Enable check for sync I/O later. */
4455 if ( pIoCtx
4456 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4457 VD_IS_LOCKED(pDisk);
4458
4459 if ( !pIoCtx
4460 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4461 {
4462 /* Handle synchronous metadata I/O. */
4463 /** @todo: Integrate with metadata transfers below. */
4464 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4465 pIoStorage->pStorage, uOffset,
4466 pvBuf, cbRead, NULL);
4467 if (ppMetaXfer)
4468 *ppMetaXfer = NULL;
4469 }
4470 else
4471 {
4472 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4473 if (!pMetaXfer)
4474 {
4475#ifdef RT_STRICT
4476 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGetBestFit(pIoStorage->pTreeMetaXfers, uOffset, false /* fAbove */);
4477 AssertMsg(!pMetaXfer || (pMetaXfer->Core.Key + (RTFOFF)pMetaXfer->cbMeta <= (RTFOFF)uOffset),
4478 ("Overlapping meta transfers!\n"));
4479#endif
4480
4481 /* Allocate a new meta transfer. */
4482 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbRead);
4483 if (!pMetaXfer)
4484 return VERR_NO_MEMORY;
4485
4486 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4487 if (!pIoTask)
4488 {
4489 RTMemFree(pMetaXfer);
4490 return VERR_NO_MEMORY;
4491 }
4492
4493 Seg.cbSeg = cbRead;
4494 Seg.pvSeg = pMetaXfer->abData;
4495
4496 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_READ);
4497 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4498 pIoStorage->pStorage,
4499 uOffset, &Seg, 1,
4500 cbRead, pIoTask, &pvTask);
4501
4502 if (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4503 {
4504 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4505 Assert(fInserted);
4506 }
4507 else
4508 RTMemFree(pMetaXfer);
4509
4510 if (RT_SUCCESS(rc))
4511 {
4512 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4513 vdIoTaskFree(pDisk, pIoTask);
4514 }
4515 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS && !pfnComplete)
4516 rc = VERR_VD_NOT_ENOUGH_METADATA;
4517 }
4518
4519 Assert(VALID_PTR(pMetaXfer) || RT_FAILURE(rc));
4520
4521 if (RT_SUCCESS(rc) || rc == VERR_VD_NOT_ENOUGH_METADATA || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4522 {
4523 /* If it is pending add the request to the list. */
4524 if (VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_READ)
4525 {
4526 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4527 AssertPtr(pDeferred);
4528
4529 RTListInit(&pDeferred->NodeDeferred);
4530 pDeferred->pIoCtx = pIoCtx;
4531
4532 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4533 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4534 rc = VERR_VD_NOT_ENOUGH_METADATA;
4535 }
4536 else
4537 {
4538 /* Transfer the data. */
4539 pMetaXfer->cRefs++;
4540 Assert(pMetaXfer->cbMeta >= cbRead);
4541 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4542 memcpy(pvBuf, pMetaXfer->abData, cbRead);
4543 *ppMetaXfer = pMetaXfer;
4544 }
4545 }
4546 }
4547
4548 LogFlowFunc(("returns rc=%Rrc\n", rc));
4549 return rc;
4550}
4551
4552static int vdIOIntWriteMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4553 const void *pvBuf, size_t cbWrite, PVDIOCTX pIoCtx,
4554 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4555{
4556 PVDIO pVDIo = (PVDIO)pvUser;
4557 PVBOXHDD pDisk = pVDIo->pDisk;
4558 int rc = VINF_SUCCESS;
4559 RTSGSEG Seg;
4560 PVDIOTASK pIoTask;
4561 PVDMETAXFER pMetaXfer = NULL;
4562 bool fInTree = false;
4563 void *pvTask = NULL;
4564
4565 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbWrite=%u\n",
4566 pvUser, pIoStorage, uOffset, pvBuf, cbWrite));
4567
4568 AssertMsgReturn( pIoCtx
4569 || (!pfnComplete && !pvCompleteUser),
4570 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4571 VERR_INVALID_POINTER);
4572
4573 /** @todo: Enable check for sync I/O later. */
4574 if ( pIoCtx
4575 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4576 VD_IS_LOCKED(pDisk);
4577
4578 if ( !pIoCtx
4579 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4580 {
4581 /* Handle synchronous metadata I/O. */
4582 /** @todo: Integrate with metadata transfers below. */
4583 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4584 pIoStorage->pStorage, uOffset,
4585 pvBuf, cbWrite, NULL);
4586 }
4587 else
4588 {
4589 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4590 if (!pMetaXfer)
4591 {
4592 /* Allocate a new meta transfer. */
4593 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbWrite);
4594 if (!pMetaXfer)
4595 return VERR_NO_MEMORY;
4596 }
4597 else
4598 {
4599 Assert(pMetaXfer->cbMeta >= cbWrite);
4600 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4601 fInTree = true;
4602 }
4603
4604 Assert(VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE);
4605
4606 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4607 if (!pIoTask)
4608 {
4609 RTMemFree(pMetaXfer);
4610 return VERR_NO_MEMORY;
4611 }
4612
4613 memcpy(pMetaXfer->abData, pvBuf, cbWrite);
4614 Seg.cbSeg = cbWrite;
4615 Seg.pvSeg = pMetaXfer->abData;
4616
4617 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4618
4619 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_WRITE);
4620 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4621 pIoStorage->pStorage,
4622 uOffset, &Seg, 1, cbWrite, pIoTask,
4623 &pvTask);
4624 if (RT_SUCCESS(rc))
4625 {
4626 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4627 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4628 vdIoTaskFree(pDisk, pIoTask);
4629 if (fInTree && !pMetaXfer->cRefs)
4630 {
4631 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4632 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4633 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4634 RTMemFree(pMetaXfer);
4635 pMetaXfer = NULL;
4636 }
4637 }
4638 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4639 {
4640 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4641 AssertPtr(pDeferred);
4642
4643 RTListInit(&pDeferred->NodeDeferred);
4644 pDeferred->pIoCtx = pIoCtx;
4645
4646 if (!fInTree)
4647 {
4648 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4649 Assert(fInserted);
4650 }
4651
4652 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4653 }
4654 else
4655 {
4656 RTMemFree(pMetaXfer);
4657 pMetaXfer = NULL;
4658 }
4659 }
4660
4661 LogFlowFunc(("returns rc=%Rrc\n", rc));
4662 return rc;
4663}
4664
4665static void vdIOIntMetaXferRelease(void *pvUser, PVDMETAXFER pMetaXfer)
4666{
4667 PVDIO pVDIo = (PVDIO)pvUser;
4668 PVBOXHDD pDisk = pVDIo->pDisk;
4669 PVDIOSTORAGE pIoStorage;
4670
4671 /*
4672 * It is possible that we get called with a NULL metadata xfer handle
4673 * for synchronous I/O. Just exit.
4674 */
4675 if (!pMetaXfer)
4676 return;
4677
4678 pIoStorage = pMetaXfer->pIoStorage;
4679
4680 VD_IS_LOCKED(pDisk);
4681
4682 Assert( VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE
4683 || VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
4684 Assert(pMetaXfer->cRefs > 0);
4685
4686 pMetaXfer->cRefs--;
4687 if ( !pMetaXfer->cRefs
4688 && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting)
4689 && VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
4690 {
4691 /* Free the meta data entry. */
4692 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4693 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4694 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4695
4696 RTMemFree(pMetaXfer);
4697 }
4698}
4699
4700static int vdIOIntFlush(void *pvUser, PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
4701 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4702{
4703 PVDIO pVDIo = (PVDIO)pvUser;
4704 PVBOXHDD pDisk = pVDIo->pDisk;
4705 int rc = VINF_SUCCESS;
4706 PVDIOTASK pIoTask;
4707 PVDMETAXFER pMetaXfer = NULL;
4708 void *pvTask = NULL;
4709
4710 LogFlowFunc(("pvUser=%#p pIoStorage=%#p pIoCtx=%#p\n",
4711 pvUser, pIoStorage, pIoCtx));
4712
4713 AssertMsgReturn( pIoCtx
4714 || (!pfnComplete && !pvCompleteUser),
4715 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4716 VERR_INVALID_POINTER);
4717
4718 /** @todo: Enable check for sync I/O later. */
4719 if ( pIoCtx
4720 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4721 VD_IS_LOCKED(pDisk);
4722
4723 if (pVDIo->fIgnoreFlush)
4724 return VINF_SUCCESS;
4725
4726 if ( !pIoCtx
4727 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4728 {
4729 /* Handle synchronous flushes. */
4730 /** @todo: Integrate with metadata transfers below. */
4731 rc = pVDIo->pInterfaceIo->pfnFlushSync(pVDIo->pInterfaceIo->Core.pvUser,
4732 pIoStorage->pStorage);
4733 }
4734 else
4735 {
4736 /* Allocate a new meta transfer. */
4737 pMetaXfer = vdMetaXferAlloc(pIoStorage, 0, 0);
4738 if (!pMetaXfer)
4739 return VERR_NO_MEMORY;
4740
4741 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvUser, pMetaXfer);
4742 if (!pIoTask)
4743 {
4744 RTMemFree(pMetaXfer);
4745 return VERR_NO_MEMORY;
4746 }
4747
4748 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4749
4750 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4751 AssertPtr(pDeferred);
4752
4753 RTListInit(&pDeferred->NodeDeferred);
4754 pDeferred->pIoCtx = pIoCtx;
4755
4756 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4757 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_FLUSH);
4758 rc = pVDIo->pInterfaceIo->pfnFlushAsync(pVDIo->pInterfaceIo->Core.pvUser,
4759 pIoStorage->pStorage,
4760 pIoTask, &pvTask);
4761 if (RT_SUCCESS(rc))
4762 {
4763 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4764 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4765 vdIoTaskFree(pDisk, pIoTask);
4766 RTMemFree(pDeferred);
4767 RTMemFree(pMetaXfer);
4768 }
4769 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4770 RTMemFree(pMetaXfer);
4771 }
4772
4773 LogFlowFunc(("returns rc=%Rrc\n", rc));
4774 return rc;
4775}
4776
4777static size_t vdIOIntIoCtxCopyTo(void *pvUser, PVDIOCTX pIoCtx,
4778 const void *pvBuf, size_t cbBuf)
4779{
4780 PVDIO pVDIo = (PVDIO)pvUser;
4781 PVBOXHDD pDisk = pVDIo->pDisk;
4782 size_t cbCopied = 0;
4783
4784 /** @todo: Enable check for sync I/O later. */
4785 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4786 VD_IS_LOCKED(pDisk);
4787
4788 cbCopied = vdIoCtxCopyTo(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4789 Assert(cbCopied == cbBuf);
4790
4791 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCopied); - triggers with vdCopyHelper/dmgRead.
4792 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4793
4794 return cbCopied;
4795}
4796
4797static size_t vdIOIntIoCtxCopyFrom(void *pvUser, PVDIOCTX pIoCtx,
4798 void *pvBuf, size_t cbBuf)
4799{
4800 PVDIO pVDIo = (PVDIO)pvUser;
4801 PVBOXHDD pDisk = pVDIo->pDisk;
4802 size_t cbCopied = 0;
4803
4804 /** @todo: Enable check for sync I/O later. */
4805 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4806 VD_IS_LOCKED(pDisk);
4807
4808 cbCopied = vdIoCtxCopyFrom(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4809 Assert(cbCopied == cbBuf);
4810
4811 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft > cbCopied); - triggers with vdCopyHelper/dmgRead.
4812 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4813
4814 return cbCopied;
4815}
4816
4817static size_t vdIOIntIoCtxSet(void *pvUser, PVDIOCTX pIoCtx, int ch, size_t cb)
4818{
4819 PVDIO pVDIo = (PVDIO)pvUser;
4820 PVBOXHDD pDisk = pVDIo->pDisk;
4821 size_t cbSet = 0;
4822
4823 /** @todo: Enable check for sync I/O later. */
4824 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4825 VD_IS_LOCKED(pDisk);
4826
4827 cbSet = vdIoCtxSet(pIoCtx, ch, cb);
4828 Assert(cbSet == cb);
4829
4830 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbSet); - triggers with vdCopyHelper/dmgRead.
4831 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbSet);
4832
4833 return cbSet;
4834}
4835
4836static size_t vdIOIntIoCtxSegArrayCreate(void *pvUser, PVDIOCTX pIoCtx,
4837 PRTSGSEG paSeg, unsigned *pcSeg,
4838 size_t cbData)
4839{
4840 PVDIO pVDIo = (PVDIO)pvUser;
4841 PVBOXHDD pDisk = pVDIo->pDisk;
4842 size_t cbCreated = 0;
4843
4844 /** @todo: Enable check for sync I/O later. */
4845 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4846 VD_IS_LOCKED(pDisk);
4847
4848 cbCreated = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, paSeg, pcSeg, cbData);
4849 Assert(!paSeg || cbData == cbCreated);
4850
4851 return cbCreated;
4852}
4853
4854static void vdIOIntIoCtxCompleted(void *pvUser, PVDIOCTX pIoCtx, int rcReq,
4855 size_t cbCompleted)
4856{
4857 PVDIO pVDIo = (PVDIO)pvUser;
4858 PVBOXHDD pDisk = pVDIo->pDisk;
4859
4860 LogFlowFunc(("pvUser=%#p pIoCtx=%#p rcReq=%Rrc cbCompleted=%zu\n",
4861 pvUser, pIoCtx, rcReq, cbCompleted));
4862
4863 /*
4864 * Grab the disk critical section to avoid races with other threads which
4865 * might still modify the I/O context.
4866 * Example is that iSCSI is doing an asynchronous write but calls us already
4867 * while the other thread is still hanging in vdWriteHelperAsync and couldn't update
4868 * the blocked state yet.
4869 * It can overwrite the state to true before we call vdIoCtxContinue and the
4870 * the request would hang indefinite.
4871 */
4872 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
4873 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCompleted);
4874 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCompleted);
4875
4876 /* Set next transfer function if the current one finished.
4877 * @todo: Find a better way to prevent vdIoCtxContinue from calling the current helper again. */
4878 if (!pIoCtx->Req.Io.cbTransferLeft)
4879 {
4880 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
4881 pIoCtx->pfnIoCtxTransferNext = NULL;
4882 }
4883
4884 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHaltedHead, pIoCtx);
4885 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4886 {
4887 /* Immediately drop the lock again, it will take care of processing the list. */
4888 vdDiskUnlock(pDisk, NULL);
4889 }
4890}
4891
4892static DECLCALLBACK(bool) vdIOIntIoCtxIsSynchronous(void *pvUser, PVDIOCTX pIoCtx)
4893{
4894 NOREF(pvUser);
4895 return !!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC);
4896}
4897
4898static DECLCALLBACK(bool) vdIOIntIoCtxIsZero(void *pvUser, PVDIOCTX pIoCtx, size_t cbCheck,
4899 bool fAdvance)
4900{
4901 NOREF(pvUser);
4902
4903 bool fIsZero = RTSgBufIsZero(&pIoCtx->Req.Io.SgBuf, cbCheck);
4904 if (fIsZero && fAdvance)
4905 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbCheck);
4906
4907 return fIsZero;
4908}
4909
4910/**
4911 * VD I/O interface callback for opening a file (limited version for VDGetFormat).
4912 */
4913static int vdIOIntOpenLimited(void *pvUser, const char *pszLocation,
4914 uint32_t fOpen, PPVDIOSTORAGE ppIoStorage)
4915{
4916 int rc = VINF_SUCCESS;
4917 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4918 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
4919
4920 if (!pIoStorage)
4921 return VERR_NO_MEMORY;
4922
4923 rc = pInterfaceIo->pfnOpen(NULL, pszLocation, fOpen, NULL, &pIoStorage->pStorage);
4924 if (RT_SUCCESS(rc))
4925 *ppIoStorage = pIoStorage;
4926 else
4927 RTMemFree(pIoStorage);
4928
4929 return rc;
4930}
4931
4932static int vdIOIntCloseLimited(void *pvUser, PVDIOSTORAGE pIoStorage)
4933{
4934 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4935 int rc = pInterfaceIo->pfnClose(NULL, pIoStorage->pStorage);
4936
4937 RTMemFree(pIoStorage);
4938 return rc;
4939}
4940
4941static int vdIOIntDeleteLimited(void *pvUser, const char *pcszFilename)
4942{
4943 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4944 return pInterfaceIo->pfnDelete(NULL, pcszFilename);
4945}
4946
4947static int vdIOIntMoveLimited(void *pvUser, const char *pcszSrc,
4948 const char *pcszDst, unsigned fMove)
4949{
4950 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4951 return pInterfaceIo->pfnMove(NULL, pcszSrc, pcszDst, fMove);
4952}
4953
4954static int vdIOIntGetFreeSpaceLimited(void *pvUser, const char *pcszFilename,
4955 int64_t *pcbFreeSpace)
4956{
4957 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4958 return pInterfaceIo->pfnGetFreeSpace(NULL, pcszFilename, pcbFreeSpace);
4959}
4960
4961static int vdIOIntGetModificationTimeLimited(void *pvUser,
4962 const char *pcszFilename,
4963 PRTTIMESPEC pModificationTime)
4964{
4965 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4966 return pInterfaceIo->pfnGetModificationTime(NULL, pcszFilename, pModificationTime);
4967}
4968
4969static int vdIOIntGetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4970 uint64_t *pcbSize)
4971{
4972 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4973 return pInterfaceIo->pfnGetSize(NULL, pIoStorage->pStorage, pcbSize);
4974}
4975
4976static int vdIOIntSetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4977 uint64_t cbSize)
4978{
4979 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4980 return pInterfaceIo->pfnSetSize(NULL, pIoStorage->pStorage, cbSize);
4981}
4982
4983static int vdIOIntWriteUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
4984 uint64_t uOffset, PVDIOCTX pIoCtx,
4985 size_t cbWrite,
4986 PFNVDXFERCOMPLETED pfnComplete,
4987 void *pvCompleteUser)
4988{
4989 NOREF(pvUser);
4990 NOREF(pStorage);
4991 NOREF(uOffset);
4992 NOREF(pIoCtx);
4993 NOREF(cbWrite);
4994 NOREF(pfnComplete);
4995 NOREF(pvCompleteUser);
4996 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
4997}
4998
4999static int vdIOIntReadUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
5000 uint64_t uOffset, PVDIOCTX pIoCtx,
5001 size_t cbRead)
5002{
5003 NOREF(pvUser);
5004 NOREF(pStorage);
5005 NOREF(uOffset);
5006 NOREF(pIoCtx);
5007 NOREF(cbRead);
5008 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
5009}
5010
5011static int vdIOIntWriteMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
5012 uint64_t uOffset, const void *pvBuffer,
5013 size_t cbBuffer, PVDIOCTX pIoCtx,
5014 PFNVDXFERCOMPLETED pfnComplete,
5015 void *pvCompleteUser)
5016{
5017 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5018
5019 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
5020 ("Async I/O not implemented for the limited interface"),
5021 VERR_NOT_SUPPORTED);
5022
5023 return pInterfaceIo->pfnWriteSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
5024}
5025
5026static int vdIOIntReadMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
5027 uint64_t uOffset, void *pvBuffer,
5028 size_t cbBuffer, PVDIOCTX pIoCtx,
5029 PPVDMETAXFER ppMetaXfer,
5030 PFNVDXFERCOMPLETED pfnComplete,
5031 void *pvCompleteUser)
5032{
5033 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5034
5035 AssertMsgReturn(!pIoCtx && !ppMetaXfer && !pfnComplete && !pvCompleteUser,
5036 ("Async I/O not implemented for the limited interface"),
5037 VERR_NOT_SUPPORTED);
5038
5039 return pInterfaceIo->pfnReadSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
5040}
5041
5042static int vdIOIntMetaXferReleaseLimited(void *pvUser, PVDMETAXFER pMetaXfer)
5043{
5044 /* This is a NOP in this case. */
5045 NOREF(pvUser);
5046 NOREF(pMetaXfer);
5047 return VINF_SUCCESS;
5048}
5049
5050static int vdIOIntFlushLimited(void *pvUser, PVDIOSTORAGE pStorage,
5051 PVDIOCTX pIoCtx,
5052 PFNVDXFERCOMPLETED pfnComplete,
5053 void *pvCompleteUser)
5054{
5055 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5056
5057 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
5058 ("Async I/O not implemented for the limited interface"),
5059 VERR_NOT_SUPPORTED);
5060
5061 return pInterfaceIo->pfnFlushSync(NULL, pStorage->pStorage);
5062}
5063
5064/**
5065 * internal: send output to the log (unconditionally).
5066 */
5067int vdLogMessage(void *pvUser, const char *pszFormat, va_list args)
5068{
5069 NOREF(pvUser);
5070 RTLogPrintfV(pszFormat, args);
5071 return VINF_SUCCESS;
5072}
5073
5074DECLINLINE(int) vdMessageWrapper(PVBOXHDD pDisk, const char *pszFormat, ...)
5075{
5076 va_list va;
5077 va_start(va, pszFormat);
5078 int rc = pDisk->pInterfaceError->pfnMessage(pDisk->pInterfaceError->Core.pvUser,
5079 pszFormat, va);
5080 va_end(va);
5081 return rc;
5082}
5083
5084
5085/**
5086 * internal: adjust PCHS geometry
5087 */
5088static void vdFixupPCHSGeometry(PVDGEOMETRY pPCHS, uint64_t cbSize)
5089{
5090 /* Fix broken PCHS geometry. Can happen for two reasons: either the backend
5091 * mixes up PCHS and LCHS, or the application used to create the source
5092 * image has put garbage in it. Additionally, if the PCHS geometry covers
5093 * more than the image size, set it back to the default. */
5094 if ( pPCHS->cHeads > 16
5095 || pPCHS->cSectors > 63
5096 || pPCHS->cCylinders == 0
5097 || (uint64_t)pPCHS->cHeads * pPCHS->cSectors * pPCHS->cCylinders * 512 > cbSize)
5098 {
5099 Assert(!(RT_MIN(cbSize / 512 / 16 / 63, 16383) - (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383)));
5100 pPCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383);
5101 pPCHS->cHeads = 16;
5102 pPCHS->cSectors = 63;
5103 }
5104}
5105
5106/**
5107 * internal: adjust PCHS geometry
5108 */
5109static void vdFixupLCHSGeometry(PVDGEOMETRY pLCHS, uint64_t cbSize)
5110{
5111 /* Fix broken LCHS geometry. Can happen for two reasons: either the backend
5112 * mixes up PCHS and LCHS, or the application used to create the source
5113 * image has put garbage in it. The fix in this case is to clear the LCHS
5114 * geometry to trigger autodetection when it is used next. If the geometry
5115 * already says "please autodetect" (cylinders=0) keep it. */
5116 if ( ( pLCHS->cHeads > 255
5117 || pLCHS->cHeads == 0
5118 || pLCHS->cSectors > 63
5119 || pLCHS->cSectors == 0)
5120 && pLCHS->cCylinders != 0)
5121 {
5122 pLCHS->cCylinders = 0;
5123 pLCHS->cHeads = 0;
5124 pLCHS->cSectors = 0;
5125 }
5126 /* Always recompute the number of cylinders stored in the LCHS
5127 * geometry if it isn't set to "autotedetect" at the moment.
5128 * This is very useful if the destination image size is
5129 * larger or smaller than the source image size. Do not modify
5130 * the number of heads and sectors. Windows guests hate it. */
5131 if ( pLCHS->cCylinders != 0
5132 && pLCHS->cHeads != 0 /* paranoia */
5133 && pLCHS->cSectors != 0 /* paranoia */)
5134 {
5135 Assert(!(RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024) - (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024)));
5136 pLCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024);
5137 }
5138}
5139
5140/**
5141 * Sets the I/O callbacks of the given interface to the fallback methods
5142 *
5143 * @returns nothing.
5144 * @param pIfIo The I/O interface to setup.
5145 */
5146static void vdIfIoFallbackCallbacksSetup(PVDINTERFACEIO pIfIo)
5147{
5148 pIfIo->pfnOpen = vdIOOpenFallback;
5149 pIfIo->pfnClose = vdIOCloseFallback;
5150 pIfIo->pfnDelete = vdIODeleteFallback;
5151 pIfIo->pfnMove = vdIOMoveFallback;
5152 pIfIo->pfnGetFreeSpace = vdIOGetFreeSpaceFallback;
5153 pIfIo->pfnGetModificationTime = vdIOGetModificationTimeFallback;
5154 pIfIo->pfnGetSize = vdIOGetSizeFallback;
5155 pIfIo->pfnSetSize = vdIOSetSizeFallback;
5156 pIfIo->pfnReadSync = vdIOReadSyncFallback;
5157 pIfIo->pfnWriteSync = vdIOWriteSyncFallback;
5158 pIfIo->pfnFlushSync = vdIOFlushSyncFallback;
5159 pIfIo->pfnReadAsync = vdIOReadAsyncFallback;
5160 pIfIo->pfnWriteAsync = vdIOWriteAsyncFallback;
5161 pIfIo->pfnFlushAsync = vdIOFlushAsyncFallback;
5162}
5163
5164/**
5165 * Sets the internal I/O callbacks of the given interface.
5166 *
5167 * @returns nothing.
5168 * @param pIfIoInt The internal I/O interface to setup.
5169 */
5170static void vdIfIoIntCallbacksSetup(PVDINTERFACEIOINT pIfIoInt)
5171{
5172 pIfIoInt->pfnOpen = vdIOIntOpen;
5173 pIfIoInt->pfnClose = vdIOIntClose;
5174 pIfIoInt->pfnDelete = vdIOIntDelete;
5175 pIfIoInt->pfnMove = vdIOIntMove;
5176 pIfIoInt->pfnGetFreeSpace = vdIOIntGetFreeSpace;
5177 pIfIoInt->pfnGetModificationTime = vdIOIntGetModificationTime;
5178 pIfIoInt->pfnGetSize = vdIOIntGetSize;
5179 pIfIoInt->pfnSetSize = vdIOIntSetSize;
5180 pIfIoInt->pfnReadUser = vdIOIntReadUser;
5181 pIfIoInt->pfnWriteUser = vdIOIntWriteUser;
5182 pIfIoInt->pfnReadMeta = vdIOIntReadMeta;
5183 pIfIoInt->pfnWriteMeta = vdIOIntWriteMeta;
5184 pIfIoInt->pfnMetaXferRelease = vdIOIntMetaXferRelease;
5185 pIfIoInt->pfnFlush = vdIOIntFlush;
5186 pIfIoInt->pfnIoCtxCopyFrom = vdIOIntIoCtxCopyFrom;
5187 pIfIoInt->pfnIoCtxCopyTo = vdIOIntIoCtxCopyTo;
5188 pIfIoInt->pfnIoCtxSet = vdIOIntIoCtxSet;
5189 pIfIoInt->pfnIoCtxSegArrayCreate = vdIOIntIoCtxSegArrayCreate;
5190 pIfIoInt->pfnIoCtxCompleted = vdIOIntIoCtxCompleted;
5191 pIfIoInt->pfnIoCtxIsSynchronous = vdIOIntIoCtxIsSynchronous;
5192 pIfIoInt->pfnIoCtxIsZero = vdIOIntIoCtxIsZero;
5193}
5194
5195/**
5196 * Internally used completion handler for synchronous I/O contexts.
5197 */
5198static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq)
5199{
5200 PVBOXHDD pDisk = (PVBOXHDD)pvUser1;
5201 RTSEMEVENT hEvent = (RTSEMEVENT)pvUser2;
5202
5203 RTSemEventSignal(hEvent);
5204}
5205
5206/**
5207 * Initializes HDD backends.
5208 *
5209 * @returns VBox status code.
5210 */
5211VBOXDDU_DECL(int) VDInit(void)
5212{
5213 int rc = vdAddBackends(aStaticBackends, RT_ELEMENTS(aStaticBackends));
5214 if (RT_SUCCESS(rc))
5215 {
5216 rc = vdAddCacheBackends(aStaticCacheBackends, RT_ELEMENTS(aStaticCacheBackends));
5217 if (RT_SUCCESS(rc))
5218 {
5219 RTListInit(&g_ListPluginsLoaded);
5220 rc = vdLoadDynamicBackends();
5221 }
5222 }
5223 LogRel(("VDInit finished\n"));
5224 return rc;
5225}
5226
5227/**
5228 * Destroys loaded HDD backends.
5229 *
5230 * @returns VBox status code.
5231 */
5232VBOXDDU_DECL(int) VDShutdown(void)
5233{
5234 PCVBOXHDDBACKEND *pBackends = g_apBackends;
5235 PCVDCACHEBACKEND *pCacheBackends = g_apCacheBackends;
5236 unsigned cBackends = g_cBackends;
5237
5238 if (!g_apBackends)
5239 return VERR_INTERNAL_ERROR;
5240
5241 if (g_apCacheBackends)
5242 RTMemFree(g_apCacheBackends);
5243 RTMemFree(g_apBackends);
5244
5245 g_cBackends = 0;
5246 g_apBackends = NULL;
5247
5248 /* Clear the supported cache backends. */
5249 g_cCacheBackends = 0;
5250 g_apCacheBackends = NULL;
5251
5252#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
5253 PVDPLUGIN pPlugin, pPluginNext;
5254
5255 RTListForEachSafe(&g_ListPluginsLoaded, pPlugin, pPluginNext, VDPLUGIN, NodePlugin)
5256 {
5257 RTLdrClose(pPlugin->hPlugin);
5258 RTListNodeRemove(&pPlugin->NodePlugin);
5259 RTMemFree(pPlugin);
5260 }
5261#endif
5262
5263 return VINF_SUCCESS;
5264}
5265
5266
5267/**
5268 * Lists all HDD backends and their capabilities in a caller-provided buffer.
5269 *
5270 * @returns VBox status code.
5271 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5272 * @param cEntriesAlloc Number of list entries available.
5273 * @param pEntries Pointer to array for the entries.
5274 * @param pcEntriesUsed Number of entries returned.
5275 */
5276VBOXDDU_DECL(int) VDBackendInfo(unsigned cEntriesAlloc, PVDBACKENDINFO pEntries,
5277 unsigned *pcEntriesUsed)
5278{
5279 int rc = VINF_SUCCESS;
5280 PRTDIR pPluginDir = NULL;
5281 unsigned cEntries = 0;
5282
5283 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5284 /* Check arguments. */
5285 AssertMsgReturn(cEntriesAlloc,
5286 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5287 VERR_INVALID_PARAMETER);
5288 AssertMsgReturn(VALID_PTR(pEntries),
5289 ("pEntries=%#p\n", pEntries),
5290 VERR_INVALID_PARAMETER);
5291 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5292 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5293 VERR_INVALID_PARAMETER);
5294 if (!g_apBackends)
5295 VDInit();
5296
5297 if (cEntriesAlloc < g_cBackends)
5298 {
5299 *pcEntriesUsed = g_cBackends;
5300 return VERR_BUFFER_OVERFLOW;
5301 }
5302
5303 for (unsigned i = 0; i < g_cBackends; i++)
5304 {
5305 pEntries[i].pszBackend = g_apBackends[i]->pszBackendName;
5306 pEntries[i].uBackendCaps = g_apBackends[i]->uBackendCaps;
5307 pEntries[i].paFileExtensions = g_apBackends[i]->paFileExtensions;
5308 pEntries[i].paConfigInfo = g_apBackends[i]->paConfigInfo;
5309 pEntries[i].pfnComposeLocation = g_apBackends[i]->pfnComposeLocation;
5310 pEntries[i].pfnComposeName = g_apBackends[i]->pfnComposeName;
5311 }
5312
5313 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cEntries));
5314 *pcEntriesUsed = g_cBackends;
5315 return rc;
5316}
5317
5318/**
5319 * Lists the capabilities of a backend identified by its name.
5320 *
5321 * @returns VBox status code.
5322 * @param pszBackend The backend name.
5323 * @param pEntries Pointer to an entry.
5324 */
5325VBOXDDU_DECL(int) VDBackendInfoOne(const char *pszBackend, PVDBACKENDINFO pEntry)
5326{
5327 LogFlowFunc(("pszBackend=%#p pEntry=%#p\n", pszBackend, pEntry));
5328 /* Check arguments. */
5329 AssertMsgReturn(VALID_PTR(pszBackend),
5330 ("pszBackend=%#p\n", pszBackend),
5331 VERR_INVALID_PARAMETER);
5332 AssertMsgReturn(VALID_PTR(pEntry),
5333 ("pEntry=%#p\n", pEntry),
5334 VERR_INVALID_PARAMETER);
5335 if (!g_apBackends)
5336 VDInit();
5337
5338 /* Go through loaded backends. */
5339 for (unsigned i = 0; i < g_cBackends; i++)
5340 {
5341 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
5342 {
5343 pEntry->pszBackend = g_apBackends[i]->pszBackendName;
5344 pEntry->uBackendCaps = g_apBackends[i]->uBackendCaps;
5345 pEntry->paFileExtensions = g_apBackends[i]->paFileExtensions;
5346 pEntry->paConfigInfo = g_apBackends[i]->paConfigInfo;
5347 return VINF_SUCCESS;
5348 }
5349 }
5350
5351 return VERR_NOT_FOUND;
5352}
5353
5354/**
5355 * Allocates and initializes an empty HDD container.
5356 * No image files are opened.
5357 *
5358 * @returns VBox status code.
5359 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5360 * @param enmType Type of the image container.
5361 * @param ppDisk Where to store the reference to HDD container.
5362 */
5363VBOXDDU_DECL(int) VDCreate(PVDINTERFACE pVDIfsDisk, VDTYPE enmType, PVBOXHDD *ppDisk)
5364{
5365 int rc = VINF_SUCCESS;
5366 PVBOXHDD pDisk = NULL;
5367
5368 LogFlowFunc(("pVDIfsDisk=%#p\n", pVDIfsDisk));
5369 do
5370 {
5371 /* Check arguments. */
5372 AssertMsgBreakStmt(VALID_PTR(ppDisk),
5373 ("ppDisk=%#p\n", ppDisk),
5374 rc = VERR_INVALID_PARAMETER);
5375
5376 pDisk = (PVBOXHDD)RTMemAllocZ(sizeof(VBOXHDD));
5377 if (pDisk)
5378 {
5379 pDisk->u32Signature = VBOXHDDDISK_SIGNATURE;
5380 pDisk->enmType = enmType;
5381 pDisk->cImages = 0;
5382 pDisk->pBase = NULL;
5383 pDisk->pLast = NULL;
5384 pDisk->cbSize = 0;
5385 pDisk->PCHSGeometry.cCylinders = 0;
5386 pDisk->PCHSGeometry.cHeads = 0;
5387 pDisk->PCHSGeometry.cSectors = 0;
5388 pDisk->LCHSGeometry.cCylinders = 0;
5389 pDisk->LCHSGeometry.cHeads = 0;
5390 pDisk->LCHSGeometry.cSectors = 0;
5391 pDisk->pVDIfsDisk = pVDIfsDisk;
5392 pDisk->pInterfaceError = NULL;
5393 pDisk->pInterfaceThreadSync = NULL;
5394 pDisk->pIoCtxLockOwner = NULL;
5395 pDisk->pIoCtxHead = NULL;
5396 pDisk->fLocked = false;
5397 pDisk->hMemCacheIoCtx = NIL_RTMEMCACHE;
5398 pDisk->hMemCacheIoTask = NIL_RTMEMCACHE;
5399 pDisk->pFilterHead = NULL;
5400 pDisk->pFilterTail = NULL;
5401
5402 /* Create the I/O ctx cache */
5403 rc = RTMemCacheCreate(&pDisk->hMemCacheIoCtx, sizeof(VDIOCTX), 0, UINT32_MAX,
5404 NULL, NULL, NULL, 0);
5405 if (RT_FAILURE(rc))
5406 break;
5407
5408 /* Create the I/O task cache */
5409 rc = RTMemCacheCreate(&pDisk->hMemCacheIoTask, sizeof(VDIOTASK), 0, UINT32_MAX,
5410 NULL, NULL, NULL, 0);
5411 if (RT_FAILURE(rc))
5412 break;
5413
5414 pDisk->pInterfaceError = VDIfErrorGet(pVDIfsDisk);
5415 pDisk->pInterfaceThreadSync = VDIfThreadSyncGet(pVDIfsDisk);
5416
5417 *ppDisk = pDisk;
5418 }
5419 else
5420 {
5421 rc = VERR_NO_MEMORY;
5422 break;
5423 }
5424 } while (0);
5425
5426 if ( RT_FAILURE(rc)
5427 && pDisk)
5428 {
5429 if (pDisk->hMemCacheIoCtx != NIL_RTMEMCACHE)
5430 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5431 if (pDisk->hMemCacheIoTask != NIL_RTMEMCACHE)
5432 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5433 }
5434
5435 LogFlowFunc(("returns %Rrc (pDisk=%#p)\n", rc, pDisk));
5436 return rc;
5437}
5438
5439/**
5440 * Destroys HDD container.
5441 * If container has opened image files they will be closed.
5442 *
5443 * @returns VBox status code.
5444 * @param pDisk Pointer to HDD container.
5445 */
5446VBOXDDU_DECL(int) VDDestroy(PVBOXHDD pDisk)
5447{
5448 int rc = VINF_SUCCESS;
5449 LogFlowFunc(("pDisk=%#p\n", pDisk));
5450 do
5451 {
5452 /* sanity check */
5453 AssertPtrBreak(pDisk);
5454 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5455 Assert(!pDisk->fLocked);
5456
5457 rc = VDCloseAll(pDisk);
5458 int rc2 = VDFilterRemoveAll(pDisk);
5459 if (RT_SUCCESS(rc))
5460 rc = rc2;
5461
5462 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5463 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5464 RTMemFree(pDisk);
5465 } while (0);
5466 LogFlowFunc(("returns %Rrc\n", rc));
5467 return rc;
5468}
5469
5470/**
5471 * Try to get the backend name which can use this image.
5472 *
5473 * @returns VBox status code.
5474 * VINF_SUCCESS if a plugin was found.
5475 * ppszFormat contains the string which can be used as backend name.
5476 * VERR_NOT_SUPPORTED if no backend was found.
5477 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5478 * @param pVDIfsImage Pointer to the per-image VD interface list.
5479 * @param pszFilename Name of the image file for which the backend is queried.
5480 * @param ppszFormat Receives pointer of the UTF-8 string which contains the format name.
5481 * The returned pointer must be freed using RTStrFree().
5482 */
5483VBOXDDU_DECL(int) VDGetFormat(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
5484 const char *pszFilename, char **ppszFormat, VDTYPE *penmType)
5485{
5486 int rc = VERR_NOT_SUPPORTED;
5487 VDINTERFACEIOINT VDIfIoInt;
5488 VDINTERFACEIO VDIfIoFallback;
5489 PVDINTERFACEIO pInterfaceIo;
5490
5491 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
5492 /* Check arguments. */
5493 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
5494 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5495 VERR_INVALID_PARAMETER);
5496 AssertMsgReturn(VALID_PTR(ppszFormat),
5497 ("ppszFormat=%#p\n", ppszFormat),
5498 VERR_INVALID_PARAMETER);
5499 AssertMsgReturn(VALID_PTR(penmType),
5500 ("penmType=%#p\n", penmType),
5501 VERR_INVALID_PARAMETER);
5502
5503 if (!g_apBackends)
5504 VDInit();
5505
5506 pInterfaceIo = VDIfIoGet(pVDIfsImage);
5507 if (!pInterfaceIo)
5508 {
5509 /*
5510 * Caller doesn't provide an I/O interface, create our own using the
5511 * native file API.
5512 */
5513 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
5514 pInterfaceIo = &VDIfIoFallback;
5515 }
5516
5517 /* Set up the internal I/O interface. */
5518 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
5519 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
5520 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
5521 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
5522 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
5523 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
5524 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
5525 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
5526 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
5527 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
5528 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
5529 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
5530 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
5531 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
5532 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5533 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
5534 AssertRC(rc);
5535
5536 /* Find the backend supporting this file format. */
5537 for (unsigned i = 0; i < g_cBackends; i++)
5538 {
5539 if (g_apBackends[i]->pfnCheckIfValid)
5540 {
5541 rc = g_apBackends[i]->pfnCheckIfValid(pszFilename, pVDIfsDisk,
5542 pVDIfsImage, penmType);
5543 if ( RT_SUCCESS(rc)
5544 /* The correct backend has been found, but there is a small
5545 * incompatibility so that the file cannot be used. Stop here
5546 * and signal success - the actual open will of course fail,
5547 * but that will create a really sensible error message. */
5548 || ( rc != VERR_VD_GEN_INVALID_HEADER
5549 && rc != VERR_VD_VDI_INVALID_HEADER
5550 && rc != VERR_VD_VMDK_INVALID_HEADER
5551 && rc != VERR_VD_ISCSI_INVALID_HEADER
5552 && rc != VERR_VD_VHD_INVALID_HEADER
5553 && rc != VERR_VD_RAW_INVALID_HEADER
5554 && rc != VERR_VD_PARALLELS_INVALID_HEADER
5555 && rc != VERR_VD_DMG_INVALID_HEADER))
5556 {
5557 /* Copy the name into the new string. */
5558 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5559 if (!pszFormat)
5560 {
5561 rc = VERR_NO_MEMORY;
5562 break;
5563 }
5564 *ppszFormat = pszFormat;
5565 /* Do not consider the typical file access errors as success,
5566 * which allows the caller to deal with such issues. */
5567 if ( rc != VERR_ACCESS_DENIED
5568 && rc != VERR_PATH_NOT_FOUND
5569 && rc != VERR_FILE_NOT_FOUND)
5570 rc = VINF_SUCCESS;
5571 break;
5572 }
5573 rc = VERR_NOT_SUPPORTED;
5574 }
5575 }
5576
5577 /* Try the cache backends. */
5578 if (rc == VERR_NOT_SUPPORTED)
5579 {
5580 for (unsigned i = 0; i < g_cCacheBackends; i++)
5581 {
5582 if (g_apCacheBackends[i]->pfnProbe)
5583 {
5584 rc = g_apCacheBackends[i]->pfnProbe(pszFilename, pVDIfsDisk,
5585 pVDIfsImage);
5586 if ( RT_SUCCESS(rc)
5587 || (rc != VERR_VD_GEN_INVALID_HEADER))
5588 {
5589 /* Copy the name into the new string. */
5590 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5591 if (!pszFormat)
5592 {
5593 rc = VERR_NO_MEMORY;
5594 break;
5595 }
5596 *ppszFormat = pszFormat;
5597 rc = VINF_SUCCESS;
5598 break;
5599 }
5600 rc = VERR_NOT_SUPPORTED;
5601 }
5602 }
5603 }
5604
5605 LogFlowFunc(("returns %Rrc *ppszFormat=\"%s\"\n", rc, *ppszFormat));
5606 return rc;
5607}
5608
5609/**
5610 * Opens an image file.
5611 *
5612 * The first opened image file in HDD container must have a base image type,
5613 * others (next opened images) must be a differencing or undo images.
5614 * Linkage is checked for differencing image to be in consistence with the previously opened image.
5615 * When another differencing image is opened and the last image was opened in read/write access
5616 * mode, then the last image is reopened in read-only with deny write sharing mode. This allows
5617 * other processes to use images in read-only mode too.
5618 *
5619 * Note that the image is opened in read-only mode if a read/write open is not possible.
5620 * Use VDIsReadOnly to check open mode.
5621 *
5622 * @returns VBox status code.
5623 * @param pDisk Pointer to HDD container.
5624 * @param pszBackend Name of the image file backend to use.
5625 * @param pszFilename Name of the image file to open.
5626 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5627 * @param pVDIfsImage Pointer to the per-image VD interface list.
5628 */
5629VBOXDDU_DECL(int) VDOpen(PVBOXHDD pDisk, const char *pszBackend,
5630 const char *pszFilename, unsigned uOpenFlags,
5631 PVDINTERFACE pVDIfsImage)
5632{
5633 int rc = VINF_SUCCESS;
5634 int rc2;
5635 bool fLockWrite = false;
5636 PVDIMAGE pImage = NULL;
5637
5638 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsImage=%#p\n",
5639 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsImage));
5640
5641 do
5642 {
5643 /* sanity check */
5644 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5645 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5646
5647 /* Check arguments. */
5648 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5649 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5650 rc = VERR_INVALID_PARAMETER);
5651 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5652 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5653 rc = VERR_INVALID_PARAMETER);
5654 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5655 ("uOpenFlags=%#x\n", uOpenFlags),
5656 rc = VERR_INVALID_PARAMETER);
5657 AssertMsgBreakStmt( !(uOpenFlags & VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS)
5658 || (uOpenFlags & VD_OPEN_FLAGS_READONLY),
5659 ("uOpenFlags=%#x\n", uOpenFlags),
5660 rc = VERR_INVALID_PARAMETER);
5661
5662 /*
5663 * Destroy the current discard state first which might still have pending blocks
5664 * for the currently opened image which will be switched to readonly mode.
5665 */
5666 /* Lock disk for writing, as we modify pDisk information below. */
5667 rc2 = vdThreadStartWrite(pDisk);
5668 AssertRC(rc2);
5669 fLockWrite = true;
5670 rc = vdDiscardStateDestroy(pDisk);
5671 if (RT_FAILURE(rc))
5672 break;
5673 rc2 = vdThreadFinishWrite(pDisk);
5674 AssertRC(rc2);
5675 fLockWrite = false;
5676
5677 /* Set up image descriptor. */
5678 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
5679 if (!pImage)
5680 {
5681 rc = VERR_NO_MEMORY;
5682 break;
5683 }
5684 pImage->pszFilename = RTStrDup(pszFilename);
5685 if (!pImage->pszFilename)
5686 {
5687 rc = VERR_NO_MEMORY;
5688 break;
5689 }
5690
5691 pImage->VDIo.pDisk = pDisk;
5692 pImage->pVDIfsImage = pVDIfsImage;
5693
5694 rc = vdFindBackend(pszBackend, &pImage->Backend);
5695 if (RT_FAILURE(rc))
5696 break;
5697 if (!pImage->Backend)
5698 {
5699 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5700 N_("VD: unknown backend name '%s'"), pszBackend);
5701 break;
5702 }
5703
5704 /*
5705 * Fail if the backend can't do async I/O but the
5706 * flag is set.
5707 */
5708 if ( !(pImage->Backend->uBackendCaps & VD_CAP_ASYNC)
5709 && (uOpenFlags & VD_OPEN_FLAGS_ASYNC_IO))
5710 {
5711 rc = vdError(pDisk, VERR_NOT_SUPPORTED, RT_SRC_POS,
5712 N_("VD: Backend '%s' does not support async I/O"), pszBackend);
5713 break;
5714 }
5715
5716 /*
5717 * Fail if the backend doesn't support the discard operation but the
5718 * flag is set.
5719 */
5720 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DISCARD)
5721 && (uOpenFlags & VD_OPEN_FLAGS_DISCARD))
5722 {
5723 rc = vdError(pDisk, VERR_VD_DISCARD_NOT_SUPPORTED, RT_SRC_POS,
5724 N_("VD: Backend '%s' does not support discard"), pszBackend);
5725 break;
5726 }
5727
5728 /* Set up the I/O interface. */
5729 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
5730 if (!pImage->VDIo.pInterfaceIo)
5731 {
5732 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
5733 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
5734 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
5735 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
5736 }
5737
5738 /* Set up the internal I/O interface. */
5739 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
5740 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
5741 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5742 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
5743 AssertRC(rc);
5744
5745 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
5746 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
5747 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5748 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5749 pDisk->pVDIfsDisk,
5750 pImage->pVDIfsImage,
5751 pDisk->enmType,
5752 &pImage->pBackendData);
5753 /*
5754 * If the image is corrupted and there is a repair method try to repair it
5755 * first if it was openend in read-write mode and open again afterwards.
5756 */
5757 if ( RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED)
5758 && !(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5759 && pImage->Backend->pfnRepair)
5760 {
5761 rc = pImage->Backend->pfnRepair(pszFilename, pDisk->pVDIfsDisk, pImage->pVDIfsImage, 0 /* fFlags */);
5762 if (RT_SUCCESS(rc))
5763 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5764 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5765 pDisk->pVDIfsDisk,
5766 pImage->pVDIfsImage,
5767 pDisk->enmType,
5768 &pImage->pBackendData);
5769 else
5770 {
5771 rc = vdError(pDisk, rc, RT_SRC_POS,
5772 N_("VD: error %Rrc repairing corrupted image file '%s'"), rc, pszFilename);
5773 break;
5774 }
5775 }
5776 else if (RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED))
5777 {
5778 rc = vdError(pDisk, rc, RT_SRC_POS,
5779 N_("VD: Image file '%s' is corrupted and can't be opened"), pszFilename);
5780 break;
5781 }
5782
5783 /* If the open in read-write mode failed, retry in read-only mode. */
5784 if (RT_FAILURE(rc))
5785 {
5786 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5787 && ( rc == VERR_ACCESS_DENIED
5788 || rc == VERR_PERMISSION_DENIED
5789 || rc == VERR_WRITE_PROTECT
5790 || rc == VERR_SHARING_VIOLATION
5791 || rc == VERR_FILE_LOCK_FAILED))
5792 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5793 (uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS))
5794 | VD_OPEN_FLAGS_READONLY,
5795 pDisk->pVDIfsDisk,
5796 pImage->pVDIfsImage,
5797 pDisk->enmType,
5798 &pImage->pBackendData);
5799 if (RT_FAILURE(rc))
5800 {
5801 rc = vdError(pDisk, rc, RT_SRC_POS,
5802 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
5803 break;
5804 }
5805 }
5806
5807 /* Lock disk for writing, as we modify pDisk information below. */
5808 rc2 = vdThreadStartWrite(pDisk);
5809 AssertRC(rc2);
5810 fLockWrite = true;
5811
5812 pImage->VDIo.pBackendData = pImage->pBackendData;
5813
5814 /* Check image type. As the image itself has only partial knowledge
5815 * whether it's a base image or not, this info is derived here. The
5816 * base image can be fixed or normal, all others must be normal or
5817 * diff images. Some image formats don't distinguish between normal
5818 * and diff images, so this must be corrected here. */
5819 unsigned uImageFlags;
5820 uImageFlags = pImage->Backend->pfnGetImageFlags(pImage->pBackendData);
5821 if (RT_FAILURE(rc))
5822 uImageFlags = VD_IMAGE_FLAGS_NONE;
5823 if ( RT_SUCCESS(rc)
5824 && !(uOpenFlags & VD_OPEN_FLAGS_INFO))
5825 {
5826 if ( pDisk->cImages == 0
5827 && (uImageFlags & VD_IMAGE_FLAGS_DIFF))
5828 {
5829 rc = VERR_VD_INVALID_TYPE;
5830 break;
5831 }
5832 else if (pDisk->cImages != 0)
5833 {
5834 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5835 {
5836 rc = VERR_VD_INVALID_TYPE;
5837 break;
5838 }
5839 else
5840 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5841 }
5842 }
5843
5844 /* Ensure we always get correct diff information, even if the backend
5845 * doesn't actually have a stored flag for this. It must not return
5846 * bogus information for the parent UUID if it is not a diff image. */
5847 RTUUID parentUuid;
5848 RTUuidClear(&parentUuid);
5849 rc2 = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, &parentUuid);
5850 if (RT_SUCCESS(rc2) && !RTUuidIsNull(&parentUuid))
5851 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5852
5853 pImage->uImageFlags = uImageFlags;
5854
5855 /* Force sane optimization settings. It's not worth avoiding writes
5856 * to fixed size images. The overhead would have almost no payback. */
5857 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5858 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
5859
5860 /** @todo optionally check UUIDs */
5861
5862 /* Cache disk information. */
5863 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
5864
5865 /* Cache PCHS geometry. */
5866 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
5867 &pDisk->PCHSGeometry);
5868 if (RT_FAILURE(rc2))
5869 {
5870 pDisk->PCHSGeometry.cCylinders = 0;
5871 pDisk->PCHSGeometry.cHeads = 0;
5872 pDisk->PCHSGeometry.cSectors = 0;
5873 }
5874 else
5875 {
5876 /* Make sure the PCHS geometry is properly clipped. */
5877 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
5878 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
5879 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
5880 }
5881
5882 /* Cache LCHS geometry. */
5883 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
5884 &pDisk->LCHSGeometry);
5885 if (RT_FAILURE(rc2))
5886 {
5887 pDisk->LCHSGeometry.cCylinders = 0;
5888 pDisk->LCHSGeometry.cHeads = 0;
5889 pDisk->LCHSGeometry.cSectors = 0;
5890 }
5891 else
5892 {
5893 /* Make sure the LCHS geometry is properly clipped. */
5894 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
5895 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
5896 }
5897
5898 if (pDisk->cImages != 0)
5899 {
5900 /* Switch previous image to read-only mode. */
5901 unsigned uOpenFlagsPrevImg;
5902 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
5903 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
5904 {
5905 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
5906 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
5907 }
5908 }
5909
5910 if (RT_SUCCESS(rc))
5911 {
5912 /* Image successfully opened, make it the last image. */
5913 vdAddImageToList(pDisk, pImage);
5914 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
5915 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
5916 }
5917 else
5918 {
5919 /* Error detected, but image opened. Close image. */
5920 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
5921 AssertRC(rc2);
5922 pImage->pBackendData = NULL;
5923 }
5924 } while (0);
5925
5926 if (RT_UNLIKELY(fLockWrite))
5927 {
5928 rc2 = vdThreadFinishWrite(pDisk);
5929 AssertRC(rc2);
5930 }
5931
5932 if (RT_FAILURE(rc))
5933 {
5934 if (pImage)
5935 {
5936 if (pImage->pszFilename)
5937 RTStrFree(pImage->pszFilename);
5938 RTMemFree(pImage);
5939 }
5940 }
5941
5942 LogFlowFunc(("returns %Rrc\n", rc));
5943 return rc;
5944}
5945
5946/**
5947 * Opens a cache image.
5948 *
5949 * @return VBox status code.
5950 * @param pDisk Pointer to the HDD container which should use the cache image.
5951 * @param pszBackend Name of the cache file backend to use (case insensitive).
5952 * @param pszFilename Name of the cache image to open.
5953 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5954 * @param pVDIfsCache Pointer to the per-cache VD interface list.
5955 */
5956VBOXDDU_DECL(int) VDCacheOpen(PVBOXHDD pDisk, const char *pszBackend,
5957 const char *pszFilename, unsigned uOpenFlags,
5958 PVDINTERFACE pVDIfsCache)
5959{
5960 int rc = VINF_SUCCESS;
5961 int rc2;
5962 bool fLockWrite = false;
5963 PVDCACHE pCache = NULL;
5964
5965 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsCache=%#p\n",
5966 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsCache));
5967
5968 do
5969 {
5970 /* sanity check */
5971 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5972 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5973
5974 /* Check arguments. */
5975 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5976 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5977 rc = VERR_INVALID_PARAMETER);
5978 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5979 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5980 rc = VERR_INVALID_PARAMETER);
5981 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5982 ("uOpenFlags=%#x\n", uOpenFlags),
5983 rc = VERR_INVALID_PARAMETER);
5984
5985 /* Set up image descriptor. */
5986 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
5987 if (!pCache)
5988 {
5989 rc = VERR_NO_MEMORY;
5990 break;
5991 }
5992 pCache->pszFilename = RTStrDup(pszFilename);
5993 if (!pCache->pszFilename)
5994 {
5995 rc = VERR_NO_MEMORY;
5996 break;
5997 }
5998
5999 pCache->VDIo.pDisk = pDisk;
6000 pCache->pVDIfsCache = pVDIfsCache;
6001
6002 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
6003 if (RT_FAILURE(rc))
6004 break;
6005 if (!pCache->Backend)
6006 {
6007 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6008 N_("VD: unknown backend name '%s'"), pszBackend);
6009 break;
6010 }
6011
6012 /* Set up the I/O interface. */
6013 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
6014 if (!pCache->VDIo.pInterfaceIo)
6015 {
6016 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
6017 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6018 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
6019 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
6020 }
6021
6022 /* Set up the internal I/O interface. */
6023 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
6024 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
6025 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6026 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
6027 AssertRC(rc);
6028
6029 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6030 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
6031 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6032 pDisk->pVDIfsDisk,
6033 pCache->pVDIfsCache,
6034 &pCache->pBackendData);
6035 /* If the open in read-write mode failed, retry in read-only mode. */
6036 if (RT_FAILURE(rc))
6037 {
6038 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
6039 && ( rc == VERR_ACCESS_DENIED
6040 || rc == VERR_PERMISSION_DENIED
6041 || rc == VERR_WRITE_PROTECT
6042 || rc == VERR_SHARING_VIOLATION
6043 || rc == VERR_FILE_LOCK_FAILED))
6044 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
6045 (uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME)
6046 | VD_OPEN_FLAGS_READONLY,
6047 pDisk->pVDIfsDisk,
6048 pCache->pVDIfsCache,
6049 &pCache->pBackendData);
6050 if (RT_FAILURE(rc))
6051 {
6052 rc = vdError(pDisk, rc, RT_SRC_POS,
6053 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
6054 break;
6055 }
6056 }
6057
6058 /* Lock disk for writing, as we modify pDisk information below. */
6059 rc2 = vdThreadStartWrite(pDisk);
6060 AssertRC(rc2);
6061 fLockWrite = true;
6062
6063 /*
6064 * Check that the modification UUID of the cache and last image
6065 * match. If not the image was modified in-between without the cache.
6066 * The cache might contain stale data.
6067 */
6068 RTUUID UuidImage, UuidCache;
6069
6070 rc = pCache->Backend->pfnGetModificationUuid(pCache->pBackendData,
6071 &UuidCache);
6072 if (RT_SUCCESS(rc))
6073 {
6074 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6075 &UuidImage);
6076 if (RT_SUCCESS(rc))
6077 {
6078 if (RTUuidCompare(&UuidImage, &UuidCache))
6079 rc = VERR_VD_CACHE_NOT_UP_TO_DATE;
6080 }
6081 }
6082
6083 /*
6084 * We assume that the user knows what he is doing if one of the images
6085 * doesn't support the modification uuid.
6086 */
6087 if (rc == VERR_NOT_SUPPORTED)
6088 rc = VINF_SUCCESS;
6089
6090 if (RT_SUCCESS(rc))
6091 {
6092 /* Cache successfully opened, make it the current one. */
6093 if (!pDisk->pCache)
6094 pDisk->pCache = pCache;
6095 else
6096 rc = VERR_VD_CACHE_ALREADY_EXISTS;
6097 }
6098
6099 if (RT_FAILURE(rc))
6100 {
6101 /* Error detected, but image opened. Close image. */
6102 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
6103 AssertRC(rc2);
6104 pCache->pBackendData = NULL;
6105 }
6106 } while (0);
6107
6108 if (RT_UNLIKELY(fLockWrite))
6109 {
6110 rc2 = vdThreadFinishWrite(pDisk);
6111 AssertRC(rc2);
6112 }
6113
6114 if (RT_FAILURE(rc))
6115 {
6116 if (pCache)
6117 {
6118 if (pCache->pszFilename)
6119 RTStrFree(pCache->pszFilename);
6120 RTMemFree(pCache);
6121 }
6122 }
6123
6124 LogFlowFunc(("returns %Rrc\n", rc));
6125 return rc;
6126}
6127
6128/**
6129 * Adds a filter to the disk.
6130 *
6131 * @returns VBox status code.
6132 * @param pDisk Pointer to the HDD container which should use the filter.
6133 * @param pszFilter Name of the filter backend to use (case insensitive).
6134 * @param pVDIfsFilter Pointer to the per-filter VD interface list.
6135 */
6136VBOXDDU_DECL(int) VDFilterAdd(PVBOXHDD pDisk, const char *pszFilter,
6137 PVDINTERFACE pVDIfsFilter)
6138{
6139 int rc = VINF_SUCCESS;
6140 int rc2;
6141 bool fLockWrite = false;
6142 PVDFILTER pFilter = NULL;
6143
6144 LogFlowFunc(("pDisk=%#p pszFilter=\"%s\" pVDIfsFilter=%#p\n",
6145 pDisk, pszFilter, pVDIfsFilter));
6146
6147 do
6148 {
6149 /* sanity check */
6150 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6151 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6152
6153 /* Check arguments. */
6154 AssertMsgBreakStmt(VALID_PTR(pszFilter) && *pszFilter,
6155 ("pszFilter=%#p \"%s\"\n", pszFilter, pszFilter),
6156 rc = VERR_INVALID_PARAMETER);
6157
6158 /* Set up image descriptor. */
6159 pFilter = (PVDFILTER)RTMemAllocZ(sizeof(VDFILTER));
6160 if (!pFilter)
6161 {
6162 rc = VERR_NO_MEMORY;
6163 break;
6164 }
6165
6166 rc = vdFindFilterBackend(pszFilter, &pFilter->pBackend);
6167 if (RT_FAILURE(rc))
6168 break;
6169 if (!pFilter->pBackend)
6170 {
6171 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6172 N_("VD: unknown filter backend name '%s'"), pszFilter);
6173 break;
6174 }
6175
6176 rc = pFilter->pBackend->pfnCreate(pDisk->pVDIfsDisk, pVDIfsFilter,
6177 &pFilter->pvBackendData);
6178
6179 /* If the open in read-write mode failed, retry in read-only mode. */
6180 if (RT_FAILURE(rc))
6181 {
6182 rc = vdError(pDisk, rc, RT_SRC_POS,
6183 N_("VD: error %Rrc creating filter '%s'"), rc, pszFilter);
6184 break;
6185 }
6186
6187 /* Lock disk for writing, as we modify pDisk information below. */
6188 rc2 = vdThreadStartWrite(pDisk);
6189 AssertRC(rc2);
6190 fLockWrite = true;
6191
6192 /* Add filter to chain. */
6193 vdAddFilterToList(pDisk, pFilter);
6194 } while (0);
6195
6196 if (RT_UNLIKELY(fLockWrite))
6197 {
6198 rc2 = vdThreadFinishWrite(pDisk);
6199 AssertRC(rc2);
6200 }
6201
6202 if (RT_FAILURE(rc))
6203 {
6204 if (pFilter)
6205 RTMemFree(pFilter);
6206 }
6207
6208 LogFlowFunc(("returns %Rrc\n", rc));
6209 return rc;
6210}
6211
6212/**
6213 * Creates and opens a new base image file.
6214 *
6215 * @returns VBox status code.
6216 * @param pDisk Pointer to HDD container.
6217 * @param pszBackend Name of the image file backend to use.
6218 * @param pszFilename Name of the image file to create.
6219 * @param cbSize Image size in bytes.
6220 * @param uImageFlags Flags specifying special image features.
6221 * @param pszComment Pointer to image comment. NULL is ok.
6222 * @param pPCHSGeometry Pointer to physical disk geometry <= (16383,16,63). Not NULL.
6223 * @param pLCHSGeometry Pointer to logical disk geometry <= (x,255,63). Not NULL.
6224 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6225 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6226 * @param pVDIfsImage Pointer to the per-image VD interface list.
6227 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6228 */
6229VBOXDDU_DECL(int) VDCreateBase(PVBOXHDD pDisk, const char *pszBackend,
6230 const char *pszFilename, uint64_t cbSize,
6231 unsigned uImageFlags, const char *pszComment,
6232 PCVDGEOMETRY pPCHSGeometry,
6233 PCVDGEOMETRY pLCHSGeometry,
6234 PCRTUUID pUuid, unsigned uOpenFlags,
6235 PVDINTERFACE pVDIfsImage,
6236 PVDINTERFACE pVDIfsOperation)
6237{
6238 int rc = VINF_SUCCESS;
6239 int rc2;
6240 bool fLockWrite = false, fLockRead = false;
6241 PVDIMAGE pImage = NULL;
6242 RTUUID uuid;
6243
6244 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" PCHS=%u/%u/%u LCHS=%u/%u/%u Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6245 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment,
6246 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6247 pPCHSGeometry->cSectors, pLCHSGeometry->cCylinders,
6248 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors, pUuid,
6249 uOpenFlags, pVDIfsImage, pVDIfsOperation));
6250
6251 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6252
6253 do
6254 {
6255 /* sanity check */
6256 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6257 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6258
6259 /* Check arguments. */
6260 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6261 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6262 rc = VERR_INVALID_PARAMETER);
6263 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6264 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6265 rc = VERR_INVALID_PARAMETER);
6266 AssertMsgBreakStmt(cbSize,
6267 ("cbSize=%llu\n", cbSize),
6268 rc = VERR_INVALID_PARAMETER);
6269 AssertMsgBreakStmt( ((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0)
6270 || ((uImageFlags & (VD_IMAGE_FLAGS_FIXED | VD_IMAGE_FLAGS_DIFF)) != VD_IMAGE_FLAGS_FIXED),
6271 ("uImageFlags=%#x\n", uImageFlags),
6272 rc = VERR_INVALID_PARAMETER);
6273 /* The PCHS geometry fields may be 0 to leave it for later. */
6274 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
6275 && pPCHSGeometry->cHeads <= 16
6276 && pPCHSGeometry->cSectors <= 63,
6277 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
6278 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6279 pPCHSGeometry->cSectors),
6280 rc = VERR_INVALID_PARAMETER);
6281 /* The LCHS geometry fields may be 0 to leave it to later autodetection. */
6282 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
6283 && pLCHSGeometry->cHeads <= 255
6284 && pLCHSGeometry->cSectors <= 63,
6285 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
6286 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
6287 pLCHSGeometry->cSectors),
6288 rc = VERR_INVALID_PARAMETER);
6289 /* The UUID may be NULL. */
6290 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6291 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6292 rc = VERR_INVALID_PARAMETER);
6293 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6294 ("uOpenFlags=%#x\n", uOpenFlags),
6295 rc = VERR_INVALID_PARAMETER);
6296
6297 /* Check state. Needs a temporary read lock. Holding the write lock
6298 * all the time would be blocking other activities for too long. */
6299 rc2 = vdThreadStartRead(pDisk);
6300 AssertRC(rc2);
6301 fLockRead = true;
6302 AssertMsgBreakStmt(pDisk->cImages == 0,
6303 ("Create base image cannot be done with other images open\n"),
6304 rc = VERR_VD_INVALID_STATE);
6305 rc2 = vdThreadFinishRead(pDisk);
6306 AssertRC(rc2);
6307 fLockRead = false;
6308
6309 /* Set up image descriptor. */
6310 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6311 if (!pImage)
6312 {
6313 rc = VERR_NO_MEMORY;
6314 break;
6315 }
6316 pImage->pszFilename = RTStrDup(pszFilename);
6317 if (!pImage->pszFilename)
6318 {
6319 rc = VERR_NO_MEMORY;
6320 break;
6321 }
6322 pImage->VDIo.pDisk = pDisk;
6323 pImage->pVDIfsImage = pVDIfsImage;
6324
6325 /* Set up the I/O interface. */
6326 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6327 if (!pImage->VDIo.pInterfaceIo)
6328 {
6329 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6330 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6331 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6332 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6333 }
6334
6335 /* Set up the internal I/O interface. */
6336 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6337 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6338 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6339 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6340 AssertRC(rc);
6341
6342 rc = vdFindBackend(pszBackend, &pImage->Backend);
6343 if (RT_FAILURE(rc))
6344 break;
6345 if (!pImage->Backend)
6346 {
6347 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6348 N_("VD: unknown backend name '%s'"), pszBackend);
6349 break;
6350 }
6351 if (!(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6352 | VD_CAP_CREATE_DYNAMIC)))
6353 {
6354 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6355 N_("VD: backend '%s' cannot create base images"), pszBackend);
6356 break;
6357 }
6358
6359 /* Create UUID if the caller didn't specify one. */
6360 if (!pUuid)
6361 {
6362 rc = RTUuidCreate(&uuid);
6363 if (RT_FAILURE(rc))
6364 {
6365 rc = vdError(pDisk, rc, RT_SRC_POS,
6366 N_("VD: cannot generate UUID for image '%s'"),
6367 pszFilename);
6368 break;
6369 }
6370 pUuid = &uuid;
6371 }
6372
6373 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6374 uImageFlags &= ~VD_IMAGE_FLAGS_DIFF;
6375 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6376 rc = pImage->Backend->pfnCreate(pImage->pszFilename, cbSize,
6377 uImageFlags, pszComment, pPCHSGeometry,
6378 pLCHSGeometry, pUuid,
6379 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6380 0, 99,
6381 pDisk->pVDIfsDisk,
6382 pImage->pVDIfsImage,
6383 pVDIfsOperation,
6384 &pImage->pBackendData);
6385
6386 if (RT_SUCCESS(rc))
6387 {
6388 pImage->VDIo.pBackendData = pImage->pBackendData;
6389 pImage->uImageFlags = uImageFlags;
6390
6391 /* Force sane optimization settings. It's not worth avoiding writes
6392 * to fixed size images. The overhead would have almost no payback. */
6393 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6394 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
6395
6396 /* Lock disk for writing, as we modify pDisk information below. */
6397 rc2 = vdThreadStartWrite(pDisk);
6398 AssertRC(rc2);
6399 fLockWrite = true;
6400
6401 /** @todo optionally check UUIDs */
6402
6403 /* Re-check state, as the lock wasn't held and another image
6404 * creation call could have been done by another thread. */
6405 AssertMsgStmt(pDisk->cImages == 0,
6406 ("Create base image cannot be done with other images open\n"),
6407 rc = VERR_VD_INVALID_STATE);
6408 }
6409
6410 if (RT_SUCCESS(rc))
6411 {
6412 /* Cache disk information. */
6413 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
6414
6415 /* Cache PCHS geometry. */
6416 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
6417 &pDisk->PCHSGeometry);
6418 if (RT_FAILURE(rc2))
6419 {
6420 pDisk->PCHSGeometry.cCylinders = 0;
6421 pDisk->PCHSGeometry.cHeads = 0;
6422 pDisk->PCHSGeometry.cSectors = 0;
6423 }
6424 else
6425 {
6426 /* Make sure the CHS geometry is properly clipped. */
6427 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
6428 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
6429 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
6430 }
6431
6432 /* Cache LCHS geometry. */
6433 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
6434 &pDisk->LCHSGeometry);
6435 if (RT_FAILURE(rc2))
6436 {
6437 pDisk->LCHSGeometry.cCylinders = 0;
6438 pDisk->LCHSGeometry.cHeads = 0;
6439 pDisk->LCHSGeometry.cSectors = 0;
6440 }
6441 else
6442 {
6443 /* Make sure the CHS geometry is properly clipped. */
6444 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
6445 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
6446 }
6447
6448 /* Image successfully opened, make it the last image. */
6449 vdAddImageToList(pDisk, pImage);
6450 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6451 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6452 }
6453 else
6454 {
6455 /* Error detected, image may or may not be opened. Close and delete
6456 * image if it was opened. */
6457 if (pImage->pBackendData)
6458 {
6459 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6460 AssertRC(rc2);
6461 pImage->pBackendData = NULL;
6462 }
6463 }
6464 } while (0);
6465
6466 if (RT_UNLIKELY(fLockWrite))
6467 {
6468 rc2 = vdThreadFinishWrite(pDisk);
6469 AssertRC(rc2);
6470 }
6471 else if (RT_UNLIKELY(fLockRead))
6472 {
6473 rc2 = vdThreadFinishRead(pDisk);
6474 AssertRC(rc2);
6475 }
6476
6477 if (RT_FAILURE(rc))
6478 {
6479 if (pImage)
6480 {
6481 if (pImage->pszFilename)
6482 RTStrFree(pImage->pszFilename);
6483 RTMemFree(pImage);
6484 }
6485 }
6486
6487 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6488 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6489
6490 LogFlowFunc(("returns %Rrc\n", rc));
6491 return rc;
6492}
6493
6494/**
6495 * Creates and opens a new differencing image file in HDD container.
6496 * See comments for VDOpen function about differencing images.
6497 *
6498 * @returns VBox status code.
6499 * @param pDisk Pointer to HDD container.
6500 * @param pszBackend Name of the image file backend to use.
6501 * @param pszFilename Name of the differencing image file to create.
6502 * @param uImageFlags Flags specifying special image features.
6503 * @param pszComment Pointer to image comment. NULL is ok.
6504 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6505 * @param pParentUuid New parent UUID of the image. If NULL, the UUID is queried automatically.
6506 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6507 * @param pVDIfsImage Pointer to the per-image VD interface list.
6508 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6509 */
6510VBOXDDU_DECL(int) VDCreateDiff(PVBOXHDD pDisk, const char *pszBackend,
6511 const char *pszFilename, unsigned uImageFlags,
6512 const char *pszComment, PCRTUUID pUuid,
6513 PCRTUUID pParentUuid, unsigned uOpenFlags,
6514 PVDINTERFACE pVDIfsImage,
6515 PVDINTERFACE pVDIfsOperation)
6516{
6517 int rc = VINF_SUCCESS;
6518 int rc2;
6519 bool fLockWrite = false, fLockRead = false;
6520 PVDIMAGE pImage = NULL;
6521 RTUUID uuid;
6522
6523 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6524 pDisk, pszBackend, pszFilename, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsImage, pVDIfsOperation));
6525
6526 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6527
6528 do
6529 {
6530 /* sanity check */
6531 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6532 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6533
6534 /* Check arguments. */
6535 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6536 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6537 rc = VERR_INVALID_PARAMETER);
6538 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6539 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6540 rc = VERR_INVALID_PARAMETER);
6541 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6542 ("uImageFlags=%#x\n", uImageFlags),
6543 rc = VERR_INVALID_PARAMETER);
6544 /* The UUID may be NULL. */
6545 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6546 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6547 rc = VERR_INVALID_PARAMETER);
6548 /* The parent UUID may be NULL. */
6549 AssertMsgBreakStmt(pParentUuid == NULL || VALID_PTR(pParentUuid),
6550 ("pParentUuid=%#p ParentUUID=%RTuuid\n", pParentUuid, pParentUuid),
6551 rc = VERR_INVALID_PARAMETER);
6552 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6553 ("uOpenFlags=%#x\n", uOpenFlags),
6554 rc = VERR_INVALID_PARAMETER);
6555
6556 /* Check state. Needs a temporary read lock. Holding the write lock
6557 * all the time would be blocking other activities for too long. */
6558 rc2 = vdThreadStartRead(pDisk);
6559 AssertRC(rc2);
6560 fLockRead = true;
6561 AssertMsgBreakStmt(pDisk->cImages != 0,
6562 ("Create diff image cannot be done without other images open\n"),
6563 rc = VERR_VD_INVALID_STATE);
6564 rc2 = vdThreadFinishRead(pDisk);
6565 AssertRC(rc2);
6566 fLockRead = false;
6567
6568 /*
6569 * Destroy the current discard state first which might still have pending blocks
6570 * for the currently opened image which will be switched to readonly mode.
6571 */
6572 /* Lock disk for writing, as we modify pDisk information below. */
6573 rc2 = vdThreadStartWrite(pDisk);
6574 AssertRC(rc2);
6575 fLockWrite = true;
6576 rc = vdDiscardStateDestroy(pDisk);
6577 if (RT_FAILURE(rc))
6578 break;
6579 rc2 = vdThreadFinishWrite(pDisk);
6580 AssertRC(rc2);
6581 fLockWrite = false;
6582
6583 /* Set up image descriptor. */
6584 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6585 if (!pImage)
6586 {
6587 rc = VERR_NO_MEMORY;
6588 break;
6589 }
6590 pImage->pszFilename = RTStrDup(pszFilename);
6591 if (!pImage->pszFilename)
6592 {
6593 rc = VERR_NO_MEMORY;
6594 break;
6595 }
6596
6597 rc = vdFindBackend(pszBackend, &pImage->Backend);
6598 if (RT_FAILURE(rc))
6599 break;
6600 if (!pImage->Backend)
6601 {
6602 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6603 N_("VD: unknown backend name '%s'"), pszBackend);
6604 break;
6605 }
6606 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DIFF)
6607 || !(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6608 | VD_CAP_CREATE_DYNAMIC)))
6609 {
6610 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6611 N_("VD: backend '%s' cannot create diff images"), pszBackend);
6612 break;
6613 }
6614
6615 pImage->VDIo.pDisk = pDisk;
6616 pImage->pVDIfsImage = pVDIfsImage;
6617
6618 /* Set up the I/O interface. */
6619 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6620 if (!pImage->VDIo.pInterfaceIo)
6621 {
6622 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6623 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6624 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6625 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6626 }
6627
6628 /* Set up the internal I/O interface. */
6629 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6630 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6631 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6632 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6633 AssertRC(rc);
6634
6635 /* Create UUID if the caller didn't specify one. */
6636 if (!pUuid)
6637 {
6638 rc = RTUuidCreate(&uuid);
6639 if (RT_FAILURE(rc))
6640 {
6641 rc = vdError(pDisk, rc, RT_SRC_POS,
6642 N_("VD: cannot generate UUID for image '%s'"),
6643 pszFilename);
6644 break;
6645 }
6646 pUuid = &uuid;
6647 }
6648
6649 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6650 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6651 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6652 rc = pImage->Backend->pfnCreate(pImage->pszFilename, pDisk->cbSize,
6653 uImageFlags | VD_IMAGE_FLAGS_DIFF,
6654 pszComment, &pDisk->PCHSGeometry,
6655 &pDisk->LCHSGeometry, pUuid,
6656 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6657 0, 99,
6658 pDisk->pVDIfsDisk,
6659 pImage->pVDIfsImage,
6660 pVDIfsOperation,
6661 &pImage->pBackendData);
6662
6663 if (RT_SUCCESS(rc))
6664 {
6665 pImage->VDIo.pBackendData = pImage->pBackendData;
6666 pImage->uImageFlags = uImageFlags;
6667
6668 /* Lock disk for writing, as we modify pDisk information below. */
6669 rc2 = vdThreadStartWrite(pDisk);
6670 AssertRC(rc2);
6671 fLockWrite = true;
6672
6673 /* Switch previous image to read-only mode. */
6674 unsigned uOpenFlagsPrevImg;
6675 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
6676 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
6677 {
6678 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
6679 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
6680 }
6681
6682 /** @todo optionally check UUIDs */
6683
6684 /* Re-check state, as the lock wasn't held and another image
6685 * creation call could have been done by another thread. */
6686 AssertMsgStmt(pDisk->cImages != 0,
6687 ("Create diff image cannot be done without other images open\n"),
6688 rc = VERR_VD_INVALID_STATE);
6689 }
6690
6691 if (RT_SUCCESS(rc))
6692 {
6693 RTUUID Uuid;
6694 RTTIMESPEC ts;
6695
6696 if (pParentUuid && !RTUuidIsNull(pParentUuid))
6697 {
6698 Uuid = *pParentUuid;
6699 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6700 }
6701 else
6702 {
6703 rc2 = pDisk->pLast->Backend->pfnGetUuid(pDisk->pLast->pBackendData,
6704 &Uuid);
6705 if (RT_SUCCESS(rc2))
6706 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6707 }
6708 rc2 = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6709 &Uuid);
6710 if (RT_SUCCESS(rc2))
6711 pImage->Backend->pfnSetParentModificationUuid(pImage->pBackendData,
6712 &Uuid);
6713 if (pDisk->pLast->Backend->pfnGetTimeStamp)
6714 rc2 = pDisk->pLast->Backend->pfnGetTimeStamp(pDisk->pLast->pBackendData,
6715 &ts);
6716 else
6717 rc2 = VERR_NOT_IMPLEMENTED;
6718 if (RT_SUCCESS(rc2) && pImage->Backend->pfnSetParentTimeStamp)
6719 pImage->Backend->pfnSetParentTimeStamp(pImage->pBackendData, &ts);
6720
6721 if (pImage->Backend->pfnSetParentFilename)
6722 rc2 = pImage->Backend->pfnSetParentFilename(pImage->pBackendData, pDisk->pLast->pszFilename);
6723 }
6724
6725 if (RT_SUCCESS(rc))
6726 {
6727 /* Image successfully opened, make it the last image. */
6728 vdAddImageToList(pDisk, pImage);
6729 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6730 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6731 }
6732 else
6733 {
6734 /* Error detected, but image opened. Close and delete image. */
6735 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6736 AssertRC(rc2);
6737 pImage->pBackendData = NULL;
6738 }
6739 } while (0);
6740
6741 if (RT_UNLIKELY(fLockWrite))
6742 {
6743 rc2 = vdThreadFinishWrite(pDisk);
6744 AssertRC(rc2);
6745 }
6746 else if (RT_UNLIKELY(fLockRead))
6747 {
6748 rc2 = vdThreadFinishRead(pDisk);
6749 AssertRC(rc2);
6750 }
6751
6752 if (RT_FAILURE(rc))
6753 {
6754 if (pImage)
6755 {
6756 if (pImage->pszFilename)
6757 RTStrFree(pImage->pszFilename);
6758 RTMemFree(pImage);
6759 }
6760 }
6761
6762 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6763 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6764
6765 LogFlowFunc(("returns %Rrc\n", rc));
6766 return rc;
6767}
6768
6769
6770/**
6771 * Creates and opens new cache image file in HDD container.
6772 *
6773 * @return VBox status code.
6774 * @param pDisk Name of the cache file backend to use (case insensitive).
6775 * @param pszFilename Name of the differencing cache file to create.
6776 * @param cbSize Maximum size of the cache.
6777 * @param uImageFlags Flags specifying special cache features.
6778 * @param pszComment Pointer to image comment. NULL is ok.
6779 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6780 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6781 * @param pVDIfsCache Pointer to the per-cache VD interface list.
6782 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6783 */
6784VBOXDDU_DECL(int) VDCreateCache(PVBOXHDD pDisk, const char *pszBackend,
6785 const char *pszFilename, uint64_t cbSize,
6786 unsigned uImageFlags, const char *pszComment,
6787 PCRTUUID pUuid, unsigned uOpenFlags,
6788 PVDINTERFACE pVDIfsCache, PVDINTERFACE pVDIfsOperation)
6789{
6790 int rc = VINF_SUCCESS;
6791 int rc2;
6792 bool fLockWrite = false, fLockRead = false;
6793 PVDCACHE pCache = NULL;
6794 RTUUID uuid;
6795
6796 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6797 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsCache, pVDIfsOperation));
6798
6799 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6800
6801 do
6802 {
6803 /* sanity check */
6804 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6805 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6806
6807 /* Check arguments. */
6808 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6809 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6810 rc = VERR_INVALID_PARAMETER);
6811 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6812 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6813 rc = VERR_INVALID_PARAMETER);
6814 AssertMsgBreakStmt(cbSize,
6815 ("cbSize=%llu\n", cbSize),
6816 rc = VERR_INVALID_PARAMETER);
6817 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6818 ("uImageFlags=%#x\n", uImageFlags),
6819 rc = VERR_INVALID_PARAMETER);
6820 /* The UUID may be NULL. */
6821 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6822 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6823 rc = VERR_INVALID_PARAMETER);
6824 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6825 ("uOpenFlags=%#x\n", uOpenFlags),
6826 rc = VERR_INVALID_PARAMETER);
6827
6828 /* Check state. Needs a temporary read lock. Holding the write lock
6829 * all the time would be blocking other activities for too long. */
6830 rc2 = vdThreadStartRead(pDisk);
6831 AssertRC(rc2);
6832 fLockRead = true;
6833 AssertMsgBreakStmt(!pDisk->pCache,
6834 ("Create cache image cannot be done with a cache already attached\n"),
6835 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6836 rc2 = vdThreadFinishRead(pDisk);
6837 AssertRC(rc2);
6838 fLockRead = false;
6839
6840 /* Set up image descriptor. */
6841 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
6842 if (!pCache)
6843 {
6844 rc = VERR_NO_MEMORY;
6845 break;
6846 }
6847 pCache->pszFilename = RTStrDup(pszFilename);
6848 if (!pCache->pszFilename)
6849 {
6850 rc = VERR_NO_MEMORY;
6851 break;
6852 }
6853
6854 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
6855 if (RT_FAILURE(rc))
6856 break;
6857 if (!pCache->Backend)
6858 {
6859 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6860 N_("VD: unknown backend name '%s'"), pszBackend);
6861 break;
6862 }
6863
6864 pCache->VDIo.pDisk = pDisk;
6865 pCache->pVDIfsCache = pVDIfsCache;
6866
6867 /* Set up the I/O interface. */
6868 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
6869 if (!pCache->VDIo.pInterfaceIo)
6870 {
6871 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
6872 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6873 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
6874 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
6875 }
6876
6877 /* Set up the internal I/O interface. */
6878 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
6879 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
6880 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6881 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
6882 AssertRC(rc);
6883
6884 /* Create UUID if the caller didn't specify one. */
6885 if (!pUuid)
6886 {
6887 rc = RTUuidCreate(&uuid);
6888 if (RT_FAILURE(rc))
6889 {
6890 rc = vdError(pDisk, rc, RT_SRC_POS,
6891 N_("VD: cannot generate UUID for image '%s'"),
6892 pszFilename);
6893 break;
6894 }
6895 pUuid = &uuid;
6896 }
6897
6898 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6899 pCache->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6900 rc = pCache->Backend->pfnCreate(pCache->pszFilename, cbSize,
6901 uImageFlags,
6902 pszComment, pUuid,
6903 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6904 0, 99,
6905 pDisk->pVDIfsDisk,
6906 pCache->pVDIfsCache,
6907 pVDIfsOperation,
6908 &pCache->pBackendData);
6909
6910 if (RT_SUCCESS(rc))
6911 {
6912 /* Lock disk for writing, as we modify pDisk information below. */
6913 rc2 = vdThreadStartWrite(pDisk);
6914 AssertRC(rc2);
6915 fLockWrite = true;
6916
6917 pCache->VDIo.pBackendData = pCache->pBackendData;
6918
6919 /* Re-check state, as the lock wasn't held and another image
6920 * creation call could have been done by another thread. */
6921 AssertMsgStmt(!pDisk->pCache,
6922 ("Create cache image cannot be done with another cache open\n"),
6923 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6924 }
6925
6926 if ( RT_SUCCESS(rc)
6927 && pDisk->pLast)
6928 {
6929 RTUUID UuidModification;
6930
6931 /* Set same modification Uuid as the last image. */
6932 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6933 &UuidModification);
6934 if (RT_SUCCESS(rc))
6935 {
6936 rc = pCache->Backend->pfnSetModificationUuid(pCache->pBackendData,
6937 &UuidModification);
6938 }
6939
6940 if (rc == VERR_NOT_SUPPORTED)
6941 rc = VINF_SUCCESS;
6942 }
6943
6944 if (RT_SUCCESS(rc))
6945 {
6946 /* Cache successfully created. */
6947 pDisk->pCache = pCache;
6948 }
6949 else
6950 {
6951 /* Error detected, but image opened. Close and delete image. */
6952 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, true);
6953 AssertRC(rc2);
6954 pCache->pBackendData = NULL;
6955 }
6956 } while (0);
6957
6958 if (RT_UNLIKELY(fLockWrite))
6959 {
6960 rc2 = vdThreadFinishWrite(pDisk);
6961 AssertRC(rc2);
6962 }
6963 else if (RT_UNLIKELY(fLockRead))
6964 {
6965 rc2 = vdThreadFinishRead(pDisk);
6966 AssertRC(rc2);
6967 }
6968
6969 if (RT_FAILURE(rc))
6970 {
6971 if (pCache)
6972 {
6973 if (pCache->pszFilename)
6974 RTStrFree(pCache->pszFilename);
6975 RTMemFree(pCache);
6976 }
6977 }
6978
6979 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6980 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6981
6982 LogFlowFunc(("returns %Rrc\n", rc));
6983 return rc;
6984}
6985
6986/**
6987 * Merges two images (not necessarily with direct parent/child relationship).
6988 * As a side effect the source image and potentially the other images which
6989 * are also merged to the destination are deleted from both the disk and the
6990 * images in the HDD container.
6991 *
6992 * @returns VBox status code.
6993 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
6994 * @param pDisk Pointer to HDD container.
6995 * @param nImageFrom Name of the image file to merge from.
6996 * @param nImageTo Name of the image file to merge to.
6997 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6998 */
6999VBOXDDU_DECL(int) VDMerge(PVBOXHDD pDisk, unsigned nImageFrom,
7000 unsigned nImageTo, PVDINTERFACE pVDIfsOperation)
7001{
7002 int rc = VINF_SUCCESS;
7003 int rc2;
7004 bool fLockWrite = false, fLockRead = false;
7005 void *pvBuf = NULL;
7006
7007 LogFlowFunc(("pDisk=%#p nImageFrom=%u nImageTo=%u pVDIfsOperation=%#p\n",
7008 pDisk, nImageFrom, nImageTo, pVDIfsOperation));
7009
7010 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7011
7012 do
7013 {
7014 /* sanity check */
7015 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7016 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7017
7018 /* For simplicity reasons lock for writing as the image reopen below
7019 * might need it. After all the reopen is usually needed. */
7020 rc2 = vdThreadStartWrite(pDisk);
7021 AssertRC(rc2);
7022 fLockWrite = true;
7023 PVDIMAGE pImageFrom = vdGetImageByNumber(pDisk, nImageFrom);
7024 PVDIMAGE pImageTo = vdGetImageByNumber(pDisk, nImageTo);
7025 if (!pImageFrom || !pImageTo)
7026 {
7027 rc = VERR_VD_IMAGE_NOT_FOUND;
7028 break;
7029 }
7030 AssertBreakStmt(pImageFrom != pImageTo, rc = VERR_INVALID_PARAMETER);
7031
7032 /* Make sure destination image is writable. */
7033 unsigned uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7034 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
7035 {
7036 /*
7037 * Clear skip consistency checks because the image is made writable now and
7038 * skipping consistency checks is only possible for readonly images.
7039 */
7040 uOpenFlags &= ~(VD_OPEN_FLAGS_READONLY | VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS);
7041 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7042 uOpenFlags);
7043 if (RT_FAILURE(rc))
7044 break;
7045 }
7046
7047 /* Get size of destination image. */
7048 uint64_t cbSize = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
7049 rc2 = vdThreadFinishWrite(pDisk);
7050 AssertRC(rc2);
7051 fLockWrite = false;
7052
7053 /* Allocate tmp buffer. */
7054 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
7055 if (!pvBuf)
7056 {
7057 rc = VERR_NO_MEMORY;
7058 break;
7059 }
7060
7061 /* Merging is done directly on the images itself. This potentially
7062 * causes trouble if the disk is full in the middle of operation. */
7063 if (nImageFrom < nImageTo)
7064 {
7065 /* Merge parent state into child. This means writing all not
7066 * allocated blocks in the destination image which are allocated in
7067 * the images to be merged. */
7068 uint64_t uOffset = 0;
7069 uint64_t cbRemaining = cbSize;
7070 do
7071 {
7072 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7073 RTSGSEG SegmentBuf;
7074 RTSGBUF SgBuf;
7075 VDIOCTX IoCtx;
7076
7077 SegmentBuf.pvSeg = pvBuf;
7078 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7079 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7080 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7081 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7082
7083 /* Need to hold the write lock during a read-write operation. */
7084 rc2 = vdThreadStartWrite(pDisk);
7085 AssertRC(rc2);
7086 fLockWrite = true;
7087
7088 rc = pImageTo->Backend->pfnRead(pImageTo->pBackendData,
7089 uOffset, cbThisRead,
7090 &IoCtx, &cbThisRead);
7091 if (rc == VERR_VD_BLOCK_FREE)
7092 {
7093 /* Search for image with allocated block. Do not attempt to
7094 * read more than the previous reads marked as valid.
7095 * Otherwise this would return stale data when different
7096 * block sizes are used for the images. */
7097 for (PVDIMAGE pCurrImage = pImageTo->pPrev;
7098 pCurrImage != NULL && pCurrImage != pImageFrom->pPrev && rc == VERR_VD_BLOCK_FREE;
7099 pCurrImage = pCurrImage->pPrev)
7100 {
7101 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7102 uOffset, cbThisRead,
7103 &IoCtx, &cbThisRead);
7104 }
7105
7106 if (rc != VERR_VD_BLOCK_FREE)
7107 {
7108 if (RT_FAILURE(rc))
7109 break;
7110 /* Updating the cache is required because this might be a live merge. */
7111 rc = vdWriteHelperEx(pDisk, pImageTo, pImageFrom->pPrev,
7112 uOffset, pvBuf, cbThisRead,
7113 VDIOCTX_FLAGS_READ_UPDATE_CACHE, 0);
7114 if (RT_FAILURE(rc))
7115 break;
7116 }
7117 else
7118 rc = VINF_SUCCESS;
7119 }
7120 else if (RT_FAILURE(rc))
7121 break;
7122
7123 rc2 = vdThreadFinishWrite(pDisk);
7124 AssertRC(rc2);
7125 fLockWrite = false;
7126
7127 uOffset += cbThisRead;
7128 cbRemaining -= cbThisRead;
7129
7130 if (pIfProgress && pIfProgress->pfnProgress)
7131 {
7132 /** @todo r=klaus: this can update the progress to the same
7133 * percentage over and over again if the image format makes
7134 * relatively small increments. */
7135 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7136 uOffset * 99 / cbSize);
7137 if (RT_FAILURE(rc))
7138 break;
7139 }
7140 } while (uOffset < cbSize);
7141 }
7142 else
7143 {
7144 /*
7145 * We may need to update the parent uuid of the child coming after
7146 * the last image to be merged. We have to reopen it read/write.
7147 *
7148 * This is done before we do the actual merge to prevent an
7149 * inconsistent chain if the mode change fails for some reason.
7150 */
7151 if (pImageFrom->pNext)
7152 {
7153 PVDIMAGE pImageChild = pImageFrom->pNext;
7154
7155 /* Take the write lock. */
7156 rc2 = vdThreadStartWrite(pDisk);
7157 AssertRC(rc2);
7158 fLockWrite = true;
7159
7160 /* We need to open the image in read/write mode. */
7161 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7162
7163 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
7164 {
7165 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
7166 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7167 uOpenFlags);
7168 if (RT_FAILURE(rc))
7169 break;
7170 }
7171
7172 rc2 = vdThreadFinishWrite(pDisk);
7173 AssertRC(rc2);
7174 fLockWrite = false;
7175 }
7176
7177 /* If the merge is from the last image we have to relay all writes
7178 * to the merge destination as well, so that concurrent writes
7179 * (in case of a live merge) are handled correctly. */
7180 if (!pImageFrom->pNext)
7181 {
7182 /* Take the write lock. */
7183 rc2 = vdThreadStartWrite(pDisk);
7184 AssertRC(rc2);
7185 fLockWrite = true;
7186
7187 pDisk->pImageRelay = pImageTo;
7188
7189 rc2 = vdThreadFinishWrite(pDisk);
7190 AssertRC(rc2);
7191 fLockWrite = false;
7192 }
7193
7194 /* Merge child state into parent. This means writing all blocks
7195 * which are allocated in the image up to the source image to the
7196 * destination image. */
7197 uint64_t uOffset = 0;
7198 uint64_t cbRemaining = cbSize;
7199 do
7200 {
7201 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7202 RTSGSEG SegmentBuf;
7203 RTSGBUF SgBuf;
7204 VDIOCTX IoCtx;
7205
7206 rc = VERR_VD_BLOCK_FREE;
7207
7208 SegmentBuf.pvSeg = pvBuf;
7209 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7210 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7211 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7212 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7213
7214 /* Need to hold the write lock during a read-write operation. */
7215 rc2 = vdThreadStartWrite(pDisk);
7216 AssertRC(rc2);
7217 fLockWrite = true;
7218
7219 /* Search for image with allocated block. Do not attempt to
7220 * read more than the previous reads marked as valid. Otherwise
7221 * this would return stale data when different block sizes are
7222 * used for the images. */
7223 for (PVDIMAGE pCurrImage = pImageFrom;
7224 pCurrImage != NULL && pCurrImage != pImageTo && rc == VERR_VD_BLOCK_FREE;
7225 pCurrImage = pCurrImage->pPrev)
7226 {
7227 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7228 uOffset, cbThisRead,
7229 &IoCtx, &cbThisRead);
7230 }
7231
7232 if (rc != VERR_VD_BLOCK_FREE)
7233 {
7234 if (RT_FAILURE(rc))
7235 break;
7236 rc = vdWriteHelper(pDisk, pImageTo, uOffset, pvBuf,
7237 cbThisRead, VDIOCTX_FLAGS_READ_UPDATE_CACHE);
7238 if (RT_FAILURE(rc))
7239 break;
7240 }
7241 else
7242 rc = VINF_SUCCESS;
7243
7244 rc2 = vdThreadFinishWrite(pDisk);
7245 AssertRC(rc2);
7246 fLockWrite = false;
7247
7248 uOffset += cbThisRead;
7249 cbRemaining -= cbThisRead;
7250
7251 if (pIfProgress && pIfProgress->pfnProgress)
7252 {
7253 /** @todo r=klaus: this can update the progress to the same
7254 * percentage over and over again if the image format makes
7255 * relatively small increments. */
7256 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7257 uOffset * 99 / cbSize);
7258 if (RT_FAILURE(rc))
7259 break;
7260 }
7261 } while (uOffset < cbSize);
7262
7263 /* In case we set up a "write proxy" image above we must clear
7264 * this again now to prevent stray writes. Failure or not. */
7265 if (!pImageFrom->pNext)
7266 {
7267 /* Take the write lock. */
7268 rc2 = vdThreadStartWrite(pDisk);
7269 AssertRC(rc2);
7270 fLockWrite = true;
7271
7272 pDisk->pImageRelay = NULL;
7273
7274 rc2 = vdThreadFinishWrite(pDisk);
7275 AssertRC(rc2);
7276 fLockWrite = false;
7277 }
7278 }
7279
7280 /*
7281 * Leave in case of an error to avoid corrupted data in the image chain
7282 * (includes cancelling the operation by the user).
7283 */
7284 if (RT_FAILURE(rc))
7285 break;
7286
7287 /* Need to hold the write lock while finishing the merge. */
7288 rc2 = vdThreadStartWrite(pDisk);
7289 AssertRC(rc2);
7290 fLockWrite = true;
7291
7292 /* Update parent UUID so that image chain is consistent.
7293 * The two attempts work around the problem that some backends
7294 * (e.g. iSCSI) do not support UUIDs, so we exploit the fact that
7295 * so far there can only be one such image in the chain. */
7296 /** @todo needs a better long-term solution, passing the UUID
7297 * knowledge from the caller or some such */
7298 RTUUID Uuid;
7299 PVDIMAGE pImageChild = NULL;
7300 if (nImageFrom < nImageTo)
7301 {
7302 if (pImageFrom->pPrev)
7303 {
7304 /* plan A: ask the parent itself for its UUID */
7305 rc = pImageFrom->pPrev->Backend->pfnGetUuid(pImageFrom->pPrev->pBackendData,
7306 &Uuid);
7307 if (RT_FAILURE(rc))
7308 {
7309 /* plan B: ask the child of the parent for parent UUID */
7310 rc = pImageFrom->Backend->pfnGetParentUuid(pImageFrom->pBackendData,
7311 &Uuid);
7312 }
7313 AssertRC(rc);
7314 }
7315 else
7316 RTUuidClear(&Uuid);
7317 rc = pImageTo->Backend->pfnSetParentUuid(pImageTo->pBackendData,
7318 &Uuid);
7319 AssertRC(rc);
7320 }
7321 else
7322 {
7323 /* Update the parent uuid of the child of the last merged image. */
7324 if (pImageFrom->pNext)
7325 {
7326 /* plan A: ask the parent itself for its UUID */
7327 rc = pImageTo->Backend->pfnGetUuid(pImageTo->pBackendData,
7328 &Uuid);
7329 if (RT_FAILURE(rc))
7330 {
7331 /* plan B: ask the child of the parent for parent UUID */
7332 rc = pImageTo->pNext->Backend->pfnGetParentUuid(pImageTo->pNext->pBackendData,
7333 &Uuid);
7334 }
7335 AssertRC(rc);
7336
7337 rc = pImageFrom->Backend->pfnSetParentUuid(pImageFrom->pNext->pBackendData,
7338 &Uuid);
7339 AssertRC(rc);
7340
7341 pImageChild = pImageFrom->pNext;
7342 }
7343 }
7344
7345 /* Delete the no longer needed images. */
7346 PVDIMAGE pImg = pImageFrom, pTmp;
7347 while (pImg != pImageTo)
7348 {
7349 if (nImageFrom < nImageTo)
7350 pTmp = pImg->pNext;
7351 else
7352 pTmp = pImg->pPrev;
7353 vdRemoveImageFromList(pDisk, pImg);
7354 pImg->Backend->pfnClose(pImg->pBackendData, true);
7355 RTMemFree(pImg->pszFilename);
7356 RTMemFree(pImg);
7357 pImg = pTmp;
7358 }
7359
7360 /* Make sure destination image is back to read only if necessary. */
7361 if (pImageTo != pDisk->pLast)
7362 {
7363 uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7364 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7365 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7366 uOpenFlags);
7367 if (RT_FAILURE(rc))
7368 break;
7369 }
7370
7371 /*
7372 * Make sure the child is readonly
7373 * for the child -> parent merge direction
7374 * if necessary.
7375 */
7376 if ( nImageFrom > nImageTo
7377 && pImageChild
7378 && pImageChild != pDisk->pLast)
7379 {
7380 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7381 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7382 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7383 uOpenFlags);
7384 if (RT_FAILURE(rc))
7385 break;
7386 }
7387 } while (0);
7388
7389 if (RT_UNLIKELY(fLockWrite))
7390 {
7391 rc2 = vdThreadFinishWrite(pDisk);
7392 AssertRC(rc2);
7393 }
7394 else if (RT_UNLIKELY(fLockRead))
7395 {
7396 rc2 = vdThreadFinishRead(pDisk);
7397 AssertRC(rc2);
7398 }
7399
7400 if (pvBuf)
7401 RTMemTmpFree(pvBuf);
7402
7403 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7404 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7405
7406 LogFlowFunc(("returns %Rrc\n", rc));
7407 return rc;
7408}
7409
7410/**
7411 * Copies an image from one HDD container to another - extended version.
7412 * The copy is opened in the target HDD container.
7413 * It is possible to convert between different image formats, because the
7414 * backend for the destination may be different from the source.
7415 * If both the source and destination reference the same HDD container,
7416 * then the image is moved (by copying/deleting or renaming) to the new location.
7417 * The source container is unchanged if the move operation fails, otherwise
7418 * the image at the new location is opened in the same way as the old one was.
7419 *
7420 * @note The read/write accesses across disks are not synchronized, just the
7421 * accesses to each disk. Once there is a use case which requires a defined
7422 * read/write behavior in this situation this needs to be extended.
7423 *
7424 * @return VBox status code.
7425 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7426 * @param pDiskFrom Pointer to source HDD container.
7427 * @param nImage Image number, counts from 0. 0 is always base image of container.
7428 * @param pDiskTo Pointer to destination HDD container.
7429 * @param pszBackend Name of the image file backend to use (may be NULL to use the same as the source, case insensitive).
7430 * @param pszFilename New name of the image (may be NULL to specify that the
7431 * copy destination is the destination container, or
7432 * if pDiskFrom == pDiskTo, i.e. when moving).
7433 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7434 * @param cbSize New image size (0 means leave unchanged).
7435 * @param nImageSameFrom todo
7436 * @param nImageSameTo todo
7437 * @param uImageFlags Flags specifying special destination image features.
7438 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7439 * This parameter is used if and only if a true copy is created.
7440 * In all rename/move cases or copy to existing image cases the modification UUIDs are copied over.
7441 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7442 * Only used if the destination image is created.
7443 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7444 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7445 * destination image.
7446 * @param pDstVDIfsOperation Pointer to the per-operation VD interface list,
7447 * for the destination operation.
7448 */
7449VBOXDDU_DECL(int) VDCopyEx(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
7450 const char *pszBackend, const char *pszFilename,
7451 bool fMoveByRename, uint64_t cbSize,
7452 unsigned nImageFromSame, unsigned nImageToSame,
7453 unsigned uImageFlags, PCRTUUID pDstUuid,
7454 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7455 PVDINTERFACE pDstVDIfsImage,
7456 PVDINTERFACE pDstVDIfsOperation)
7457{
7458 int rc = VINF_SUCCESS;
7459 int rc2;
7460 bool fLockReadFrom = false, fLockWriteFrom = false, fLockWriteTo = false;
7461 PVDIMAGE pImageTo = NULL;
7462
7463 LogFlowFunc(("pDiskFrom=%#p nImage=%u pDiskTo=%#p pszBackend=\"%s\" pszFilename=\"%s\" fMoveByRename=%d cbSize=%llu nImageFromSame=%u nImageToSame=%u uImageFlags=%#x pDstUuid=%#p uOpenFlags=%#x pVDIfsOperation=%#p pDstVDIfsImage=%#p pDstVDIfsOperation=%#p\n",
7464 pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename, cbSize, nImageFromSame, nImageToSame, uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation, pDstVDIfsImage, pDstVDIfsOperation));
7465
7466 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7467 PVDINTERFACEPROGRESS pDstIfProgress = VDIfProgressGet(pDstVDIfsOperation);
7468
7469 do {
7470 /* Check arguments. */
7471 AssertMsgBreakStmt(VALID_PTR(pDiskFrom), ("pDiskFrom=%#p\n", pDiskFrom),
7472 rc = VERR_INVALID_PARAMETER);
7473 AssertMsg(pDiskFrom->u32Signature == VBOXHDDDISK_SIGNATURE,
7474 ("u32Signature=%08x\n", pDiskFrom->u32Signature));
7475
7476 rc2 = vdThreadStartRead(pDiskFrom);
7477 AssertRC(rc2);
7478 fLockReadFrom = true;
7479 PVDIMAGE pImageFrom = vdGetImageByNumber(pDiskFrom, nImage);
7480 AssertPtrBreakStmt(pImageFrom, rc = VERR_VD_IMAGE_NOT_FOUND);
7481 AssertMsgBreakStmt(VALID_PTR(pDiskTo), ("pDiskTo=%#p\n", pDiskTo),
7482 rc = VERR_INVALID_PARAMETER);
7483 AssertMsg(pDiskTo->u32Signature == VBOXHDDDISK_SIGNATURE,
7484 ("u32Signature=%08x\n", pDiskTo->u32Signature));
7485 AssertMsgBreakStmt( (nImageFromSame < nImage || nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7486 && (nImageToSame < pDiskTo->cImages || nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7487 && ( (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN && nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7488 || (nImageFromSame != VD_IMAGE_CONTENT_UNKNOWN && nImageToSame != VD_IMAGE_CONTENT_UNKNOWN)),
7489 ("nImageFromSame=%u nImageToSame=%u\n", nImageFromSame, nImageToSame),
7490 rc = VERR_INVALID_PARAMETER);
7491
7492 /* Move the image. */
7493 if (pDiskFrom == pDiskTo)
7494 {
7495 /* Rename only works when backends are the same, are file based
7496 * and the rename method is implemented. */
7497 if ( fMoveByRename
7498 && !RTStrICmp(pszBackend, pImageFrom->Backend->pszBackendName)
7499 && pImageFrom->Backend->uBackendCaps & VD_CAP_FILE
7500 && pImageFrom->Backend->pfnRename)
7501 {
7502 rc2 = vdThreadFinishRead(pDiskFrom);
7503 AssertRC(rc2);
7504 fLockReadFrom = false;
7505
7506 rc2 = vdThreadStartWrite(pDiskFrom);
7507 AssertRC(rc2);
7508 fLockWriteFrom = true;
7509 rc = pImageFrom->Backend->pfnRename(pImageFrom->pBackendData, pszFilename ? pszFilename : pImageFrom->pszFilename);
7510 break;
7511 }
7512
7513 /** @todo Moving (including shrinking/growing) of the image is
7514 * requested, but the rename attempt failed or it wasn't possible.
7515 * Must now copy image to temp location. */
7516 AssertReleaseMsgFailed(("VDCopy: moving by copy/delete not implemented\n"));
7517 }
7518
7519 /* pszFilename is allowed to be NULL, as this indicates copy to the existing image. */
7520 AssertMsgBreakStmt(pszFilename == NULL || (VALID_PTR(pszFilename) && *pszFilename),
7521 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
7522 rc = VERR_INVALID_PARAMETER);
7523
7524 uint64_t cbSizeFrom;
7525 cbSizeFrom = pImageFrom->Backend->pfnGetSize(pImageFrom->pBackendData);
7526 if (cbSizeFrom == 0)
7527 {
7528 rc = VERR_VD_VALUE_NOT_FOUND;
7529 break;
7530 }
7531
7532 VDGEOMETRY PCHSGeometryFrom = {0, 0, 0};
7533 VDGEOMETRY LCHSGeometryFrom = {0, 0, 0};
7534 pImageFrom->Backend->pfnGetPCHSGeometry(pImageFrom->pBackendData, &PCHSGeometryFrom);
7535 pImageFrom->Backend->pfnGetLCHSGeometry(pImageFrom->pBackendData, &LCHSGeometryFrom);
7536
7537 RTUUID ImageUuid, ImageModificationUuid;
7538 if (pDiskFrom != pDiskTo)
7539 {
7540 if (pDstUuid)
7541 ImageUuid = *pDstUuid;
7542 else
7543 RTUuidCreate(&ImageUuid);
7544 }
7545 else
7546 {
7547 rc = pImageFrom->Backend->pfnGetUuid(pImageFrom->pBackendData, &ImageUuid);
7548 if (RT_FAILURE(rc))
7549 RTUuidCreate(&ImageUuid);
7550 }
7551 rc = pImageFrom->Backend->pfnGetModificationUuid(pImageFrom->pBackendData, &ImageModificationUuid);
7552 if (RT_FAILURE(rc))
7553 RTUuidClear(&ImageModificationUuid);
7554
7555 char szComment[1024];
7556 rc = pImageFrom->Backend->pfnGetComment(pImageFrom->pBackendData, szComment, sizeof(szComment));
7557 if (RT_FAILURE(rc))
7558 szComment[0] = '\0';
7559 else
7560 szComment[sizeof(szComment) - 1] = '\0';
7561
7562 rc2 = vdThreadFinishRead(pDiskFrom);
7563 AssertRC(rc2);
7564 fLockReadFrom = false;
7565
7566 rc2 = vdThreadStartRead(pDiskTo);
7567 AssertRC(rc2);
7568 unsigned cImagesTo = pDiskTo->cImages;
7569 rc2 = vdThreadFinishRead(pDiskTo);
7570 AssertRC(rc2);
7571
7572 if (pszFilename)
7573 {
7574 if (cbSize == 0)
7575 cbSize = cbSizeFrom;
7576
7577 /* Create destination image with the properties of source image. */
7578 /** @todo replace the VDCreateDiff/VDCreateBase calls by direct
7579 * calls to the backend. Unifies the code and reduces the API
7580 * dependencies. Would also make the synchronization explicit. */
7581 if (cImagesTo > 0)
7582 {
7583 rc = VDCreateDiff(pDiskTo, pszBackend, pszFilename,
7584 uImageFlags, szComment, &ImageUuid,
7585 NULL /* pParentUuid */,
7586 uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7587 pDstVDIfsImage, NULL);
7588
7589 rc2 = vdThreadStartWrite(pDiskTo);
7590 AssertRC(rc2);
7591 fLockWriteTo = true;
7592 } else {
7593 /** @todo hack to force creation of a fixed image for
7594 * the RAW backend, which can't handle anything else. */
7595 if (!RTStrICmp(pszBackend, "RAW"))
7596 uImageFlags |= VD_IMAGE_FLAGS_FIXED;
7597
7598 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7599 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7600
7601 rc = VDCreateBase(pDiskTo, pszBackend, pszFilename, cbSize,
7602 uImageFlags, szComment,
7603 &PCHSGeometryFrom, &LCHSGeometryFrom,
7604 NULL, uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7605 pDstVDIfsImage, NULL);
7606
7607 rc2 = vdThreadStartWrite(pDiskTo);
7608 AssertRC(rc2);
7609 fLockWriteTo = true;
7610
7611 if (RT_SUCCESS(rc) && !RTUuidIsNull(&ImageUuid))
7612 pDiskTo->pLast->Backend->pfnSetUuid(pDiskTo->pLast->pBackendData, &ImageUuid);
7613 }
7614 if (RT_FAILURE(rc))
7615 break;
7616
7617 pImageTo = pDiskTo->pLast;
7618 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7619
7620 cbSize = RT_MIN(cbSize, cbSizeFrom);
7621 }
7622 else
7623 {
7624 pImageTo = pDiskTo->pLast;
7625 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7626
7627 uint64_t cbSizeTo;
7628 cbSizeTo = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
7629 if (cbSizeTo == 0)
7630 {
7631 rc = VERR_VD_VALUE_NOT_FOUND;
7632 break;
7633 }
7634
7635 if (cbSize == 0)
7636 cbSize = RT_MIN(cbSizeFrom, cbSizeTo);
7637
7638 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7639 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7640
7641 /* Update the geometry in the destination image. */
7642 pImageTo->Backend->pfnSetPCHSGeometry(pImageTo->pBackendData, &PCHSGeometryFrom);
7643 pImageTo->Backend->pfnSetLCHSGeometry(pImageTo->pBackendData, &LCHSGeometryFrom);
7644 }
7645
7646 rc2 = vdThreadFinishWrite(pDiskTo);
7647 AssertRC(rc2);
7648 fLockWriteTo = false;
7649
7650 /* Whether we can take the optimized copy path (false) or not.
7651 * Don't optimize if the image existed or if it is a child image. */
7652 bool fSuppressRedundantIo = ( !(pszFilename == NULL || cImagesTo > 0)
7653 || (nImageToSame != VD_IMAGE_CONTENT_UNKNOWN));
7654 unsigned cImagesFromReadBack, cImagesToReadBack;
7655
7656 if (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7657 cImagesFromReadBack = 0;
7658 else
7659 {
7660 if (nImage == VD_LAST_IMAGE)
7661 cImagesFromReadBack = pDiskFrom->cImages - nImageFromSame - 1;
7662 else
7663 cImagesFromReadBack = nImage - nImageFromSame;
7664 }
7665
7666 if (nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7667 cImagesToReadBack = 0;
7668 else
7669 cImagesToReadBack = pDiskTo->cImages - nImageToSame - 1;
7670
7671 /* Copy the data. */
7672 rc = vdCopyHelper(pDiskFrom, pImageFrom, pDiskTo, cbSize,
7673 cImagesFromReadBack, cImagesToReadBack,
7674 fSuppressRedundantIo, pIfProgress, pDstIfProgress);
7675
7676 if (RT_SUCCESS(rc))
7677 {
7678 rc2 = vdThreadStartWrite(pDiskTo);
7679 AssertRC(rc2);
7680 fLockWriteTo = true;
7681
7682 /* Only set modification UUID if it is non-null, since the source
7683 * backend might not provide a valid modification UUID. */
7684 if (!RTUuidIsNull(&ImageModificationUuid))
7685 pImageTo->Backend->pfnSetModificationUuid(pImageTo->pBackendData, &ImageModificationUuid);
7686
7687 /* Set the requested open flags if they differ from the value
7688 * required for creating the image and copying the contents. */
7689 if ( pImageTo && pszFilename
7690 && uOpenFlags != (uOpenFlags & ~VD_OPEN_FLAGS_READONLY))
7691 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7692 uOpenFlags);
7693 }
7694 } while (0);
7695
7696 if (RT_FAILURE(rc) && pImageTo && pszFilename)
7697 {
7698 /* Take the write lock only if it is not taken. Not worth making the
7699 * above code even more complicated. */
7700 if (RT_UNLIKELY(!fLockWriteTo))
7701 {
7702 rc2 = vdThreadStartWrite(pDiskTo);
7703 AssertRC(rc2);
7704 fLockWriteTo = true;
7705 }
7706 /* Error detected, but new image created. Remove image from list. */
7707 vdRemoveImageFromList(pDiskTo, pImageTo);
7708
7709 /* Close and delete image. */
7710 rc2 = pImageTo->Backend->pfnClose(pImageTo->pBackendData, true);
7711 AssertRC(rc2);
7712 pImageTo->pBackendData = NULL;
7713
7714 /* Free remaining resources. */
7715 if (pImageTo->pszFilename)
7716 RTStrFree(pImageTo->pszFilename);
7717
7718 RTMemFree(pImageTo);
7719 }
7720
7721 if (RT_UNLIKELY(fLockWriteTo))
7722 {
7723 rc2 = vdThreadFinishWrite(pDiskTo);
7724 AssertRC(rc2);
7725 }
7726 if (RT_UNLIKELY(fLockWriteFrom))
7727 {
7728 rc2 = vdThreadFinishWrite(pDiskFrom);
7729 AssertRC(rc2);
7730 }
7731 else if (RT_UNLIKELY(fLockReadFrom))
7732 {
7733 rc2 = vdThreadFinishRead(pDiskFrom);
7734 AssertRC(rc2);
7735 }
7736
7737 if (RT_SUCCESS(rc))
7738 {
7739 if (pIfProgress && pIfProgress->pfnProgress)
7740 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7741 if (pDstIfProgress && pDstIfProgress->pfnProgress)
7742 pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser, 100);
7743 }
7744
7745 LogFlowFunc(("returns %Rrc\n", rc));
7746 return rc;
7747}
7748
7749/**
7750 * Copies an image from one HDD container to another.
7751 * The copy is opened in the target HDD container.
7752 * It is possible to convert between different image formats, because the
7753 * backend for the destination may be different from the source.
7754 * If both the source and destination reference the same HDD container,
7755 * then the image is moved (by copying/deleting or renaming) to the new location.
7756 * The source container is unchanged if the move operation fails, otherwise
7757 * the image at the new location is opened in the same way as the old one was.
7758 *
7759 * @returns VBox status code.
7760 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7761 * @param pDiskFrom Pointer to source HDD container.
7762 * @param nImage Image number, counts from 0. 0 is always base image of container.
7763 * @param pDiskTo Pointer to destination HDD container.
7764 * @param pszBackend Name of the image file backend to use.
7765 * @param pszFilename New name of the image (may be NULL if pDiskFrom == pDiskTo).
7766 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7767 * @param cbSize New image size (0 means leave unchanged).
7768 * @param uImageFlags Flags specifying special destination image features.
7769 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7770 * This parameter is used if and only if a true copy is created.
7771 * In all rename/move cases the UUIDs are copied over.
7772 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7773 * Only used if the destination image is created.
7774 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7775 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7776 * destination image.
7777 * @param pDstVDIfsOperation Pointer to the per-image VD interface list,
7778 * for the destination image.
7779 */
7780VBOXDDU_DECL(int) VDCopy(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
7781 const char *pszBackend, const char *pszFilename,
7782 bool fMoveByRename, uint64_t cbSize,
7783 unsigned uImageFlags, PCRTUUID pDstUuid,
7784 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7785 PVDINTERFACE pDstVDIfsImage,
7786 PVDINTERFACE pDstVDIfsOperation)
7787{
7788 return VDCopyEx(pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename,
7789 cbSize, VD_IMAGE_CONTENT_UNKNOWN, VD_IMAGE_CONTENT_UNKNOWN,
7790 uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation,
7791 pDstVDIfsImage, pDstVDIfsOperation);
7792}
7793
7794/**
7795 * Optimizes the storage consumption of an image. Typically the unused blocks
7796 * have to be wiped with zeroes to achieve a substantial reduced storage use.
7797 * Another optimization done is reordering the image blocks, which can provide
7798 * a significant performance boost, as reads and writes tend to use less random
7799 * file offsets.
7800 *
7801 * @return VBox status code.
7802 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7803 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7804 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7805 * the code for this isn't implemented yet.
7806 * @param pDisk Pointer to HDD container.
7807 * @param nImage Image number, counts from 0. 0 is always base image of container.
7808 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7809 */
7810VBOXDDU_DECL(int) VDCompact(PVBOXHDD pDisk, unsigned nImage,
7811 PVDINTERFACE pVDIfsOperation)
7812{
7813 int rc = VINF_SUCCESS;
7814 int rc2;
7815 bool fLockRead = false, fLockWrite = false;
7816 void *pvBuf = NULL;
7817 void *pvTmp = NULL;
7818
7819 LogFlowFunc(("pDisk=%#p nImage=%u pVDIfsOperation=%#p\n",
7820 pDisk, nImage, pVDIfsOperation));
7821
7822 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7823
7824 do {
7825 /* Check arguments. */
7826 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7827 rc = VERR_INVALID_PARAMETER);
7828 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
7829 ("u32Signature=%08x\n", pDisk->u32Signature));
7830
7831 rc2 = vdThreadStartRead(pDisk);
7832 AssertRC(rc2);
7833 fLockRead = true;
7834
7835 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
7836 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
7837
7838 /* If there is no compact callback for not file based backends then
7839 * the backend doesn't need compaction. No need to make much fuss about
7840 * this. For file based ones signal this as not yet supported. */
7841 if (!pImage->Backend->pfnCompact)
7842 {
7843 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7844 rc = VERR_NOT_SUPPORTED;
7845 else
7846 rc = VINF_SUCCESS;
7847 break;
7848 }
7849
7850 /* Insert interface for reading parent state into per-operation list,
7851 * if there is a parent image. */
7852 VDINTERFACEPARENTSTATE VDIfParent;
7853 VDPARENTSTATEDESC ParentUser;
7854 if (pImage->pPrev)
7855 {
7856 VDIfParent.pfnParentRead = vdParentRead;
7857 ParentUser.pDisk = pDisk;
7858 ParentUser.pImage = pImage->pPrev;
7859 rc = VDInterfaceAdd(&VDIfParent.Core, "VDCompact_ParentState", VDINTERFACETYPE_PARENTSTATE,
7860 &ParentUser, sizeof(VDINTERFACEPARENTSTATE), &pVDIfsOperation);
7861 AssertRC(rc);
7862 }
7863
7864 rc2 = vdThreadFinishRead(pDisk);
7865 AssertRC(rc2);
7866 fLockRead = false;
7867
7868 rc2 = vdThreadStartWrite(pDisk);
7869 AssertRC(rc2);
7870 fLockWrite = true;
7871
7872 rc = pImage->Backend->pfnCompact(pImage->pBackendData,
7873 0, 99,
7874 pDisk->pVDIfsDisk,
7875 pImage->pVDIfsImage,
7876 pVDIfsOperation);
7877 } while (0);
7878
7879 if (RT_UNLIKELY(fLockWrite))
7880 {
7881 rc2 = vdThreadFinishWrite(pDisk);
7882 AssertRC(rc2);
7883 }
7884 else if (RT_UNLIKELY(fLockRead))
7885 {
7886 rc2 = vdThreadFinishRead(pDisk);
7887 AssertRC(rc2);
7888 }
7889
7890 if (pvBuf)
7891 RTMemTmpFree(pvBuf);
7892 if (pvTmp)
7893 RTMemTmpFree(pvTmp);
7894
7895 if (RT_SUCCESS(rc))
7896 {
7897 if (pIfProgress && pIfProgress->pfnProgress)
7898 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7899 }
7900
7901 LogFlowFunc(("returns %Rrc\n", rc));
7902 return rc;
7903}
7904
7905/**
7906 * Resizes the given disk image to the given size.
7907 *
7908 * @return VBox status
7909 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7910 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7911 *
7912 * @param pDisk Pointer to the HDD container.
7913 * @param cbSize New size of the image.
7914 * @param pPCHSGeometry Pointer to the new physical disk geometry <= (16383,16,63). Not NULL.
7915 * @param pLCHSGeometry Pointer to the new logical disk geometry <= (x,255,63). Not NULL.
7916 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7917 */
7918VBOXDDU_DECL(int) VDResize(PVBOXHDD pDisk, uint64_t cbSize,
7919 PCVDGEOMETRY pPCHSGeometry,
7920 PCVDGEOMETRY pLCHSGeometry,
7921 PVDINTERFACE pVDIfsOperation)
7922{
7923 /** @todo r=klaus resizing was designed to be part of VDCopy, so having a separate function is not desirable. */
7924 int rc = VINF_SUCCESS;
7925 int rc2;
7926 bool fLockRead = false, fLockWrite = false;
7927
7928 LogFlowFunc(("pDisk=%#p cbSize=%llu pVDIfsOperation=%#p\n",
7929 pDisk, cbSize, pVDIfsOperation));
7930
7931 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7932
7933 do {
7934 /* Check arguments. */
7935 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7936 rc = VERR_INVALID_PARAMETER);
7937 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
7938 ("u32Signature=%08x\n", pDisk->u32Signature));
7939
7940 rc2 = vdThreadStartRead(pDisk);
7941 AssertRC(rc2);
7942 fLockRead = true;
7943
7944 /* Must have at least one image in the chain, will resize last. */
7945 AssertMsgBreakStmt(pDisk->cImages >= 1, ("cImages=%u\n", pDisk->cImages),
7946 rc = VERR_NOT_SUPPORTED);
7947
7948 PVDIMAGE pImage = pDisk->pLast;
7949
7950 /* If there is no compact callback for not file based backends then
7951 * the backend doesn't need compaction. No need to make much fuss about
7952 * this. For file based ones signal this as not yet supported. */
7953 if (!pImage->Backend->pfnResize)
7954 {
7955 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7956 rc = VERR_NOT_SUPPORTED;
7957 else
7958 rc = VINF_SUCCESS;
7959 break;
7960 }
7961
7962 rc2 = vdThreadFinishRead(pDisk);
7963 AssertRC(rc2);
7964 fLockRead = false;
7965
7966 rc2 = vdThreadStartWrite(pDisk);
7967 AssertRC(rc2);
7968 fLockWrite = true;
7969
7970 VDGEOMETRY PCHSGeometryOld;
7971 VDGEOMETRY LCHSGeometryOld;
7972 PCVDGEOMETRY pPCHSGeometryNew;
7973 PCVDGEOMETRY pLCHSGeometryNew;
7974
7975 if (pPCHSGeometry->cCylinders == 0)
7976 {
7977 /* Auto-detect marker, calculate new value ourself. */
7978 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData, &PCHSGeometryOld);
7979 if (RT_SUCCESS(rc) && (PCHSGeometryOld.cCylinders != 0))
7980 PCHSGeometryOld.cCylinders = RT_MIN(cbSize / 512 / PCHSGeometryOld.cHeads / PCHSGeometryOld.cSectors, 16383);
7981 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7982 rc = VINF_SUCCESS;
7983
7984 pPCHSGeometryNew = &PCHSGeometryOld;
7985 }
7986 else
7987 pPCHSGeometryNew = pPCHSGeometry;
7988
7989 if (pLCHSGeometry->cCylinders == 0)
7990 {
7991 /* Auto-detect marker, calculate new value ourself. */
7992 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData, &LCHSGeometryOld);
7993 if (RT_SUCCESS(rc) && (LCHSGeometryOld.cCylinders != 0))
7994 LCHSGeometryOld.cCylinders = cbSize / 512 / LCHSGeometryOld.cHeads / LCHSGeometryOld.cSectors;
7995 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7996 rc = VINF_SUCCESS;
7997
7998 pLCHSGeometryNew = &LCHSGeometryOld;
7999 }
8000 else
8001 pLCHSGeometryNew = pLCHSGeometry;
8002
8003 if (RT_SUCCESS(rc))
8004 rc = pImage->Backend->pfnResize(pImage->pBackendData,
8005 cbSize,
8006 pPCHSGeometryNew,
8007 pLCHSGeometryNew,
8008 0, 99,
8009 pDisk->pVDIfsDisk,
8010 pImage->pVDIfsImage,
8011 pVDIfsOperation);
8012 } while (0);
8013
8014 if (RT_UNLIKELY(fLockWrite))
8015 {
8016 rc2 = vdThreadFinishWrite(pDisk);
8017 AssertRC(rc2);
8018 }
8019 else if (RT_UNLIKELY(fLockRead))
8020 {
8021 rc2 = vdThreadFinishRead(pDisk);
8022 AssertRC(rc2);
8023 }
8024
8025 if (RT_SUCCESS(rc))
8026 {
8027 if (pIfProgress && pIfProgress->pfnProgress)
8028 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
8029
8030 pDisk->cbSize = cbSize;
8031 }
8032
8033 LogFlowFunc(("returns %Rrc\n", rc));
8034 return rc;
8035}
8036
8037/**
8038 * Closes the last opened image file in HDD container.
8039 * If previous image file was opened in read-only mode (the normal case) and
8040 * the last opened image is in read-write mode then the previous image will be
8041 * reopened in read/write mode.
8042 *
8043 * @returns VBox status code.
8044 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8045 * @param pDisk Pointer to HDD container.
8046 * @param fDelete If true, delete the image from the host disk.
8047 */
8048VBOXDDU_DECL(int) VDClose(PVBOXHDD pDisk, bool fDelete)
8049{
8050 int rc = VINF_SUCCESS;
8051 int rc2;
8052 bool fLockWrite = false;
8053
8054 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8055 do
8056 {
8057 /* sanity check */
8058 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8059 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8060
8061 /* Not worth splitting this up into a read lock phase and write
8062 * lock phase, as closing an image is a relatively fast operation
8063 * dominated by the part which needs the write lock. */
8064 rc2 = vdThreadStartWrite(pDisk);
8065 AssertRC(rc2);
8066 fLockWrite = true;
8067
8068 PVDIMAGE pImage = pDisk->pLast;
8069 if (!pImage)
8070 {
8071 rc = VERR_VD_NOT_OPENED;
8072 break;
8073 }
8074
8075 /* Destroy the current discard state first which might still have pending blocks. */
8076 rc = vdDiscardStateDestroy(pDisk);
8077 if (RT_FAILURE(rc))
8078 break;
8079
8080 unsigned uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8081 /* Remove image from list of opened images. */
8082 vdRemoveImageFromList(pDisk, pImage);
8083 /* Close (and optionally delete) image. */
8084 rc = pImage->Backend->pfnClose(pImage->pBackendData, fDelete);
8085 /* Free remaining resources related to the image. */
8086 RTStrFree(pImage->pszFilename);
8087 RTMemFree(pImage);
8088
8089 pImage = pDisk->pLast;
8090 if (!pImage)
8091 break;
8092
8093 /* If disk was previously in read/write mode, make sure it will stay
8094 * like this (if possible) after closing this image. Set the open flags
8095 * accordingly. */
8096 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
8097 {
8098 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8099 uOpenFlags &= ~ VD_OPEN_FLAGS_READONLY;
8100 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
8101 }
8102
8103 /* Cache disk information. */
8104 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
8105
8106 /* Cache PCHS geometry. */
8107 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8108 &pDisk->PCHSGeometry);
8109 if (RT_FAILURE(rc2))
8110 {
8111 pDisk->PCHSGeometry.cCylinders = 0;
8112 pDisk->PCHSGeometry.cHeads = 0;
8113 pDisk->PCHSGeometry.cSectors = 0;
8114 }
8115 else
8116 {
8117 /* Make sure the PCHS geometry is properly clipped. */
8118 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
8119 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
8120 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
8121 }
8122
8123 /* Cache LCHS geometry. */
8124 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8125 &pDisk->LCHSGeometry);
8126 if (RT_FAILURE(rc2))
8127 {
8128 pDisk->LCHSGeometry.cCylinders = 0;
8129 pDisk->LCHSGeometry.cHeads = 0;
8130 pDisk->LCHSGeometry.cSectors = 0;
8131 }
8132 else
8133 {
8134 /* Make sure the LCHS geometry is properly clipped. */
8135 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
8136 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
8137 }
8138 } while (0);
8139
8140 if (RT_UNLIKELY(fLockWrite))
8141 {
8142 rc2 = vdThreadFinishWrite(pDisk);
8143 AssertRC(rc2);
8144 }
8145
8146 LogFlowFunc(("returns %Rrc\n", rc));
8147 return rc;
8148}
8149
8150/**
8151 * Closes the currently opened cache image file in HDD container.
8152 *
8153 * @return VBox status code.
8154 * @return VERR_VD_NOT_OPENED if no cache is opened in HDD container.
8155 * @param pDisk Pointer to HDD container.
8156 * @param fDelete If true, delete the image from the host disk.
8157 */
8158VBOXDDU_DECL(int) VDCacheClose(PVBOXHDD pDisk, bool fDelete)
8159{
8160 int rc = VINF_SUCCESS;
8161 int rc2;
8162 bool fLockWrite = false;
8163 PVDCACHE pCache = NULL;
8164
8165 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8166
8167 do
8168 {
8169 /* sanity check */
8170 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8171 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8172
8173 rc2 = vdThreadStartWrite(pDisk);
8174 AssertRC(rc2);
8175 fLockWrite = true;
8176
8177 AssertPtrBreakStmt(pDisk->pCache, rc = VERR_VD_CACHE_NOT_FOUND);
8178
8179 pCache = pDisk->pCache;
8180 pDisk->pCache = NULL;
8181
8182 pCache->Backend->pfnClose(pCache->pBackendData, fDelete);
8183 if (pCache->pszFilename)
8184 RTStrFree(pCache->pszFilename);
8185 RTMemFree(pCache);
8186 } while (0);
8187
8188 if (RT_LIKELY(fLockWrite))
8189 {
8190 rc2 = vdThreadFinishWrite(pDisk);
8191 AssertRC(rc2);
8192 }
8193
8194 LogFlowFunc(("returns %Rrc\n", rc));
8195 return rc;
8196}
8197
8198/**
8199 * Removes the last added filter in the HDD container.
8200 *
8201 * @return VBox status code.
8202 * @retval VERR_VD_NOT_OPENED if no filter is present for the disk.
8203 * @param pDisk Pointer to HDD container.
8204 */
8205VBOXDDU_DECL(int) VDFilterRemove(PVBOXHDD pDisk)
8206{
8207 int rc = VINF_SUCCESS;
8208 int rc2;
8209 bool fLockWrite = false;
8210 PVDFILTER pFilter = NULL;
8211
8212 LogFlowFunc(("pDisk=%#p\n", pDisk));
8213
8214 do
8215 {
8216 /* sanity check */
8217 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8218 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8219
8220 rc2 = vdThreadStartWrite(pDisk);
8221 AssertRC(rc2);
8222 fLockWrite = true;
8223
8224 AssertPtrBreakStmt(pDisk->pFilterHead, rc = VERR_VD_NOT_OPENED);
8225
8226 pFilter = pDisk->pFilterTail;
8227 vdRemoveFilterFromList(pDisk, pFilter);
8228
8229 pFilter->pBackend->pfnDestroy(pFilter->pvBackendData);
8230 RTMemFree(pFilter);
8231 } while (0);
8232
8233 if (RT_LIKELY(fLockWrite))
8234 {
8235 rc2 = vdThreadFinishWrite(pDisk);
8236 AssertRC(rc2);
8237 }
8238
8239 LogFlowFunc(("returns %Rrc\n", rc));
8240 return rc;
8241}
8242
8243/**
8244 * Closes all opened image files in HDD container.
8245 *
8246 * @returns VBox status code.
8247 * @param pDisk Pointer to HDD container.
8248 */
8249VBOXDDU_DECL(int) VDCloseAll(PVBOXHDD pDisk)
8250{
8251 int rc = VINF_SUCCESS;
8252 int rc2;
8253 bool fLockWrite = false;
8254
8255 LogFlowFunc(("pDisk=%#p\n", pDisk));
8256 do
8257 {
8258 /* sanity check */
8259 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8260 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8261
8262 /* Lock the entire operation. */
8263 rc2 = vdThreadStartWrite(pDisk);
8264 AssertRC(rc2);
8265 fLockWrite = true;
8266
8267 PVDCACHE pCache = pDisk->pCache;
8268 if (pCache)
8269 {
8270 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
8271 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8272 rc = rc2;
8273
8274 if (pCache->pszFilename)
8275 RTStrFree(pCache->pszFilename);
8276 RTMemFree(pCache);
8277 }
8278
8279 PVDIMAGE pImage = pDisk->pLast;
8280 while (VALID_PTR(pImage))
8281 {
8282 PVDIMAGE pPrev = pImage->pPrev;
8283 /* Remove image from list of opened images. */
8284 vdRemoveImageFromList(pDisk, pImage);
8285 /* Close image. */
8286 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
8287 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8288 rc = rc2;
8289 /* Free remaining resources related to the image. */
8290 RTStrFree(pImage->pszFilename);
8291 RTMemFree(pImage);
8292 pImage = pPrev;
8293 }
8294 Assert(!VALID_PTR(pDisk->pLast));
8295 } while (0);
8296
8297 if (RT_UNLIKELY(fLockWrite))
8298 {
8299 rc2 = vdThreadFinishWrite(pDisk);
8300 AssertRC(rc2);
8301 }
8302
8303 LogFlowFunc(("returns %Rrc\n", rc));
8304 return rc;
8305}
8306
8307/**
8308 * Removes all filters of the given HDD container.
8309 *
8310 * @return VBox status code.
8311 * @param pDisk Pointer to HDD container.
8312 */
8313VBOXDDU_DECL(int) VDFilterRemoveAll(PVBOXHDD pDisk)
8314{
8315 int rc = VINF_SUCCESS;
8316 int rc2;
8317 bool fLockWrite = false;
8318
8319 LogFlowFunc(("pDisk=%#p\n", pDisk));
8320 do
8321 {
8322 /* sanity check */
8323 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8324 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8325
8326 /* Lock the entire operation. */
8327 rc2 = vdThreadStartWrite(pDisk);
8328 AssertRC(rc2);
8329 fLockWrite = true;
8330
8331 PVDFILTER pFilter = pDisk->pFilterTail;
8332 while (VALID_PTR(pFilter))
8333 {
8334 PVDFILTER pPrev = pFilter->pPrev;
8335 vdRemoveFilterFromList(pDisk, pFilter);
8336
8337 rc2 = pFilter->pBackend->pfnDestroy(pFilter->pvBackendData);
8338 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8339 rc = rc2;
8340 /* Free remaining resources related to the image. */
8341 RTMemFree(pFilter);
8342 pFilter = pPrev;
8343 }
8344 Assert(!VALID_PTR(pDisk->pFilterTail));
8345 } while (0);
8346
8347 if (RT_UNLIKELY(fLockWrite))
8348 {
8349 rc2 = vdThreadFinishWrite(pDisk);
8350 AssertRC(rc2);
8351 }
8352
8353 LogFlowFunc(("returns %Rrc\n", rc));
8354 return rc;
8355}
8356
8357/**
8358 * Read data from virtual HDD.
8359 *
8360 * @returns VBox status code.
8361 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8362 * @param pDisk Pointer to HDD container.
8363 * @param uOffset Offset of first reading byte from start of disk.
8364 * @param pvBuf Pointer to buffer for reading data.
8365 * @param cbRead Number of bytes to read.
8366 */
8367VBOXDDU_DECL(int) VDRead(PVBOXHDD pDisk, uint64_t uOffset, void *pvBuf,
8368 size_t cbRead)
8369{
8370 int rc = VINF_SUCCESS;
8371 int rc2;
8372 bool fLockRead = false;
8373
8374 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbRead=%zu\n",
8375 pDisk, uOffset, pvBuf, cbRead));
8376 do
8377 {
8378 /* sanity check */
8379 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8380 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8381
8382 /* Check arguments. */
8383 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8384 ("pvBuf=%#p\n", pvBuf),
8385 rc = VERR_INVALID_PARAMETER);
8386 AssertMsgBreakStmt(cbRead,
8387 ("cbRead=%zu\n", cbRead),
8388 rc = VERR_INVALID_PARAMETER);
8389
8390 rc2 = vdThreadStartRead(pDisk);
8391 AssertRC(rc2);
8392 fLockRead = true;
8393
8394 PVDIMAGE pImage = pDisk->pLast;
8395 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8396
8397 if (uOffset + cbRead > pDisk->cbSize)
8398 {
8399 /* Floppy images might be smaller than the standard expected by
8400 the floppy controller code. So, we won't fail here. */
8401 AssertMsgBreakStmt(pDisk->enmType == VDTYPE_FLOPPY,
8402 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
8403 uOffset, cbRead, pDisk->cbSize),
8404 rc = VERR_EOF);
8405 memset(pvBuf, 0xf6, cbRead); /* f6h = format.com filler byte */
8406 if (uOffset >= pDisk->cbSize)
8407 break;
8408 cbRead = pDisk->cbSize - uOffset;
8409 }
8410
8411 rc = vdReadHelper(pDisk, pImage, uOffset, pvBuf, cbRead,
8412 true /* fUpdateCache */);
8413 } while (0);
8414
8415 if (RT_UNLIKELY(fLockRead))
8416 {
8417 rc2 = vdThreadFinishRead(pDisk);
8418 AssertRC(rc2);
8419 }
8420
8421 LogFlowFunc(("returns %Rrc\n", rc));
8422 return rc;
8423}
8424
8425/**
8426 * Write data to virtual HDD.
8427 *
8428 * @returns VBox status code.
8429 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8430 * @param pDisk Pointer to HDD container.
8431 * @param uOffset Offset of the first byte being
8432 * written from start of disk.
8433 * @param pvBuf Pointer to buffer for writing data.
8434 * @param cbWrite Number of bytes to write.
8435 */
8436VBOXDDU_DECL(int) VDWrite(PVBOXHDD pDisk, uint64_t uOffset, const void *pvBuf,
8437 size_t cbWrite)
8438{
8439 int rc = VINF_SUCCESS;
8440 int rc2;
8441 bool fLockWrite = false;
8442
8443 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbWrite=%zu\n",
8444 pDisk, uOffset, pvBuf, cbWrite));
8445 do
8446 {
8447 /* sanity check */
8448 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8449 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8450
8451 /* Check arguments. */
8452 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8453 ("pvBuf=%#p\n", pvBuf),
8454 rc = VERR_INVALID_PARAMETER);
8455 AssertMsgBreakStmt(cbWrite,
8456 ("cbWrite=%zu\n", cbWrite),
8457 rc = VERR_INVALID_PARAMETER);
8458
8459 rc2 = vdThreadStartWrite(pDisk);
8460 AssertRC(rc2);
8461 fLockWrite = true;
8462
8463 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
8464 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
8465 uOffset, cbWrite, pDisk->cbSize),
8466 rc = VERR_INVALID_PARAMETER);
8467
8468 PVDIMAGE pImage = pDisk->pLast;
8469 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8470
8471 vdSetModifiedFlag(pDisk);
8472 rc = vdWriteHelper(pDisk, pImage, uOffset, pvBuf, cbWrite,
8473 VDIOCTX_FLAGS_READ_UPDATE_CACHE);
8474 if (RT_FAILURE(rc))
8475 break;
8476
8477 /* If there is a merge (in the direction towards a parent) running
8478 * concurrently then we have to also "relay" the write to this parent,
8479 * as the merge position might be already past the position where
8480 * this write is going. The "context" of the write can come from the
8481 * natural chain, since merging either already did or will take care
8482 * of the "other" content which is might be needed to fill the block
8483 * to a full allocation size. The cache doesn't need to be touched
8484 * as this write is covered by the previous one. */
8485 if (RT_UNLIKELY(pDisk->pImageRelay))
8486 rc = vdWriteHelper(pDisk, pDisk->pImageRelay, uOffset,
8487 pvBuf, cbWrite, VDIOCTX_FLAGS_DEFAULT);
8488 } while (0);
8489
8490 if (RT_UNLIKELY(fLockWrite))
8491 {
8492 rc2 = vdThreadFinishWrite(pDisk);
8493 AssertRC(rc2);
8494 }
8495
8496 LogFlowFunc(("returns %Rrc\n", rc));
8497 return rc;
8498}
8499
8500/**
8501 * Make sure the on disk representation of a virtual HDD is up to date.
8502 *
8503 * @returns VBox status code.
8504 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8505 * @param pDisk Pointer to HDD container.
8506 */
8507VBOXDDU_DECL(int) VDFlush(PVBOXHDD pDisk)
8508{
8509 int rc = VINF_SUCCESS;
8510 int rc2;
8511 bool fLockWrite = false;
8512
8513 LogFlowFunc(("pDisk=%#p\n", pDisk));
8514 do
8515 {
8516 /* sanity check */
8517 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8518 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8519
8520 rc2 = vdThreadStartWrite(pDisk);
8521 AssertRC(rc2);
8522 fLockWrite = true;
8523
8524 PVDIMAGE pImage = pDisk->pLast;
8525 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8526
8527 VDIOCTX IoCtx;
8528 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
8529
8530 rc = RTSemEventCreate(&hEventComplete);
8531 if (RT_FAILURE(rc))
8532 break;
8533
8534 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, pImage, NULL,
8535 NULL, vdFlushHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
8536
8537 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
8538 IoCtx.Type.Root.pvUser1 = pDisk;
8539 IoCtx.Type.Root.pvUser2 = hEventComplete;
8540 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
8541
8542 RTSemEventDestroy(hEventComplete);
8543 } while (0);
8544
8545 if (RT_UNLIKELY(fLockWrite))
8546 {
8547 rc2 = vdThreadFinishWrite(pDisk);
8548 AssertRC(rc2);
8549 }
8550
8551 LogFlowFunc(("returns %Rrc\n", rc));
8552 return rc;
8553}
8554
8555/**
8556 * Get number of opened images in HDD container.
8557 *
8558 * @returns Number of opened images for HDD container. 0 if no images have been opened.
8559 * @param pDisk Pointer to HDD container.
8560 */
8561VBOXDDU_DECL(unsigned) VDGetCount(PVBOXHDD pDisk)
8562{
8563 unsigned cImages;
8564 int rc2;
8565 bool fLockRead = false;
8566
8567 LogFlowFunc(("pDisk=%#p\n", pDisk));
8568 do
8569 {
8570 /* sanity check */
8571 AssertPtrBreakStmt(pDisk, cImages = 0);
8572 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8573
8574 rc2 = vdThreadStartRead(pDisk);
8575 AssertRC(rc2);
8576 fLockRead = true;
8577
8578 cImages = pDisk->cImages;
8579 } while (0);
8580
8581 if (RT_UNLIKELY(fLockRead))
8582 {
8583 rc2 = vdThreadFinishRead(pDisk);
8584 AssertRC(rc2);
8585 }
8586
8587 LogFlowFunc(("returns %u\n", cImages));
8588 return cImages;
8589}
8590
8591/**
8592 * Get read/write mode of HDD container.
8593 *
8594 * @returns Virtual disk ReadOnly status.
8595 * @returns true if no image is opened in HDD container.
8596 * @param pDisk Pointer to HDD container.
8597 */
8598VBOXDDU_DECL(bool) VDIsReadOnly(PVBOXHDD pDisk)
8599{
8600 bool fReadOnly;
8601 int rc2;
8602 bool fLockRead = false;
8603
8604 LogFlowFunc(("pDisk=%#p\n", pDisk));
8605 do
8606 {
8607 /* sanity check */
8608 AssertPtrBreakStmt(pDisk, fReadOnly = false);
8609 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8610
8611 rc2 = vdThreadStartRead(pDisk);
8612 AssertRC(rc2);
8613 fLockRead = true;
8614
8615 PVDIMAGE pImage = pDisk->pLast;
8616 AssertPtrBreakStmt(pImage, fReadOnly = true);
8617
8618 unsigned uOpenFlags;
8619 uOpenFlags = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
8620 fReadOnly = !!(uOpenFlags & VD_OPEN_FLAGS_READONLY);
8621 } while (0);
8622
8623 if (RT_UNLIKELY(fLockRead))
8624 {
8625 rc2 = vdThreadFinishRead(pDisk);
8626 AssertRC(rc2);
8627 }
8628
8629 LogFlowFunc(("returns %d\n", fReadOnly));
8630 return fReadOnly;
8631}
8632
8633/**
8634 * Get sector size of an image in HDD container.
8635 *
8636 * @return Virtual disk sector size in bytes.
8637 * @return 0 if image with specified number was not opened.
8638 * @param pDisk Pointer to HDD container.
8639 * @param nImage Image number, counts from 0. 0 is always base image of container.
8640 */
8641VBOXDDU_DECL(uint32_t) VDGetSectorSize(PVBOXHDD pDisk, unsigned nImage)
8642{
8643 uint64_t cbSector;
8644 int rc2;
8645 bool fLockRead = false;
8646
8647 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8648 do
8649 {
8650 /* sanity check */
8651 AssertPtrBreakStmt(pDisk, cbSector = 0);
8652 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8653
8654 rc2 = vdThreadStartRead(pDisk);
8655 AssertRC(rc2);
8656 fLockRead = true;
8657
8658 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8659 AssertPtrBreakStmt(pImage, cbSector = 0);
8660 cbSector = pImage->Backend->pfnGetSectorSize(pImage->pBackendData);
8661 } while (0);
8662
8663 if (RT_UNLIKELY(fLockRead))
8664 {
8665 rc2 = vdThreadFinishRead(pDisk);
8666 AssertRC(rc2);
8667 }
8668
8669 LogFlowFunc(("returns %u\n", cbSector));
8670 return cbSector;
8671}
8672
8673/**
8674 * Get total capacity of an image in HDD container.
8675 *
8676 * @returns Virtual disk size in bytes.
8677 * @returns 0 if no image with specified number was not opened.
8678 * @param pDisk Pointer to HDD container.
8679 * @param nImage Image number, counts from 0. 0 is always base image of container.
8680 */
8681VBOXDDU_DECL(uint64_t) VDGetSize(PVBOXHDD pDisk, unsigned nImage)
8682{
8683 uint64_t cbSize;
8684 int rc2;
8685 bool fLockRead = false;
8686
8687 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8688 do
8689 {
8690 /* sanity check */
8691 AssertPtrBreakStmt(pDisk, cbSize = 0);
8692 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8693
8694 rc2 = vdThreadStartRead(pDisk);
8695 AssertRC(rc2);
8696 fLockRead = true;
8697
8698 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8699 AssertPtrBreakStmt(pImage, cbSize = 0);
8700 cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
8701 } while (0);
8702
8703 if (RT_UNLIKELY(fLockRead))
8704 {
8705 rc2 = vdThreadFinishRead(pDisk);
8706 AssertRC(rc2);
8707 }
8708
8709 LogFlowFunc(("returns %llu\n", cbSize));
8710 return cbSize;
8711}
8712
8713/**
8714 * Get total file size of an image in HDD container.
8715 *
8716 * @returns Virtual disk size in bytes.
8717 * @returns 0 if no image is opened in HDD container.
8718 * @param pDisk Pointer to HDD container.
8719 * @param nImage Image number, counts from 0. 0 is always base image of container.
8720 */
8721VBOXDDU_DECL(uint64_t) VDGetFileSize(PVBOXHDD pDisk, unsigned nImage)
8722{
8723 uint64_t cbSize;
8724 int rc2;
8725 bool fLockRead = false;
8726
8727 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8728 do
8729 {
8730 /* sanity check */
8731 AssertPtrBreakStmt(pDisk, cbSize = 0);
8732 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8733
8734 rc2 = vdThreadStartRead(pDisk);
8735 AssertRC(rc2);
8736 fLockRead = true;
8737
8738 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8739 AssertPtrBreakStmt(pImage, cbSize = 0);
8740 cbSize = pImage->Backend->pfnGetFileSize(pImage->pBackendData);
8741 } while (0);
8742
8743 if (RT_UNLIKELY(fLockRead))
8744 {
8745 rc2 = vdThreadFinishRead(pDisk);
8746 AssertRC(rc2);
8747 }
8748
8749 LogFlowFunc(("returns %llu\n", cbSize));
8750 return cbSize;
8751}
8752
8753/**
8754 * Get virtual disk PCHS geometry stored in HDD container.
8755 *
8756 * @returns VBox status code.
8757 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8758 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8759 * @param pDisk Pointer to HDD container.
8760 * @param nImage Image number, counts from 0. 0 is always base image of container.
8761 * @param pPCHSGeometry Where to store PCHS geometry. Not NULL.
8762 */
8763VBOXDDU_DECL(int) VDGetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8764 PVDGEOMETRY pPCHSGeometry)
8765{
8766 int rc = VINF_SUCCESS;
8767 int rc2;
8768 bool fLockRead = false;
8769
8770 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p\n",
8771 pDisk, nImage, pPCHSGeometry));
8772 do
8773 {
8774 /* sanity check */
8775 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8776 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8777
8778 /* Check arguments. */
8779 AssertMsgBreakStmt(VALID_PTR(pPCHSGeometry),
8780 ("pPCHSGeometry=%#p\n", pPCHSGeometry),
8781 rc = VERR_INVALID_PARAMETER);
8782
8783 rc2 = vdThreadStartRead(pDisk);
8784 AssertRC(rc2);
8785 fLockRead = true;
8786
8787 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8788 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8789
8790 if (pImage == pDisk->pLast)
8791 {
8792 /* Use cached information if possible. */
8793 if (pDisk->PCHSGeometry.cCylinders != 0)
8794 *pPCHSGeometry = pDisk->PCHSGeometry;
8795 else
8796 rc = VERR_VD_GEOMETRY_NOT_SET;
8797 }
8798 else
8799 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8800 pPCHSGeometry);
8801 } while (0);
8802
8803 if (RT_UNLIKELY(fLockRead))
8804 {
8805 rc2 = vdThreadFinishRead(pDisk);
8806 AssertRC(rc2);
8807 }
8808
8809 LogFlowFunc(("%Rrc (PCHS=%u/%u/%u)\n", rc,
8810 pDisk->PCHSGeometry.cCylinders, pDisk->PCHSGeometry.cHeads,
8811 pDisk->PCHSGeometry.cSectors));
8812 return rc;
8813}
8814
8815/**
8816 * Store virtual disk PCHS geometry in HDD container.
8817 *
8818 * Note that in case of unrecoverable error all images in HDD container will be closed.
8819 *
8820 * @returns VBox status code.
8821 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8822 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8823 * @param pDisk Pointer to HDD container.
8824 * @param nImage Image number, counts from 0. 0 is always base image of container.
8825 * @param pPCHSGeometry Where to load PCHS geometry from. Not NULL.
8826 */
8827VBOXDDU_DECL(int) VDSetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8828 PCVDGEOMETRY pPCHSGeometry)
8829{
8830 int rc = VINF_SUCCESS;
8831 int rc2;
8832 bool fLockWrite = false;
8833
8834 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p PCHS=%u/%u/%u\n",
8835 pDisk, nImage, pPCHSGeometry, pPCHSGeometry->cCylinders,
8836 pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
8837 do
8838 {
8839 /* sanity check */
8840 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8841 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8842
8843 /* Check arguments. */
8844 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
8845 && pPCHSGeometry->cHeads <= 16
8846 && pPCHSGeometry->cSectors <= 63,
8847 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
8848 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
8849 pPCHSGeometry->cSectors),
8850 rc = VERR_INVALID_PARAMETER);
8851
8852 rc2 = vdThreadStartWrite(pDisk);
8853 AssertRC(rc2);
8854 fLockWrite = true;
8855
8856 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8857 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8858
8859 if (pImage == pDisk->pLast)
8860 {
8861 if ( pPCHSGeometry->cCylinders != pDisk->PCHSGeometry.cCylinders
8862 || pPCHSGeometry->cHeads != pDisk->PCHSGeometry.cHeads
8863 || pPCHSGeometry->cSectors != pDisk->PCHSGeometry.cSectors)
8864 {
8865 /* Only update geometry if it is changed. Avoids similar checks
8866 * in every backend. Most of the time the new geometry is set
8867 * to the previous values, so no need to go through the hassle
8868 * of updating an image which could be opened in read-only mode
8869 * right now. */
8870 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
8871 pPCHSGeometry);
8872
8873 /* Cache new geometry values in any case. */
8874 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8875 &pDisk->PCHSGeometry);
8876 if (RT_FAILURE(rc2))
8877 {
8878 pDisk->PCHSGeometry.cCylinders = 0;
8879 pDisk->PCHSGeometry.cHeads = 0;
8880 pDisk->PCHSGeometry.cSectors = 0;
8881 }
8882 else
8883 {
8884 /* Make sure the CHS geometry is properly clipped. */
8885 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 255);
8886 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
8887 }
8888 }
8889 }
8890 else
8891 {
8892 VDGEOMETRY PCHS;
8893 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8894 &PCHS);
8895 if ( RT_FAILURE(rc)
8896 || pPCHSGeometry->cCylinders != PCHS.cCylinders
8897 || pPCHSGeometry->cHeads != PCHS.cHeads
8898 || pPCHSGeometry->cSectors != PCHS.cSectors)
8899 {
8900 /* Only update geometry if it is changed. Avoids similar checks
8901 * in every backend. Most of the time the new geometry is set
8902 * to the previous values, so no need to go through the hassle
8903 * of updating an image which could be opened in read-only mode
8904 * right now. */
8905 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
8906 pPCHSGeometry);
8907 }
8908 }
8909 } while (0);
8910
8911 if (RT_UNLIKELY(fLockWrite))
8912 {
8913 rc2 = vdThreadFinishWrite(pDisk);
8914 AssertRC(rc2);
8915 }
8916
8917 LogFlowFunc(("returns %Rrc\n", rc));
8918 return rc;
8919}
8920
8921/**
8922 * Get virtual disk LCHS geometry stored in HDD container.
8923 *
8924 * @returns VBox status code.
8925 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8926 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8927 * @param pDisk Pointer to HDD container.
8928 * @param nImage Image number, counts from 0. 0 is always base image of container.
8929 * @param pLCHSGeometry Where to store LCHS geometry. Not NULL.
8930 */
8931VBOXDDU_DECL(int) VDGetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8932 PVDGEOMETRY pLCHSGeometry)
8933{
8934 int rc = VINF_SUCCESS;
8935 int rc2;
8936 bool fLockRead = false;
8937
8938 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p\n",
8939 pDisk, nImage, pLCHSGeometry));
8940 do
8941 {
8942 /* sanity check */
8943 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8944 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8945
8946 /* Check arguments. */
8947 AssertMsgBreakStmt(VALID_PTR(pLCHSGeometry),
8948 ("pLCHSGeometry=%#p\n", pLCHSGeometry),
8949 rc = VERR_INVALID_PARAMETER);
8950
8951 rc2 = vdThreadStartRead(pDisk);
8952 AssertRC(rc2);
8953 fLockRead = true;
8954
8955 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8956 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8957
8958 if (pImage == pDisk->pLast)
8959 {
8960 /* Use cached information if possible. */
8961 if (pDisk->LCHSGeometry.cCylinders != 0)
8962 *pLCHSGeometry = pDisk->LCHSGeometry;
8963 else
8964 rc = VERR_VD_GEOMETRY_NOT_SET;
8965 }
8966 else
8967 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8968 pLCHSGeometry);
8969 } while (0);
8970
8971 if (RT_UNLIKELY(fLockRead))
8972 {
8973 rc2 = vdThreadFinishRead(pDisk);
8974 AssertRC(rc2);
8975 }
8976
8977 LogFlowFunc((": %Rrc (LCHS=%u/%u/%u)\n", rc,
8978 pDisk->LCHSGeometry.cCylinders, pDisk->LCHSGeometry.cHeads,
8979 pDisk->LCHSGeometry.cSectors));
8980 return rc;
8981}
8982
8983/**
8984 * Store virtual disk LCHS geometry in HDD container.
8985 *
8986 * Note that in case of unrecoverable error all images in HDD container will be closed.
8987 *
8988 * @returns VBox status code.
8989 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8990 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8991 * @param pDisk Pointer to HDD container.
8992 * @param nImage Image number, counts from 0. 0 is always base image of container.
8993 * @param pLCHSGeometry Where to load LCHS geometry from. Not NULL.
8994 */
8995VBOXDDU_DECL(int) VDSetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
8996 PCVDGEOMETRY pLCHSGeometry)
8997{
8998 int rc = VINF_SUCCESS;
8999 int rc2;
9000 bool fLockWrite = false;
9001
9002 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p LCHS=%u/%u/%u\n",
9003 pDisk, nImage, pLCHSGeometry, pLCHSGeometry->cCylinders,
9004 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
9005 do
9006 {
9007 /* sanity check */
9008 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9009 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9010
9011 /* Check arguments. */
9012 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
9013 && pLCHSGeometry->cHeads <= 255
9014 && pLCHSGeometry->cSectors <= 63,
9015 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
9016 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
9017 pLCHSGeometry->cSectors),
9018 rc = VERR_INVALID_PARAMETER);
9019
9020 rc2 = vdThreadStartWrite(pDisk);
9021 AssertRC(rc2);
9022 fLockWrite = true;
9023
9024 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9025 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9026
9027 if (pImage == pDisk->pLast)
9028 {
9029 if ( pLCHSGeometry->cCylinders != pDisk->LCHSGeometry.cCylinders
9030 || pLCHSGeometry->cHeads != pDisk->LCHSGeometry.cHeads
9031 || pLCHSGeometry->cSectors != pDisk->LCHSGeometry.cSectors)
9032 {
9033 /* Only update geometry if it is changed. Avoids similar checks
9034 * in every backend. Most of the time the new geometry is set
9035 * to the previous values, so no need to go through the hassle
9036 * of updating an image which could be opened in read-only mode
9037 * right now. */
9038 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9039 pLCHSGeometry);
9040
9041 /* Cache new geometry values in any case. */
9042 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9043 &pDisk->LCHSGeometry);
9044 if (RT_FAILURE(rc2))
9045 {
9046 pDisk->LCHSGeometry.cCylinders = 0;
9047 pDisk->LCHSGeometry.cHeads = 0;
9048 pDisk->LCHSGeometry.cSectors = 0;
9049 }
9050 else
9051 {
9052 /* Make sure the CHS geometry is properly clipped. */
9053 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
9054 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
9055 }
9056 }
9057 }
9058 else
9059 {
9060 VDGEOMETRY LCHS;
9061 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9062 &LCHS);
9063 if ( RT_FAILURE(rc)
9064 || pLCHSGeometry->cCylinders != LCHS.cCylinders
9065 || pLCHSGeometry->cHeads != LCHS.cHeads
9066 || pLCHSGeometry->cSectors != LCHS.cSectors)
9067 {
9068 /* Only update geometry if it is changed. Avoids similar checks
9069 * in every backend. Most of the time the new geometry is set
9070 * to the previous values, so no need to go through the hassle
9071 * of updating an image which could be opened in read-only mode
9072 * right now. */
9073 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9074 pLCHSGeometry);
9075 }
9076 }
9077 } while (0);
9078
9079 if (RT_UNLIKELY(fLockWrite))
9080 {
9081 rc2 = vdThreadFinishWrite(pDisk);
9082 AssertRC(rc2);
9083 }
9084
9085 LogFlowFunc(("returns %Rrc\n", rc));
9086 return rc;
9087}
9088
9089/**
9090 * Get version of image in HDD container.
9091 *
9092 * @returns VBox status code.
9093 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9094 * @param pDisk Pointer to HDD container.
9095 * @param nImage Image number, counts from 0. 0 is always base image of container.
9096 * @param puVersion Where to store the image version.
9097 */
9098VBOXDDU_DECL(int) VDGetVersion(PVBOXHDD pDisk, unsigned nImage,
9099 unsigned *puVersion)
9100{
9101 int rc = VINF_SUCCESS;
9102 int rc2;
9103 bool fLockRead = false;
9104
9105 LogFlowFunc(("pDisk=%#p nImage=%u puVersion=%#p\n",
9106 pDisk, nImage, puVersion));
9107 do
9108 {
9109 /* sanity check */
9110 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9111 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9112
9113 /* Check arguments. */
9114 AssertMsgBreakStmt(VALID_PTR(puVersion),
9115 ("puVersion=%#p\n", puVersion),
9116 rc = VERR_INVALID_PARAMETER);
9117
9118 rc2 = vdThreadStartRead(pDisk);
9119 AssertRC(rc2);
9120 fLockRead = true;
9121
9122 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9123 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9124
9125 *puVersion = pImage->Backend->pfnGetVersion(pImage->pBackendData);
9126 } while (0);
9127
9128 if (RT_UNLIKELY(fLockRead))
9129 {
9130 rc2 = vdThreadFinishRead(pDisk);
9131 AssertRC(rc2);
9132 }
9133
9134 LogFlowFunc(("returns %Rrc uVersion=%#x\n", rc, *puVersion));
9135 return rc;
9136}
9137
9138/**
9139 * List the capabilities of image backend in HDD container.
9140 *
9141 * @returns VBox status code.
9142 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9143 * @param pDisk Pointer to the HDD container.
9144 * @param nImage Image number, counts from 0. 0 is always base image of container.
9145 * @param pbackendInfo Where to store the backend information.
9146 */
9147VBOXDDU_DECL(int) VDBackendInfoSingle(PVBOXHDD pDisk, unsigned nImage,
9148 PVDBACKENDINFO pBackendInfo)
9149{
9150 int rc = VINF_SUCCESS;
9151 int rc2;
9152 bool fLockRead = false;
9153
9154 LogFlowFunc(("pDisk=%#p nImage=%u pBackendInfo=%#p\n",
9155 pDisk, nImage, pBackendInfo));
9156 do
9157 {
9158 /* sanity check */
9159 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9160 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9161
9162 /* Check arguments. */
9163 AssertMsgBreakStmt(VALID_PTR(pBackendInfo),
9164 ("pBackendInfo=%#p\n", pBackendInfo),
9165 rc = VERR_INVALID_PARAMETER);
9166
9167 rc2 = vdThreadStartRead(pDisk);
9168 AssertRC(rc2);
9169 fLockRead = true;
9170
9171 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9172 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9173
9174 pBackendInfo->pszBackend = pImage->Backend->pszBackendName;
9175 pBackendInfo->uBackendCaps = pImage->Backend->uBackendCaps;
9176 pBackendInfo->paFileExtensions = pImage->Backend->paFileExtensions;
9177 pBackendInfo->paConfigInfo = pImage->Backend->paConfigInfo;
9178 } while (0);
9179
9180 if (RT_UNLIKELY(fLockRead))
9181 {
9182 rc2 = vdThreadFinishRead(pDisk);
9183 AssertRC(rc2);
9184 }
9185
9186 LogFlowFunc(("returns %Rrc\n", rc));
9187 return rc;
9188}
9189
9190/**
9191 * Get flags of image in HDD container.
9192 *
9193 * @returns VBox status code.
9194 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9195 * @param pDisk Pointer to HDD container.
9196 * @param nImage Image number, counts from 0. 0 is always base image of container.
9197 * @param puImageFlags Where to store the image flags.
9198 */
9199VBOXDDU_DECL(int) VDGetImageFlags(PVBOXHDD pDisk, unsigned nImage,
9200 unsigned *puImageFlags)
9201{
9202 int rc = VINF_SUCCESS;
9203 int rc2;
9204 bool fLockRead = false;
9205
9206 LogFlowFunc(("pDisk=%#p nImage=%u puImageFlags=%#p\n",
9207 pDisk, nImage, puImageFlags));
9208 do
9209 {
9210 /* sanity check */
9211 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9212 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9213
9214 /* Check arguments. */
9215 AssertMsgBreakStmt(VALID_PTR(puImageFlags),
9216 ("puImageFlags=%#p\n", puImageFlags),
9217 rc = VERR_INVALID_PARAMETER);
9218
9219 rc2 = vdThreadStartRead(pDisk);
9220 AssertRC(rc2);
9221 fLockRead = true;
9222
9223 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9224 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9225
9226 *puImageFlags = pImage->uImageFlags;
9227 } while (0);
9228
9229 if (RT_UNLIKELY(fLockRead))
9230 {
9231 rc2 = vdThreadFinishRead(pDisk);
9232 AssertRC(rc2);
9233 }
9234
9235 LogFlowFunc(("returns %Rrc uImageFlags=%#x\n", rc, *puImageFlags));
9236 return rc;
9237}
9238
9239/**
9240 * Get open flags of image in HDD container.
9241 *
9242 * @returns VBox status code.
9243 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9244 * @param pDisk Pointer to HDD container.
9245 * @param nImage Image number, counts from 0. 0 is always base image of container.
9246 * @param puOpenFlags Where to store the image open flags.
9247 */
9248VBOXDDU_DECL(int) VDGetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
9249 unsigned *puOpenFlags)
9250{
9251 int rc = VINF_SUCCESS;
9252 int rc2;
9253 bool fLockRead = false;
9254
9255 LogFlowFunc(("pDisk=%#p nImage=%u puOpenFlags=%#p\n",
9256 pDisk, nImage, puOpenFlags));
9257 do
9258 {
9259 /* sanity check */
9260 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9261 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9262
9263 /* Check arguments. */
9264 AssertMsgBreakStmt(VALID_PTR(puOpenFlags),
9265 ("puOpenFlags=%#p\n", puOpenFlags),
9266 rc = VERR_INVALID_PARAMETER);
9267
9268 rc2 = vdThreadStartRead(pDisk);
9269 AssertRC(rc2);
9270 fLockRead = true;
9271
9272 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9273 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9274
9275 *puOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
9276 } while (0);
9277
9278 if (RT_UNLIKELY(fLockRead))
9279 {
9280 rc2 = vdThreadFinishRead(pDisk);
9281 AssertRC(rc2);
9282 }
9283
9284 LogFlowFunc(("returns %Rrc uOpenFlags=%#x\n", rc, *puOpenFlags));
9285 return rc;
9286}
9287
9288/**
9289 * Set open flags of image in HDD container.
9290 * This operation may cause file locking changes and/or files being reopened.
9291 * Note that in case of unrecoverable error all images in HDD container will be closed.
9292 *
9293 * @returns VBox status code.
9294 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9295 * @param pDisk Pointer to HDD container.
9296 * @param nImage Image number, counts from 0. 0 is always base image of container.
9297 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
9298 */
9299VBOXDDU_DECL(int) VDSetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
9300 unsigned uOpenFlags)
9301{
9302 int rc;
9303 int rc2;
9304 bool fLockWrite = false;
9305
9306 LogFlowFunc(("pDisk=%#p uOpenFlags=%#u\n", pDisk, uOpenFlags));
9307 do
9308 {
9309 /* sanity check */
9310 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9311 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9312
9313 /* Check arguments. */
9314 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
9315 ("uOpenFlags=%#x\n", uOpenFlags),
9316 rc = VERR_INVALID_PARAMETER);
9317
9318 rc2 = vdThreadStartWrite(pDisk);
9319 AssertRC(rc2);
9320 fLockWrite = true;
9321
9322 /* Destroy any discard state because the image might be changed to readonly mode. */
9323 rc = vdDiscardStateDestroy(pDisk);
9324 if (RT_FAILURE(rc))
9325 break;
9326
9327 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9328 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9329
9330 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData,
9331 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS));
9332 if (RT_SUCCESS(rc))
9333 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
9334 } while (0);
9335
9336 if (RT_UNLIKELY(fLockWrite))
9337 {
9338 rc2 = vdThreadFinishWrite(pDisk);
9339 AssertRC(rc2);
9340 }
9341
9342 LogFlowFunc(("returns %Rrc\n", rc));
9343 return rc;
9344}
9345
9346/**
9347 * Get base filename of image in HDD container. Some image formats use
9348 * other filenames as well, so don't use this for anything but informational
9349 * purposes.
9350 *
9351 * @returns VBox status code.
9352 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9353 * @returns VERR_BUFFER_OVERFLOW if pszFilename buffer too small to hold filename.
9354 * @param pDisk Pointer to HDD container.
9355 * @param nImage Image number, counts from 0. 0 is always base image of container.
9356 * @param pszFilename Where to store the image file name.
9357 * @param cbFilename Size of buffer pszFilename points to.
9358 */
9359VBOXDDU_DECL(int) VDGetFilename(PVBOXHDD pDisk, unsigned nImage,
9360 char *pszFilename, unsigned cbFilename)
9361{
9362 int rc;
9363 int rc2;
9364 bool fLockRead = false;
9365
9366 LogFlowFunc(("pDisk=%#p nImage=%u pszFilename=%#p cbFilename=%u\n",
9367 pDisk, nImage, pszFilename, cbFilename));
9368 do
9369 {
9370 /* sanity check */
9371 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9372 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9373
9374 /* Check arguments. */
9375 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
9376 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
9377 rc = VERR_INVALID_PARAMETER);
9378 AssertMsgBreakStmt(cbFilename,
9379 ("cbFilename=%u\n", cbFilename),
9380 rc = VERR_INVALID_PARAMETER);
9381
9382 rc2 = vdThreadStartRead(pDisk);
9383 AssertRC(rc2);
9384 fLockRead = true;
9385
9386 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9387 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9388
9389 size_t cb = strlen(pImage->pszFilename);
9390 if (cb <= cbFilename)
9391 {
9392 strcpy(pszFilename, pImage->pszFilename);
9393 rc = VINF_SUCCESS;
9394 }
9395 else
9396 {
9397 strncpy(pszFilename, pImage->pszFilename, cbFilename - 1);
9398 pszFilename[cbFilename - 1] = '\0';
9399 rc = VERR_BUFFER_OVERFLOW;
9400 }
9401 } while (0);
9402
9403 if (RT_UNLIKELY(fLockRead))
9404 {
9405 rc2 = vdThreadFinishRead(pDisk);
9406 AssertRC(rc2);
9407 }
9408
9409 LogFlowFunc(("returns %Rrc, pszFilename=\"%s\"\n", rc, pszFilename));
9410 return rc;
9411}
9412
9413/**
9414 * Get the comment line of image in HDD container.
9415 *
9416 * @returns VBox status code.
9417 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9418 * @returns VERR_BUFFER_OVERFLOW if pszComment buffer too small to hold comment text.
9419 * @param pDisk Pointer to HDD container.
9420 * @param nImage Image number, counts from 0. 0 is always base image of container.
9421 * @param pszComment Where to store the comment string of image. NULL is ok.
9422 * @param cbComment The size of pszComment buffer. 0 is ok.
9423 */
9424VBOXDDU_DECL(int) VDGetComment(PVBOXHDD pDisk, unsigned nImage,
9425 char *pszComment, unsigned cbComment)
9426{
9427 int rc;
9428 int rc2;
9429 bool fLockRead = false;
9430
9431 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p cbComment=%u\n",
9432 pDisk, nImage, pszComment, cbComment));
9433 do
9434 {
9435 /* sanity check */
9436 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9437 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9438
9439 /* Check arguments. */
9440 AssertMsgBreakStmt(VALID_PTR(pszComment),
9441 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9442 rc = VERR_INVALID_PARAMETER);
9443 AssertMsgBreakStmt(cbComment,
9444 ("cbComment=%u\n", cbComment),
9445 rc = VERR_INVALID_PARAMETER);
9446
9447 rc2 = vdThreadStartRead(pDisk);
9448 AssertRC(rc2);
9449 fLockRead = true;
9450
9451 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9452 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9453
9454 rc = pImage->Backend->pfnGetComment(pImage->pBackendData, pszComment,
9455 cbComment);
9456 } while (0);
9457
9458 if (RT_UNLIKELY(fLockRead))
9459 {
9460 rc2 = vdThreadFinishRead(pDisk);
9461 AssertRC(rc2);
9462 }
9463
9464 LogFlowFunc(("returns %Rrc, pszComment=\"%s\"\n", rc, pszComment));
9465 return rc;
9466}
9467
9468/**
9469 * Changes the comment line of image in HDD container.
9470 *
9471 * @returns VBox status code.
9472 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9473 * @param pDisk Pointer to HDD container.
9474 * @param nImage Image number, counts from 0. 0 is always base image of container.
9475 * @param pszComment New comment string (UTF-8). NULL is allowed to reset the comment.
9476 */
9477VBOXDDU_DECL(int) VDSetComment(PVBOXHDD pDisk, unsigned nImage,
9478 const char *pszComment)
9479{
9480 int rc;
9481 int rc2;
9482 bool fLockWrite = false;
9483
9484 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p \"%s\"\n",
9485 pDisk, nImage, pszComment, pszComment));
9486 do
9487 {
9488 /* sanity check */
9489 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9490 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9491
9492 /* Check arguments. */
9493 AssertMsgBreakStmt(VALID_PTR(pszComment) || pszComment == NULL,
9494 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9495 rc = VERR_INVALID_PARAMETER);
9496
9497 rc2 = vdThreadStartWrite(pDisk);
9498 AssertRC(rc2);
9499 fLockWrite = true;
9500
9501 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9502 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9503
9504 rc = pImage->Backend->pfnSetComment(pImage->pBackendData, pszComment);
9505 } while (0);
9506
9507 if (RT_UNLIKELY(fLockWrite))
9508 {
9509 rc2 = vdThreadFinishWrite(pDisk);
9510 AssertRC(rc2);
9511 }
9512
9513 LogFlowFunc(("returns %Rrc\n", rc));
9514 return rc;
9515}
9516
9517
9518/**
9519 * Get UUID of image in HDD container.
9520 *
9521 * @returns VBox status code.
9522 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9523 * @param pDisk Pointer to HDD container.
9524 * @param nImage Image number, counts from 0. 0 is always base image of container.
9525 * @param pUuid Where to store the image creation UUID.
9526 */
9527VBOXDDU_DECL(int) VDGetUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9528{
9529 int rc;
9530 int rc2;
9531 bool fLockRead = false;
9532
9533 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9534 do
9535 {
9536 /* sanity check */
9537 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9538 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9539
9540 /* Check arguments. */
9541 AssertMsgBreakStmt(VALID_PTR(pUuid),
9542 ("pUuid=%#p\n", pUuid),
9543 rc = VERR_INVALID_PARAMETER);
9544
9545 rc2 = vdThreadStartRead(pDisk);
9546 AssertRC(rc2);
9547 fLockRead = true;
9548
9549 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9550 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9551
9552 rc = pImage->Backend->pfnGetUuid(pImage->pBackendData, pUuid);
9553 } while (0);
9554
9555 if (RT_UNLIKELY(fLockRead))
9556 {
9557 rc2 = vdThreadFinishRead(pDisk);
9558 AssertRC(rc2);
9559 }
9560
9561 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9562 return rc;
9563}
9564
9565/**
9566 * Set the image's UUID. Should not be used by normal applications.
9567 *
9568 * @returns VBox status code.
9569 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9570 * @param pDisk Pointer to HDD container.
9571 * @param nImage Image number, counts from 0. 0 is always base image of container.
9572 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
9573 */
9574VBOXDDU_DECL(int) VDSetUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9575{
9576 int rc;
9577 int rc2;
9578 bool fLockWrite = false;
9579
9580 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9581 pDisk, nImage, pUuid, pUuid));
9582 do
9583 {
9584 /* sanity check */
9585 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9586 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9587
9588 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9589 ("pUuid=%#p\n", pUuid),
9590 rc = VERR_INVALID_PARAMETER);
9591
9592 rc2 = vdThreadStartWrite(pDisk);
9593 AssertRC(rc2);
9594 fLockWrite = true;
9595
9596 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9597 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9598
9599 RTUUID Uuid;
9600 if (!pUuid)
9601 {
9602 RTUuidCreate(&Uuid);
9603 pUuid = &Uuid;
9604 }
9605 rc = pImage->Backend->pfnSetUuid(pImage->pBackendData, pUuid);
9606 } while (0);
9607
9608 if (RT_UNLIKELY(fLockWrite))
9609 {
9610 rc2 = vdThreadFinishWrite(pDisk);
9611 AssertRC(rc2);
9612 }
9613
9614 LogFlowFunc(("returns %Rrc\n", rc));
9615 return rc;
9616}
9617
9618/**
9619 * Get last modification UUID of image in HDD container.
9620 *
9621 * @returns VBox status code.
9622 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9623 * @param pDisk Pointer to HDD container.
9624 * @param nImage Image number, counts from 0. 0 is always base image of container.
9625 * @param pUuid Where to store the image modification UUID.
9626 */
9627VBOXDDU_DECL(int) VDGetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9628{
9629 int rc = VINF_SUCCESS;
9630 int rc2;
9631 bool fLockRead = false;
9632
9633 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9634 do
9635 {
9636 /* sanity check */
9637 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9638 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9639
9640 /* Check arguments. */
9641 AssertMsgBreakStmt(VALID_PTR(pUuid),
9642 ("pUuid=%#p\n", pUuid),
9643 rc = VERR_INVALID_PARAMETER);
9644
9645 rc2 = vdThreadStartRead(pDisk);
9646 AssertRC(rc2);
9647 fLockRead = true;
9648
9649 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9650 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9651
9652 rc = pImage->Backend->pfnGetModificationUuid(pImage->pBackendData,
9653 pUuid);
9654 } while (0);
9655
9656 if (RT_UNLIKELY(fLockRead))
9657 {
9658 rc2 = vdThreadFinishRead(pDisk);
9659 AssertRC(rc2);
9660 }
9661
9662 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9663 return rc;
9664}
9665
9666/**
9667 * Set the image's last modification UUID. Should not be used by normal applications.
9668 *
9669 * @returns VBox status code.
9670 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9671 * @param pDisk Pointer to HDD container.
9672 * @param nImage Image number, counts from 0. 0 is always base image of container.
9673 * @param pUuid New modification UUID of the image. If NULL, a new UUID is created.
9674 */
9675VBOXDDU_DECL(int) VDSetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9676{
9677 int rc;
9678 int rc2;
9679 bool fLockWrite = false;
9680
9681 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9682 pDisk, nImage, pUuid, pUuid));
9683 do
9684 {
9685 /* sanity check */
9686 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9687 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9688
9689 /* Check arguments. */
9690 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9691 ("pUuid=%#p\n", pUuid),
9692 rc = VERR_INVALID_PARAMETER);
9693
9694 rc2 = vdThreadStartWrite(pDisk);
9695 AssertRC(rc2);
9696 fLockWrite = true;
9697
9698 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9699 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9700
9701 RTUUID Uuid;
9702 if (!pUuid)
9703 {
9704 RTUuidCreate(&Uuid);
9705 pUuid = &Uuid;
9706 }
9707 rc = pImage->Backend->pfnSetModificationUuid(pImage->pBackendData,
9708 pUuid);
9709 } while (0);
9710
9711 if (RT_UNLIKELY(fLockWrite))
9712 {
9713 rc2 = vdThreadFinishWrite(pDisk);
9714 AssertRC(rc2);
9715 }
9716
9717 LogFlowFunc(("returns %Rrc\n", rc));
9718 return rc;
9719}
9720
9721/**
9722 * Get parent UUID of image in HDD container.
9723 *
9724 * @returns VBox status code.
9725 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9726 * @param pDisk Pointer to HDD container.
9727 * @param nImage Image number, counts from 0. 0 is always base image of container.
9728 * @param pUuid Where to store the parent image UUID.
9729 */
9730VBOXDDU_DECL(int) VDGetParentUuid(PVBOXHDD pDisk, unsigned nImage,
9731 PRTUUID pUuid)
9732{
9733 int rc = VINF_SUCCESS;
9734 int rc2;
9735 bool fLockRead = false;
9736
9737 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9738 do
9739 {
9740 /* sanity check */
9741 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9742 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9743
9744 /* Check arguments. */
9745 AssertMsgBreakStmt(VALID_PTR(pUuid),
9746 ("pUuid=%#p\n", pUuid),
9747 rc = VERR_INVALID_PARAMETER);
9748
9749 rc2 = vdThreadStartRead(pDisk);
9750 AssertRC(rc2);
9751 fLockRead = true;
9752
9753 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9754 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9755
9756 rc = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, pUuid);
9757 } while (0);
9758
9759 if (RT_UNLIKELY(fLockRead))
9760 {
9761 rc2 = vdThreadFinishRead(pDisk);
9762 AssertRC(rc2);
9763 }
9764
9765 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9766 return rc;
9767}
9768
9769/**
9770 * Set the image's parent UUID. Should not be used by normal applications.
9771 *
9772 * @returns VBox status code.
9773 * @param pDisk Pointer to HDD container.
9774 * @param nImage Image number, counts from 0. 0 is always base image of container.
9775 * @param pUuid New parent UUID of the image. If NULL, a new UUID is created.
9776 */
9777VBOXDDU_DECL(int) VDSetParentUuid(PVBOXHDD pDisk, unsigned nImage,
9778 PCRTUUID pUuid)
9779{
9780 int rc;
9781 int rc2;
9782 bool fLockWrite = false;
9783
9784 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9785 pDisk, nImage, pUuid, pUuid));
9786 do
9787 {
9788 /* sanity check */
9789 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9790 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9791
9792 /* Check arguments. */
9793 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9794 ("pUuid=%#p\n", pUuid),
9795 rc = VERR_INVALID_PARAMETER);
9796
9797 rc2 = vdThreadStartWrite(pDisk);
9798 AssertRC(rc2);
9799 fLockWrite = true;
9800
9801 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9802 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9803
9804 RTUUID Uuid;
9805 if (!pUuid)
9806 {
9807 RTUuidCreate(&Uuid);
9808 pUuid = &Uuid;
9809 }
9810 rc = pImage->Backend->pfnSetParentUuid(pImage->pBackendData, pUuid);
9811 } while (0);
9812
9813 if (RT_UNLIKELY(fLockWrite))
9814 {
9815 rc2 = vdThreadFinishWrite(pDisk);
9816 AssertRC(rc2);
9817 }
9818
9819 LogFlowFunc(("returns %Rrc\n", rc));
9820 return rc;
9821}
9822
9823
9824/**
9825 * Debug helper - dumps all opened images in HDD container into the log file.
9826 *
9827 * @param pDisk Pointer to HDD container.
9828 */
9829VBOXDDU_DECL(void) VDDumpImages(PVBOXHDD pDisk)
9830{
9831 int rc2;
9832 bool fLockRead = false;
9833
9834 do
9835 {
9836 /* sanity check */
9837 AssertPtrBreak(pDisk);
9838 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9839
9840 if (!pDisk->pInterfaceError || !VALID_PTR(pDisk->pInterfaceError->pfnMessage))
9841 pDisk->pInterfaceError->pfnMessage = vdLogMessage;
9842
9843 rc2 = vdThreadStartRead(pDisk);
9844 AssertRC(rc2);
9845 fLockRead = true;
9846
9847 vdMessageWrapper(pDisk, "--- Dumping VD Disk, Images=%u\n", pDisk->cImages);
9848 for (PVDIMAGE pImage = pDisk->pBase; pImage; pImage = pImage->pNext)
9849 {
9850 vdMessageWrapper(pDisk, "Dumping VD image \"%s\" (Backend=%s)\n",
9851 pImage->pszFilename, pImage->Backend->pszBackendName);
9852 pImage->Backend->pfnDump(pImage->pBackendData);
9853 }
9854 } while (0);
9855
9856 if (RT_UNLIKELY(fLockRead))
9857 {
9858 rc2 = vdThreadFinishRead(pDisk);
9859 AssertRC(rc2);
9860 }
9861}
9862
9863
9864VBOXDDU_DECL(int) VDDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges)
9865{
9866 int rc;
9867 int rc2;
9868 bool fLockWrite = false;
9869
9870 LogFlowFunc(("pDisk=%#p paRanges=%#p cRanges=%u\n",
9871 pDisk, paRanges, cRanges));
9872 do
9873 {
9874 /* sanity check */
9875 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9876 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9877
9878 /* Check arguments. */
9879 AssertMsgBreakStmt(cRanges,
9880 ("cRanges=%u\n", cRanges),
9881 rc = VERR_INVALID_PARAMETER);
9882 AssertMsgBreakStmt(VALID_PTR(paRanges),
9883 ("paRanges=%#p\n", paRanges),
9884 rc = VERR_INVALID_PARAMETER);
9885
9886 rc2 = vdThreadStartWrite(pDisk);
9887 AssertRC(rc2);
9888 fLockWrite = true;
9889
9890 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9891
9892 AssertMsgBreakStmt(pDisk->pLast->uOpenFlags & VD_OPEN_FLAGS_DISCARD,
9893 ("Discarding not supported\n"),
9894 rc = VERR_NOT_SUPPORTED);
9895
9896 VDIOCTX IoCtx;
9897 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
9898
9899 rc = RTSemEventCreate(&hEventComplete);
9900 if (RT_FAILURE(rc))
9901 break;
9902
9903 vdIoCtxDiscardInit(&IoCtx, pDisk, paRanges, cRanges,
9904 vdIoCtxSyncComplete, pDisk, hEventComplete, NULL,
9905 vdDiscardHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
9906 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
9907
9908 RTSemEventDestroy(hEventComplete);
9909 } while (0);
9910
9911 if (RT_UNLIKELY(fLockWrite))
9912 {
9913 rc2 = vdThreadFinishWrite(pDisk);
9914 AssertRC(rc2);
9915 }
9916
9917 LogFlowFunc(("returns %Rrc\n", rc));
9918 return rc;
9919}
9920
9921
9922VBOXDDU_DECL(int) VDAsyncRead(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRead,
9923 PCRTSGBUF pcSgBuf,
9924 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9925 void *pvUser1, void *pvUser2)
9926{
9927 int rc = VERR_VD_BLOCK_FREE;
9928 int rc2;
9929 bool fLockRead = false;
9930 PVDIOCTX pIoCtx = NULL;
9931
9932 LogFlowFunc(("pDisk=%#p uOffset=%llu pcSgBuf=%#p cbRead=%zu pvUser1=%#p pvUser2=%#p\n",
9933 pDisk, uOffset, pcSgBuf, cbRead, pvUser1, pvUser2));
9934
9935 do
9936 {
9937 /* sanity check */
9938 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9939 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9940
9941 /* Check arguments. */
9942 AssertMsgBreakStmt(cbRead,
9943 ("cbRead=%zu\n", cbRead),
9944 rc = VERR_INVALID_PARAMETER);
9945 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
9946 ("pcSgBuf=%#p\n", pcSgBuf),
9947 rc = VERR_INVALID_PARAMETER);
9948
9949 rc2 = vdThreadStartRead(pDisk);
9950 AssertRC(rc2);
9951 fLockRead = true;
9952
9953 AssertMsgBreakStmt(uOffset + cbRead <= pDisk->cbSize,
9954 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
9955 uOffset, cbRead, pDisk->cbSize),
9956 rc = VERR_INVALID_PARAMETER);
9957 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
9958
9959 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_READ, uOffset,
9960 cbRead, pDisk->pLast, pcSgBuf,
9961 pfnComplete, pvUser1, pvUser2,
9962 NULL, vdReadHelperAsync,
9963 VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
9964 if (!pIoCtx)
9965 {
9966 rc = VERR_NO_MEMORY;
9967 break;
9968 }
9969
9970 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
9971 if (rc == VINF_VD_ASYNC_IO_FINISHED)
9972 {
9973 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
9974 vdIoCtxFree(pDisk, pIoCtx);
9975 else
9976 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
9977 }
9978 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
9979 vdIoCtxFree(pDisk, pIoCtx);
9980
9981 } while (0);
9982
9983 if (RT_UNLIKELY(fLockRead) && ( rc == VINF_VD_ASYNC_IO_FINISHED
9984 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
9985 {
9986 rc2 = vdThreadFinishRead(pDisk);
9987 AssertRC(rc2);
9988 }
9989
9990 LogFlowFunc(("returns %Rrc\n", rc));
9991 return rc;
9992}
9993
9994
9995VBOXDDU_DECL(int) VDAsyncWrite(PVBOXHDD pDisk, uint64_t uOffset, size_t cbWrite,
9996 PCRTSGBUF pcSgBuf,
9997 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
9998 void *pvUser1, void *pvUser2)
9999{
10000 int rc;
10001 int rc2;
10002 bool fLockWrite = false;
10003 PVDIOCTX pIoCtx = NULL;
10004
10005 LogFlowFunc(("pDisk=%#p uOffset=%llu cSgBuf=%#p cbWrite=%zu pvUser1=%#p pvUser2=%#p\n",
10006 pDisk, uOffset, pcSgBuf, cbWrite, pvUser1, pvUser2));
10007 do
10008 {
10009 /* sanity check */
10010 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10011 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10012
10013 /* Check arguments. */
10014 AssertMsgBreakStmt(cbWrite,
10015 ("cbWrite=%zu\n", cbWrite),
10016 rc = VERR_INVALID_PARAMETER);
10017 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
10018 ("pcSgBuf=%#p\n", pcSgBuf),
10019 rc = VERR_INVALID_PARAMETER);
10020
10021 rc2 = vdThreadStartWrite(pDisk);
10022 AssertRC(rc2);
10023 fLockWrite = true;
10024
10025 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
10026 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
10027 uOffset, cbWrite, pDisk->cbSize),
10028 rc = VERR_INVALID_PARAMETER);
10029 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10030
10031 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_WRITE, uOffset,
10032 cbWrite, pDisk->pLast, pcSgBuf,
10033 pfnComplete, pvUser1, pvUser2,
10034 NULL, vdWriteHelperAsync,
10035 VDIOCTX_FLAGS_DEFAULT);
10036 if (!pIoCtx)
10037 {
10038 rc = VERR_NO_MEMORY;
10039 break;
10040 }
10041
10042 /* Apply write filter chain here. */
10043 rc = vdFilterChainApplyWrite(pDisk, uOffset, cbWrite, pIoCtx);
10044 if (RT_FAILURE(rc))
10045 {
10046 vdIoCtxFree(pDisk, pIoCtx);
10047 break;
10048 }
10049
10050 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10051 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10052 {
10053 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10054 vdIoCtxFree(pDisk, pIoCtx);
10055 else
10056 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10057 }
10058 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10059 vdIoCtxFree(pDisk, pIoCtx);
10060 } while (0);
10061
10062 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10063 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10064 {
10065 rc2 = vdThreadFinishWrite(pDisk);
10066 AssertRC(rc2);
10067 }
10068
10069 LogFlowFunc(("returns %Rrc\n", rc));
10070 return rc;
10071}
10072
10073
10074VBOXDDU_DECL(int) VDAsyncFlush(PVBOXHDD pDisk, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10075 void *pvUser1, void *pvUser2)
10076{
10077 int rc;
10078 int rc2;
10079 bool fLockWrite = false;
10080 PVDIOCTX pIoCtx = NULL;
10081
10082 LogFlowFunc(("pDisk=%#p\n", pDisk));
10083
10084 do
10085 {
10086 /* sanity check */
10087 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10088 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10089
10090 rc2 = vdThreadStartWrite(pDisk);
10091 AssertRC(rc2);
10092 fLockWrite = true;
10093
10094 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10095
10096 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_FLUSH, 0,
10097 0, pDisk->pLast, NULL,
10098 pfnComplete, pvUser1, pvUser2,
10099 NULL, vdFlushHelperAsync,
10100 VDIOCTX_FLAGS_DEFAULT);
10101 if (!pIoCtx)
10102 {
10103 rc = VERR_NO_MEMORY;
10104 break;
10105 }
10106
10107 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10108 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10109 {
10110 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10111 vdIoCtxFree(pDisk, pIoCtx);
10112 else
10113 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10114 }
10115 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10116 vdIoCtxFree(pDisk, pIoCtx);
10117 } while (0);
10118
10119 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10120 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10121 {
10122 rc2 = vdThreadFinishWrite(pDisk);
10123 AssertRC(rc2);
10124 }
10125
10126 LogFlowFunc(("returns %Rrc\n", rc));
10127 return rc;
10128}
10129
10130VBOXDDU_DECL(int) VDAsyncDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges,
10131 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10132 void *pvUser1, void *pvUser2)
10133{
10134 int rc;
10135 int rc2;
10136 bool fLockWrite = false;
10137 PVDIOCTX pIoCtx = NULL;
10138
10139 LogFlowFunc(("pDisk=%#p\n", pDisk));
10140
10141 do
10142 {
10143 /* sanity check */
10144 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10145 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10146
10147 rc2 = vdThreadStartWrite(pDisk);
10148 AssertRC(rc2);
10149 fLockWrite = true;
10150
10151 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10152
10153 pIoCtx = vdIoCtxDiscardAlloc(pDisk, paRanges, cRanges,
10154 pfnComplete, pvUser1, pvUser2, NULL,
10155 vdDiscardHelperAsync,
10156 VDIOCTX_FLAGS_DEFAULT);
10157 if (!pIoCtx)
10158 {
10159 rc = VERR_NO_MEMORY;
10160 break;
10161 }
10162
10163 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10164 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10165 {
10166 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10167 vdIoCtxFree(pDisk, pIoCtx);
10168 else
10169 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10170 }
10171 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10172 vdIoCtxFree(pDisk, pIoCtx);
10173 } while (0);
10174
10175 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10176 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10177 {
10178 rc2 = vdThreadFinishWrite(pDisk);
10179 AssertRC(rc2);
10180 }
10181
10182 LogFlowFunc(("returns %Rrc\n", rc));
10183 return rc;
10184}
10185
10186VBOXDDU_DECL(int) VDRepair(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
10187 const char *pszFilename, const char *pszBackend,
10188 uint32_t fFlags)
10189{
10190 int rc = VERR_NOT_SUPPORTED;
10191 PCVBOXHDDBACKEND pBackend = NULL;
10192 VDINTERFACEIOINT VDIfIoInt;
10193 VDINTERFACEIO VDIfIoFallback;
10194 PVDINTERFACEIO pInterfaceIo;
10195
10196 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
10197 /* Check arguments. */
10198 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
10199 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
10200 VERR_INVALID_PARAMETER);
10201 AssertMsgReturn(VALID_PTR(pszBackend),
10202 ("pszBackend=%#p\n", pszBackend),
10203 VERR_INVALID_PARAMETER);
10204 AssertMsgReturn((fFlags & ~VD_REPAIR_FLAGS_MASK) == 0,
10205 ("fFlags=%#x\n", fFlags),
10206 VERR_INVALID_PARAMETER);
10207
10208 pInterfaceIo = VDIfIoGet(pVDIfsImage);
10209 if (!pInterfaceIo)
10210 {
10211 /*
10212 * Caller doesn't provide an I/O interface, create our own using the
10213 * native file API.
10214 */
10215 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
10216 pInterfaceIo = &VDIfIoFallback;
10217 }
10218
10219 /* Set up the internal I/O interface. */
10220 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
10221 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
10222 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
10223 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
10224 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
10225 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
10226 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
10227 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
10228 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
10229 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
10230 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
10231 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
10232 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
10233 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
10234 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
10235 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
10236 AssertRC(rc);
10237
10238 rc = vdFindBackend(pszBackend, &pBackend);
10239 if (RT_SUCCESS(rc))
10240 {
10241 if (pBackend->pfnRepair)
10242 rc = pBackend->pfnRepair(pszFilename, pVDIfsDisk, pVDIfsImage, fFlags);
10243 else
10244 rc = VERR_VD_IMAGE_REPAIR_NOT_SUPPORTED;
10245 }
10246
10247 LogFlowFunc(("returns %Rrc\n", rc));
10248 return rc;
10249}
10250
Note: See TracBrowser for help on using the repository browser.

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette