VirtualBox

source: vbox/trunk/src/VBox/Storage/VD.cpp@ 52268

Last change on this file since 52268 was 52268, checked in by vboxsync, 11 years ago

VD: Fix read corruption under rare circumstances if a read happens while a write allocating data accesses the same range

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 368.1 KB
Line 
1/* $Id: VD.cpp 52268 2014-08-04 19:20:02Z vboxsync $ */
2/** @file
3 * VBoxHDD - VBox HDD Container implementation.
4 */
5
6/*
7 * Copyright (C) 2006-2013 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18/*******************************************************************************
19* Header Files *
20*******************************************************************************/
21#define LOG_GROUP LOG_GROUP_VD
22#include <VBox/vd.h>
23#include <VBox/err.h>
24#include <VBox/sup.h>
25#include <VBox/log.h>
26
27#include <iprt/alloc.h>
28#include <iprt/assert.h>
29#include <iprt/uuid.h>
30#include <iprt/file.h>
31#include <iprt/string.h>
32#include <iprt/asm.h>
33#include <iprt/ldr.h>
34#include <iprt/dir.h>
35#include <iprt/path.h>
36#include <iprt/param.h>
37#include <iprt/memcache.h>
38#include <iprt/sg.h>
39#include <iprt/list.h>
40#include <iprt/avl.h>
41#include <iprt/semaphore.h>
42
43#include <VBox/vd-plugin.h>
44
45#include "VDBackends.h"
46
47/** Disable dynamic backends on non x86 architectures. This feature
48 * requires the SUPR3 library which is not available there.
49 */
50#if !defined(VBOX_HDD_NO_DYNAMIC_BACKENDS) && !defined(RT_ARCH_X86) && !defined(RT_ARCH_AMD64)
51# define VBOX_HDD_NO_DYNAMIC_BACKENDS
52#endif
53
54#define VBOXHDDDISK_SIGNATURE 0x6f0e2a7d
55
56/** Buffer size used for merging images. */
57#define VD_MERGE_BUFFER_SIZE (16 * _1M)
58
59/** Maximum number of segments in one I/O task. */
60#define VD_IO_TASK_SEGMENTS_MAX 64
61
62/** Threshold after not recently used blocks are removed from the list. */
63#define VD_DISCARD_REMOVE_THRESHOLD (10 * _1M) /** @todo: experiment */
64
65/**
66 * VD async I/O interface storage descriptor.
67 */
68typedef struct VDIIOFALLBACKSTORAGE
69{
70 /** File handle. */
71 RTFILE File;
72 /** Completion callback. */
73 PFNVDCOMPLETED pfnCompleted;
74 /** Thread for async access. */
75 RTTHREAD ThreadAsync;
76} VDIIOFALLBACKSTORAGE, *PVDIIOFALLBACKSTORAGE;
77
78/**
79 * Structure containing everything I/O related
80 * for the image and cache descriptors.
81 */
82typedef struct VDIO
83{
84 /** I/O interface to the upper layer. */
85 PVDINTERFACEIO pInterfaceIo;
86
87 /** Per image internal I/O interface. */
88 VDINTERFACEIOINT VDIfIoInt;
89
90 /** Fallback I/O interface, only used if the caller doesn't provide it. */
91 VDINTERFACEIO VDIfIo;
92
93 /** Opaque backend data. */
94 void *pBackendData;
95 /** Disk this image is part of */
96 PVBOXHDD pDisk;
97 /** Flag whether to ignore flush requests. */
98 bool fIgnoreFlush;
99} VDIO, *PVDIO;
100
101/** Forward declaration of an I/O task */
102typedef struct VDIOTASK *PVDIOTASK;
103
104/**
105 * VBox HDD Container image descriptor.
106 */
107typedef struct VDIMAGE
108{
109 /** Link to parent image descriptor, if any. */
110 struct VDIMAGE *pPrev;
111 /** Link to child image descriptor, if any. */
112 struct VDIMAGE *pNext;
113 /** Container base filename. (UTF-8) */
114 char *pszFilename;
115 /** Data managed by the backend which keeps the actual info. */
116 void *pBackendData;
117 /** Cached sanitized image flags. */
118 unsigned uImageFlags;
119 /** Image open flags (only those handled generically in this code and which
120 * the backends will never ever see). */
121 unsigned uOpenFlags;
122
123 /** Function pointers for the various backend methods. */
124 PCVBOXHDDBACKEND Backend;
125 /** Pointer to list of VD interfaces, per-image. */
126 PVDINTERFACE pVDIfsImage;
127 /** I/O related things. */
128 VDIO VDIo;
129} VDIMAGE, *PVDIMAGE;
130
131/**
132 * uModified bit flags.
133 */
134#define VD_IMAGE_MODIFIED_FLAG RT_BIT(0)
135#define VD_IMAGE_MODIFIED_FIRST RT_BIT(1)
136#define VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE RT_BIT(2)
137
138
139/**
140 * VBox HDD Cache image descriptor.
141 */
142typedef struct VDCACHE
143{
144 /** Cache base filename. (UTF-8) */
145 char *pszFilename;
146 /** Data managed by the backend which keeps the actual info. */
147 void *pBackendData;
148 /** Cached sanitized image flags. */
149 unsigned uImageFlags;
150 /** Image open flags (only those handled generically in this code and which
151 * the backends will never ever see). */
152 unsigned uOpenFlags;
153
154 /** Function pointers for the various backend methods. */
155 PCVDCACHEBACKEND Backend;
156
157 /** Pointer to list of VD interfaces, per-cache. */
158 PVDINTERFACE pVDIfsCache;
159 /** I/O related things. */
160 VDIO VDIo;
161} VDCACHE, *PVDCACHE;
162
163/**
164 * A block waiting for a discard.
165 */
166typedef struct VDDISCARDBLOCK
167{
168 /** AVL core. */
169 AVLRU64NODECORE Core;
170 /** LRU list node. */
171 RTLISTNODE NodeLru;
172 /** Number of bytes to discard. */
173 size_t cbDiscard;
174 /** Bitmap of allocated sectors. */
175 void *pbmAllocated;
176} VDDISCARDBLOCK, *PVDDISCARDBLOCK;
177
178/**
179 * VD discard state.
180 */
181typedef struct VDDISCARDSTATE
182{
183 /** Number of bytes waiting for a discard. */
184 size_t cbDiscarding;
185 /** AVL tree with blocks waiting for a discard.
186 * The uOffset + cbDiscard range is the search key. */
187 PAVLRU64TREE pTreeBlocks;
188 /** LRU list of the least frequently discarded blocks.
189 * If there are to many blocks waiting the least frequently used
190 * will be removed and the range will be set to 0.
191 */
192 RTLISTNODE ListLru;
193} VDDISCARDSTATE, *PVDDISCARDSTATE;
194
195/**
196 * VD filter instance.
197 */
198typedef struct VDFILTER
199{
200 /** Pointer to the previous filter. */
201 struct VDFILTER *pPrev;
202 /** Pointer to the next filter. */
203 struct VDFILTER *pNext;
204 /** Opaque VD filter backend instance data. */
205 void *pvBackendData;
206 /** Pointer to the filter backend interface. */
207 PCVDFILTERBACKEND pBackend;
208 /** Pointer to list of VD interfaces, per-filter. */
209 PVDINTERFACE pVDIfsFilter;
210 /** I/O related things. */
211 VDIO VDIo;
212} VDFILTER;
213/** Pointer to a VD filter instance. */
214typedef VDFILTER *PVDFILTER;
215
216/**
217 * VBox HDD Container main structure, private part.
218 */
219struct VBOXHDD
220{
221 /** Structure signature (VBOXHDDDISK_SIGNATURE). */
222 uint32_t u32Signature;
223
224 /** Image type. */
225 VDTYPE enmType;
226
227 /** Number of opened images. */
228 unsigned cImages;
229
230 /** Base image. */
231 PVDIMAGE pBase;
232
233 /** Last opened image in the chain.
234 * The same as pBase if only one image is used. */
235 PVDIMAGE pLast;
236
237 /** If a merge to one of the parents is running this may be non-NULL
238 * to indicate to what image the writes should be additionally relayed. */
239 PVDIMAGE pImageRelay;
240
241 /** Flags representing the modification state. */
242 unsigned uModified;
243
244 /** Cached size of this disk. */
245 uint64_t cbSize;
246 /** Cached PCHS geometry for this disk. */
247 VDGEOMETRY PCHSGeometry;
248 /** Cached LCHS geometry for this disk. */
249 VDGEOMETRY LCHSGeometry;
250
251 /** Pointer to list of VD interfaces, per-disk. */
252 PVDINTERFACE pVDIfsDisk;
253 /** Pointer to the common interface structure for error reporting. */
254 PVDINTERFACEERROR pInterfaceError;
255 /** Pointer to the optional thread synchronization callbacks. */
256 PVDINTERFACETHREADSYNC pInterfaceThreadSync;
257
258 /** Memory cache for I/O contexts */
259 RTMEMCACHE hMemCacheIoCtx;
260 /** Memory cache for I/O tasks. */
261 RTMEMCACHE hMemCacheIoTask;
262 /** An I/O context is currently using the disk structures
263 * Every I/O context must be placed on one of the lists below. */
264 volatile bool fLocked;
265 /** Head of pending I/O tasks waiting for completion - LIFO order. */
266 volatile PVDIOTASK pIoTasksPendingHead;
267 /** Head of newly queued I/O contexts - LIFO order. */
268 volatile PVDIOCTX pIoCtxHead;
269 /** Head of halted I/O contexts which are given back to generic
270 * disk framework by the backend. - LIFO order. */
271 volatile PVDIOCTX pIoCtxHaltedHead;
272
273 /** Head of blocked I/O contexts, processed only
274 * after pIoCtxLockOwner was freed - LIFO order. */
275 volatile PVDIOCTX pIoCtxBlockedHead;
276 /** I/O context which locked the disk for a growing write or flush request.
277 * Other flush or growing write requests need to wait until
278 * the current one completes. - NIL_VDIOCTX if unlocked. */
279 volatile PVDIOCTX pIoCtxLockOwner;
280 /** If the disk was locked by a growing write, flush or discard request this
281 * contains the start offset to check for interfering I/O while it is in progress. */
282 uint64_t uOffsetStartLocked;
283 /** If the disk was locked by a growing write, flush or discard request this contains
284 * the first non affected offset to check for interfering I/O while it is in progress. */
285 uint64_t uOffsetEndLocked;
286
287 /** Pointer to the L2 disk cache if any. */
288 PVDCACHE pCache;
289 /** Pointer to the discard state if any. */
290 PVDDISCARDSTATE pDiscard;
291
292 /** Pointer to the first filter in the chain. */
293 PVDFILTER pFilterHead;
294 /** Pointer to the last filter in the chain. */
295 PVDFILTER pFilterTail;
296};
297
298# define VD_IS_LOCKED(a_pDisk) \
299 do \
300 { \
301 AssertMsg(a_pDisk->fLocked, \
302 ("Lock not held\n"));\
303 } while(0)
304
305/**
306 * VBox parent read descriptor, used internally for compaction.
307 */
308typedef struct VDPARENTSTATEDESC
309{
310 /** Pointer to disk descriptor. */
311 PVBOXHDD pDisk;
312 /** Pointer to image descriptor. */
313 PVDIMAGE pImage;
314} VDPARENTSTATEDESC, *PVDPARENTSTATEDESC;
315
316/**
317 * Transfer direction.
318 */
319typedef enum VDIOCTXTXDIR
320{
321 /** Read */
322 VDIOCTXTXDIR_READ = 0,
323 /** Write */
324 VDIOCTXTXDIR_WRITE,
325 /** Flush */
326 VDIOCTXTXDIR_FLUSH,
327 /** Discard */
328 VDIOCTXTXDIR_DISCARD,
329 /** 32bit hack */
330 VDIOCTXTXDIR_32BIT_HACK = 0x7fffffff
331} VDIOCTXTXDIR, *PVDIOCTXTXDIR;
332
333/** Transfer function */
334typedef DECLCALLBACK(int) FNVDIOCTXTRANSFER (PVDIOCTX pIoCtx);
335/** Pointer to a transfer function. */
336typedef FNVDIOCTXTRANSFER *PFNVDIOCTXTRANSFER;
337
338/**
339 * I/O context
340 */
341typedef struct VDIOCTX
342{
343 /** Pointer to the next I/O context. */
344 struct VDIOCTX * volatile pIoCtxNext;
345 /** Disk this is request is for. */
346 PVBOXHDD pDisk;
347 /** Return code. */
348 int rcReq;
349 /** Various flags for the I/O context. */
350 uint32_t fFlags;
351 /** Number of data transfers currently pending. */
352 volatile uint32_t cDataTransfersPending;
353 /** How many meta data transfers are pending. */
354 volatile uint32_t cMetaTransfersPending;
355 /** Flag whether the request finished */
356 volatile bool fComplete;
357 /** Temporary allocated memory which is freed
358 * when the context completes. */
359 void *pvAllocation;
360 /** Transfer function. */
361 PFNVDIOCTXTRANSFER pfnIoCtxTransfer;
362 /** Next transfer part after the current one completed. */
363 PFNVDIOCTXTRANSFER pfnIoCtxTransferNext;
364 /** Transfer direction */
365 VDIOCTXTXDIR enmTxDir;
366 /** Request type dependent data. */
367 union
368 {
369 /** I/O request (read/write). */
370 struct
371 {
372 /** Number of bytes left until this context completes. */
373 volatile uint32_t cbTransferLeft;
374 /** Current offset */
375 volatile uint64_t uOffset;
376 /** Number of bytes to transfer */
377 volatile size_t cbTransfer;
378 /** Current image in the chain. */
379 PVDIMAGE pImageCur;
380 /** Start image to read from. pImageCur is reset to this
381 * value after it reached the first image in the chain. */
382 PVDIMAGE pImageStart;
383 /** S/G buffer */
384 RTSGBUF SgBuf;
385 /** Number of bytes to clear in the buffer before the current read. */
386 size_t cbBufClear;
387 /** Number of images to read. */
388 unsigned cImagesRead;
389 /** Override for the parent image to start reading from. */
390 PVDIMAGE pImageParentOverride;
391 /** Original offset of the transfer - required for filtering read requests. */
392 uint64_t uOffsetXferOrig;
393 /** Original size of the transfer - required for fitlering read requests. */
394 size_t cbXferOrig;
395 } Io;
396 /** Discard requests. */
397 struct
398 {
399 /** Pointer to the range descriptor array. */
400 PCRTRANGE paRanges;
401 /** Number of ranges in the array. */
402 unsigned cRanges;
403 /** Range descriptor index which is processed. */
404 unsigned idxRange;
405 /** Start offset to discard currently. */
406 uint64_t offCur;
407 /** How many bytes left to discard in the current range. */
408 size_t cbDiscardLeft;
409 /** How many bytes to discard in the current block (<= cbDiscardLeft). */
410 size_t cbThisDiscard;
411 /** Discard block handled currently. */
412 PVDDISCARDBLOCK pBlock;
413 } Discard;
414 } Req;
415 /** Parent I/O context if any. Sets the type of the context (root/child) */
416 PVDIOCTX pIoCtxParent;
417 /** Type dependent data (root/child) */
418 union
419 {
420 /** Root data */
421 struct
422 {
423 /** Completion callback */
424 PFNVDASYNCTRANSFERCOMPLETE pfnComplete;
425 /** User argument 1 passed on completion. */
426 void *pvUser1;
427 /** User argument 2 passed on completion. */
428 void *pvUser2;
429 } Root;
430 /** Child data */
431 struct
432 {
433 /** Saved start offset */
434 uint64_t uOffsetSaved;
435 /** Saved transfer size */
436 size_t cbTransferLeftSaved;
437 /** Number of bytes transferred from the parent if this context completes. */
438 size_t cbTransferParent;
439 /** Number of bytes to pre read */
440 size_t cbPreRead;
441 /** Number of bytes to post read. */
442 size_t cbPostRead;
443 /** Number of bytes to write left in the parent. */
444 size_t cbWriteParent;
445 /** Write type dependent data. */
446 union
447 {
448 /** Optimized */
449 struct
450 {
451 /** Bytes to fill to satisfy the block size. Not part of the virtual disk. */
452 size_t cbFill;
453 /** Bytes to copy instead of reading from the parent */
454 size_t cbWriteCopy;
455 /** Bytes to read from the image. */
456 size_t cbReadImage;
457 } Optimized;
458 } Write;
459 } Child;
460 } Type;
461} VDIOCTX;
462
463/** Default flags for an I/O context, i.e. unblocked and async. */
464#define VDIOCTX_FLAGS_DEFAULT (0)
465/** Flag whether the context is blocked. */
466#define VDIOCTX_FLAGS_BLOCKED RT_BIT_32(0)
467/** Flag whether the I/O context is using synchronous I/O. */
468#define VDIOCTX_FLAGS_SYNC RT_BIT_32(1)
469/** Flag whether the read should update the cache. */
470#define VDIOCTX_FLAGS_READ_UPDATE_CACHE RT_BIT_32(2)
471/** Flag whether free blocks should be zeroed.
472 * If false and no image has data for sepcified
473 * range VERR_VD_BLOCK_FREE is returned for the I/O context.
474 * Note that unallocated blocks are still zeroed
475 * if at least one image has valid data for a part
476 * of the range.
477 */
478#define VDIOCTX_FLAGS_ZERO_FREE_BLOCKS RT_BIT_32(3)
479/** Don't free the I/O context when complete because
480 * it was alloacted elsewhere (stack, ...). */
481#define VDIOCTX_FLAGS_DONT_FREE RT_BIT_32(4)
482/** Don't set the modified flag for this I/O context when writing. */
483#define VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG RT_BIT_32(5)
484/** The write filter was applied already and shouldn't be applied a second time.
485 * Used at the beginning of vdWriteHelperAsync() because it might be called
486 * multiple times.
487 */
488#define VDIOCTX_FLAGS_WRITE_FILTER_APPLIED RT_BIT_32(6)
489
490/** NIL I/O context pointer value. */
491#define NIL_VDIOCTX ((PVDIOCTX)0)
492
493/**
494 * List node for deferred I/O contexts.
495 */
496typedef struct VDIOCTXDEFERRED
497{
498 /** Node in the list of deferred requests.
499 * A request can be deferred if the image is growing
500 * and the request accesses the same range or if
501 * the backend needs to read or write metadata from the disk
502 * before it can continue. */
503 RTLISTNODE NodeDeferred;
504 /** I/O context this entry points to. */
505 PVDIOCTX pIoCtx;
506} VDIOCTXDEFERRED, *PVDIOCTXDEFERRED;
507
508/**
509 * I/O task.
510 */
511typedef struct VDIOTASK
512{
513 /** Next I/O task waiting in the list. */
514 struct VDIOTASK * volatile pNext;
515 /** Storage this task belongs to. */
516 PVDIOSTORAGE pIoStorage;
517 /** Optional completion callback. */
518 PFNVDXFERCOMPLETED pfnComplete;
519 /** Opaque user data. */
520 void *pvUser;
521 /** Completion status code for the task. */
522 int rcReq;
523 /** Flag whether this is a meta data transfer. */
524 bool fMeta;
525 /** Type dependent data. */
526 union
527 {
528 /** User data transfer. */
529 struct
530 {
531 /** Number of bytes this task transferred. */
532 uint32_t cbTransfer;
533 /** Pointer to the I/O context the task belongs. */
534 PVDIOCTX pIoCtx;
535 } User;
536 /** Meta data transfer. */
537 struct
538 {
539 /** Meta transfer this task is for. */
540 PVDMETAXFER pMetaXfer;
541 } Meta;
542 } Type;
543} VDIOTASK;
544
545/**
546 * Storage handle.
547 */
548typedef struct VDIOSTORAGE
549{
550 /** Image I/O state this storage handle belongs to. */
551 PVDIO pVDIo;
552 /** AVL tree for pending async metadata transfers. */
553 PAVLRFOFFTREE pTreeMetaXfers;
554 /** Storage handle */
555 void *pStorage;
556} VDIOSTORAGE;
557
558/**
559 * Metadata transfer.
560 *
561 * @note This entry can't be freed if either the list is not empty or
562 * the reference counter is not 0.
563 * The assumption is that the backends don't need to read huge amounts of
564 * metadata to complete a transfer so the additional memory overhead should
565 * be relatively small.
566 */
567typedef struct VDMETAXFER
568{
569 /** AVL core for fast search (the file offset is the key) */
570 AVLRFOFFNODECORE Core;
571 /** I/O storage for this transfer. */
572 PVDIOSTORAGE pIoStorage;
573 /** Flags. */
574 uint32_t fFlags;
575 /** List of I/O contexts waiting for this metadata transfer to complete. */
576 RTLISTNODE ListIoCtxWaiting;
577 /** Number of references to this entry. */
578 unsigned cRefs;
579 /** Size of the data stored with this entry. */
580 size_t cbMeta;
581 /** Data stored - variable size. */
582 uint8_t abData[1];
583} VDMETAXFER;
584
585/**
586 * The transfer direction for the metadata.
587 */
588#define VDMETAXFER_TXDIR_MASK 0x3
589#define VDMETAXFER_TXDIR_NONE 0x0
590#define VDMETAXFER_TXDIR_WRITE 0x1
591#define VDMETAXFER_TXDIR_READ 0x2
592#define VDMETAXFER_TXDIR_FLUSH 0x3
593#define VDMETAXFER_TXDIR_GET(flags) ((flags) & VDMETAXFER_TXDIR_MASK)
594#define VDMETAXFER_TXDIR_SET(flags, dir) ((flags) = (flags & ~VDMETAXFER_TXDIR_MASK) | (dir))
595
596/**
597 * Plugin structure.
598 */
599typedef struct VDPLUGIN
600{
601 /** Pointer to the next plugin structure. */
602 RTLISTNODE NodePlugin;
603 /** Handle of loaded plugin library. */
604 RTLDRMOD hPlugin;
605 /** Filename of the loaded plugin. */
606 char *pszFilename;
607} VDPLUGIN;
608/** Pointer to a plugin structure. */
609typedef VDPLUGIN *PVDPLUGIN;
610
611/** Head of loaded plugin list. */
612static RTLISTANCHOR g_ListPluginsLoaded;
613
614/** Number of image backends supported. */
615static unsigned g_cBackends = 0;
616/** Array of pointers to the image backends. */
617static PCVBOXHDDBACKEND *g_apBackends = NULL;
618/** Builtin image backends. */
619static PCVBOXHDDBACKEND aStaticBackends[] =
620{
621 &g_VmdkBackend,
622 &g_VDIBackend,
623 &g_VhdBackend,
624 &g_ParallelsBackend,
625 &g_DmgBackend,
626 &g_QedBackend,
627 &g_QCowBackend,
628 &g_VhdxBackend,
629 &g_RawBackend,
630 &g_ISCSIBackend
631};
632
633/** Number of supported cache backends. */
634static unsigned g_cCacheBackends = 0;
635/** Array of pointers to the cache backends. */
636static PCVDCACHEBACKEND *g_apCacheBackends = NULL;
637/** Builtin cache backends. */
638static PCVDCACHEBACKEND aStaticCacheBackends[] =
639{
640 &g_VciCacheBackend
641};
642
643/** Number of supported filter backends. */
644static unsigned g_cFilterBackends = 0;
645/** Array of pointers to the filters backends. */
646static PCVDFILTERBACKEND *g_apFilterBackends = NULL;
647
648/** Forward declaration of the async discard helper. */
649static int vdDiscardHelperAsync(PVDIOCTX pIoCtx);
650static int vdWriteHelperAsync(PVDIOCTX pIoCtx);
651static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk);
652static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc);
653static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq);
654
655/**
656 * internal: add several backends.
657 */
658static int vdAddBackends(PCVBOXHDDBACKEND *ppBackends, unsigned cBackends)
659{
660 PCVBOXHDDBACKEND *pTmp = (PCVBOXHDDBACKEND*)RTMemRealloc(g_apBackends,
661 (g_cBackends + cBackends) * sizeof(PCVBOXHDDBACKEND));
662 if (RT_UNLIKELY(!pTmp))
663 return VERR_NO_MEMORY;
664 g_apBackends = pTmp;
665 memcpy(&g_apBackends[g_cBackends], ppBackends, cBackends * sizeof(PCVBOXHDDBACKEND));
666 g_cBackends += cBackends;
667 return VINF_SUCCESS;
668}
669
670/**
671 * internal: add single backend.
672 */
673DECLINLINE(int) vdAddBackend(PCVBOXHDDBACKEND pBackend)
674{
675 return vdAddBackends(&pBackend, 1);
676}
677
678/**
679 * internal: add several cache backends.
680 */
681static int vdAddCacheBackends(PCVDCACHEBACKEND *ppBackends, unsigned cBackends)
682{
683 PCVDCACHEBACKEND *pTmp = (PCVDCACHEBACKEND*)RTMemRealloc(g_apCacheBackends,
684 (g_cCacheBackends + cBackends) * sizeof(PCVDCACHEBACKEND));
685 if (RT_UNLIKELY(!pTmp))
686 return VERR_NO_MEMORY;
687 g_apCacheBackends = pTmp;
688 memcpy(&g_apCacheBackends[g_cCacheBackends], ppBackends, cBackends * sizeof(PCVDCACHEBACKEND));
689 g_cCacheBackends += cBackends;
690 return VINF_SUCCESS;
691}
692
693/**
694 * internal: add single cache backend.
695 */
696DECLINLINE(int) vdAddCacheBackend(PCVDCACHEBACKEND pBackend)
697{
698 return vdAddCacheBackends(&pBackend, 1);
699}
700
701/**
702 * Add several filter bakends.
703 *
704 * @returns VBox status code.
705 * @param ppBackends Array of filter backends to add.
706 * @param cBackends Number of backends to add.
707 */
708static int vdAddFilterBackends(PCVDFILTERBACKEND *ppBackends, unsigned cBackends)
709{
710 PCVDFILTERBACKEND *pTmp = (PCVDFILTERBACKEND *)RTMemRealloc(g_apFilterBackends,
711 (g_cFilterBackends + cBackends) * sizeof(PCVDFILTERBACKEND));
712 if (RT_UNLIKELY(!pTmp))
713 return VERR_NO_MEMORY;
714 g_apFilterBackends = pTmp;
715 memcpy(&g_apFilterBackends[g_cFilterBackends], ppBackends, cBackends * sizeof(PCVDFILTERBACKEND));
716 g_cFilterBackends += cBackends;
717 return VINF_SUCCESS;
718}
719
720/**
721 * Add a single filter backend to the list of supported filters.
722 *
723 * @returns VBox status code.
724 * @param pBackend The backend to add.
725 */
726DECLINLINE(int) vdAddFilterBackend(PCVDFILTERBACKEND pBackend)
727{
728 return vdAddFilterBackends(&pBackend, 1);
729}
730
731/**
732 * internal: issue error message.
733 */
734static int vdError(PVBOXHDD pDisk, int rc, RT_SRC_POS_DECL,
735 const char *pszFormat, ...)
736{
737 va_list va;
738 va_start(va, pszFormat);
739 if (pDisk->pInterfaceError)
740 pDisk->pInterfaceError->pfnError(pDisk->pInterfaceError->Core.pvUser, rc, RT_SRC_POS_ARGS, pszFormat, va);
741 va_end(va);
742 return rc;
743}
744
745/**
746 * internal: thread synchronization, start read.
747 */
748DECLINLINE(int) vdThreadStartRead(PVBOXHDD pDisk)
749{
750 int rc = VINF_SUCCESS;
751 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
752 rc = pDisk->pInterfaceThreadSync->pfnStartRead(pDisk->pInterfaceThreadSync->Core.pvUser);
753 return rc;
754}
755
756/**
757 * internal: thread synchronization, finish read.
758 */
759DECLINLINE(int) vdThreadFinishRead(PVBOXHDD pDisk)
760{
761 int rc = VINF_SUCCESS;
762 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
763 rc = pDisk->pInterfaceThreadSync->pfnFinishRead(pDisk->pInterfaceThreadSync->Core.pvUser);
764 return rc;
765}
766
767/**
768 * internal: thread synchronization, start write.
769 */
770DECLINLINE(int) vdThreadStartWrite(PVBOXHDD pDisk)
771{
772 int rc = VINF_SUCCESS;
773 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
774 rc = pDisk->pInterfaceThreadSync->pfnStartWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
775 return rc;
776}
777
778/**
779 * internal: thread synchronization, finish write.
780 */
781DECLINLINE(int) vdThreadFinishWrite(PVBOXHDD pDisk)
782{
783 int rc = VINF_SUCCESS;
784 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
785 rc = pDisk->pInterfaceThreadSync->pfnFinishWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
786 return rc;
787}
788
789/**
790 * internal: find image format backend.
791 */
792static int vdFindBackend(const char *pszBackend, PCVBOXHDDBACKEND *ppBackend)
793{
794 int rc = VINF_SUCCESS;
795 PCVBOXHDDBACKEND pBackend = NULL;
796
797 if (!g_apBackends)
798 VDInit();
799
800 for (unsigned i = 0; i < g_cBackends; i++)
801 {
802 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
803 {
804 pBackend = g_apBackends[i];
805 break;
806 }
807 }
808 *ppBackend = pBackend;
809 return rc;
810}
811
812/**
813 * internal: find cache format backend.
814 */
815static int vdFindCacheBackend(const char *pszBackend, PCVDCACHEBACKEND *ppBackend)
816{
817 int rc = VINF_SUCCESS;
818 PCVDCACHEBACKEND pBackend = NULL;
819
820 if (!g_apCacheBackends)
821 VDInit();
822
823 for (unsigned i = 0; i < g_cCacheBackends; i++)
824 {
825 if (!RTStrICmp(pszBackend, g_apCacheBackends[i]->pszBackendName))
826 {
827 pBackend = g_apCacheBackends[i];
828 break;
829 }
830 }
831 *ppBackend = pBackend;
832 return rc;
833}
834
835/**
836 * internal: find filter backend.
837 */
838static int vdFindFilterBackend(const char *pszFilter, PCVDFILTERBACKEND *ppBackend)
839{
840 int rc = VINF_SUCCESS;
841 PCVDFILTERBACKEND pBackend = NULL;
842
843 for (unsigned i = 0; i < g_cFilterBackends; i++)
844 {
845 if (!RTStrICmp(pszFilter, g_apFilterBackends[i]->pszBackendName))
846 {
847 pBackend = g_apFilterBackends[i];
848 break;
849 }
850 }
851 *ppBackend = pBackend;
852 return rc;
853}
854
855
856/**
857 * internal: add image structure to the end of images list.
858 */
859static void vdAddImageToList(PVBOXHDD pDisk, PVDIMAGE pImage)
860{
861 pImage->pPrev = NULL;
862 pImage->pNext = NULL;
863
864 if (pDisk->pBase)
865 {
866 Assert(pDisk->cImages > 0);
867 pImage->pPrev = pDisk->pLast;
868 pDisk->pLast->pNext = pImage;
869 pDisk->pLast = pImage;
870 }
871 else
872 {
873 Assert(pDisk->cImages == 0);
874 pDisk->pBase = pImage;
875 pDisk->pLast = pImage;
876 }
877
878 pDisk->cImages++;
879}
880
881/**
882 * internal: remove image structure from the images list.
883 */
884static void vdRemoveImageFromList(PVBOXHDD pDisk, PVDIMAGE pImage)
885{
886 Assert(pDisk->cImages > 0);
887
888 if (pImage->pPrev)
889 pImage->pPrev->pNext = pImage->pNext;
890 else
891 pDisk->pBase = pImage->pNext;
892
893 if (pImage->pNext)
894 pImage->pNext->pPrev = pImage->pPrev;
895 else
896 pDisk->pLast = pImage->pPrev;
897
898 pImage->pPrev = NULL;
899 pImage->pNext = NULL;
900
901 pDisk->cImages--;
902}
903
904/**
905 * internal: add filter structure to the end of filter list.
906 */
907static void vdAddFilterToList(PVBOXHDD pDisk, PVDFILTER pFilter)
908{
909 pFilter->pPrev = NULL;
910 pFilter->pNext = NULL;
911
912 if (pDisk->pFilterHead)
913 {
914 pFilter->pPrev = pDisk->pFilterTail;
915 pDisk->pFilterTail->pNext = pFilter;
916 pDisk->pFilterTail = pFilter;
917 }
918 else
919 {
920 pDisk->pFilterHead = pFilter;
921 pDisk->pFilterTail = pFilter;
922 }
923}
924
925/**
926 * internal: Remove last filter structure from the filter list.
927 */
928static void vdRemoveFilterFromList(PVBOXHDD pDisk, PVDFILTER pFilter)
929{
930 Assert(pDisk->pFilterHead != NULL && pDisk->pFilterTail != NULL);
931
932 if (pFilter->pPrev)
933 pFilter->pPrev->pNext = pFilter->pNext;
934 else
935 pDisk->pFilterHead = pFilter->pNext;
936
937 if (pFilter->pNext)
938 pFilter->pNext->pPrev = pFilter->pPrev;
939 else
940 pDisk->pFilterTail = pFilter->pPrev;
941
942 pFilter->pPrev = NULL;
943 pFilter->pNext = NULL;
944}
945
946/**
947 * internal: find image by index into the images list.
948 */
949static PVDIMAGE vdGetImageByNumber(PVBOXHDD pDisk, unsigned nImage)
950{
951 PVDIMAGE pImage = pDisk->pBase;
952 if (nImage == VD_LAST_IMAGE)
953 return pDisk->pLast;
954 while (pImage && nImage)
955 {
956 pImage = pImage->pNext;
957 nImage--;
958 }
959 return pImage;
960}
961
962/**
963 * Applies the filter chain to the given write request.
964 *
965 * @returns VBox status code.
966 * @param pDisk The HDD container.
967 * @param uOffset The start offset of the write.
968 * @param cbWrite Number of bytes to write.
969 * @param pIoCtx The I/O context associated with the request.
970 */
971static int vdFilterChainApplyWrite(PVBOXHDD pDisk, uint64_t uOffset, size_t cbWrite,
972 PVDIOCTX pIoCtx)
973{
974 int rc = VINF_SUCCESS;
975
976 VD_IS_LOCKED(pDisk);
977
978 if (pDisk->pFilterHead)
979 {
980 PVDFILTER pFilterCurr = pDisk->pFilterHead;
981
982 do
983 {
984 rc = pFilterCurr->pBackend->pfnFilterWrite(pFilterCurr->pvBackendData, uOffset, cbWrite, pIoCtx);
985 /* Reset S/G buffer for the next filter. */
986 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
987
988 pFilterCurr = pFilterCurr->pNext;
989 } while ( RT_SUCCESS(rc)
990 && pFilterCurr);
991 }
992
993 return rc;
994}
995
996/**
997 * Applies the filter chain to the given read request.
998 *
999 * @returns VBox status code.
1000 * @param pDisk The HDD container.
1001 * @param uOffset The start offset of the read.
1002 * @param cbRead Number of bytes read.
1003 * @param pIoCtx The I/O context associated with the request.
1004 */
1005static int vdFilterChainApplyRead(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRead,
1006 PVDIOCTX pIoCtx)
1007{
1008 int rc = VINF_SUCCESS;
1009
1010 VD_IS_LOCKED(pDisk);
1011
1012 if (pDisk->pFilterHead)
1013 {
1014 PVDFILTER pFilterCurr = pDisk->pFilterHead;
1015
1016 /* Reset buffer before starting. */
1017 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1018
1019 do
1020 {
1021 rc = pFilterCurr->pBackend->pfnFilterRead(pFilterCurr->pvBackendData, uOffset, cbRead, pIoCtx);
1022 /* Reset S/G buffer for the next filter. */
1023 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1024
1025 pFilterCurr = pFilterCurr->pNext;
1026 } while ( RT_SUCCESS(rc)
1027 && pFilterCurr);
1028 }
1029
1030 return rc;
1031}
1032
1033DECLINLINE(void) vdIoCtxRootComplete(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1034{
1035 if ( RT_SUCCESS(pIoCtx->rcReq)
1036 && pIoCtx->enmTxDir == VDIOCTXTXDIR_READ)
1037 pIoCtx->rcReq = vdFilterChainApplyRead(pDisk, pIoCtx->Req.Io.uOffsetXferOrig,
1038 pIoCtx->Req.Io.cbXferOrig, pIoCtx);
1039
1040 pIoCtx->Type.Root.pfnComplete(pIoCtx->Type.Root.pvUser1,
1041 pIoCtx->Type.Root.pvUser2,
1042 pIoCtx->rcReq);
1043}
1044
1045/**
1046 * Initialize the structure members of a given I/O context.
1047 */
1048DECLINLINE(void) vdIoCtxInit(PVDIOCTX pIoCtx, PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1049 uint64_t uOffset, size_t cbTransfer, PVDIMAGE pImageStart,
1050 PCRTSGBUF pcSgBuf, void *pvAllocation,
1051 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
1052{
1053 pIoCtx->pDisk = pDisk;
1054 pIoCtx->enmTxDir = enmTxDir;
1055 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTransfer; Assert((uint32_t)cbTransfer == cbTransfer);
1056 pIoCtx->Req.Io.uOffset = uOffset;
1057 pIoCtx->Req.Io.cbTransfer = cbTransfer;
1058 pIoCtx->Req.Io.pImageStart = pImageStart;
1059 pIoCtx->Req.Io.pImageCur = pImageStart;
1060 pIoCtx->Req.Io.cbBufClear = 0;
1061 pIoCtx->Req.Io.pImageParentOverride = NULL;
1062 pIoCtx->Req.Io.uOffsetXferOrig = uOffset;
1063 pIoCtx->Req.Io.cbXferOrig = cbTransfer;
1064 pIoCtx->cDataTransfersPending = 0;
1065 pIoCtx->cMetaTransfersPending = 0;
1066 pIoCtx->fComplete = false;
1067 pIoCtx->fFlags = fFlags;
1068 pIoCtx->pvAllocation = pvAllocation;
1069 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1070 pIoCtx->pfnIoCtxTransferNext = NULL;
1071 pIoCtx->rcReq = VINF_SUCCESS;
1072 pIoCtx->pIoCtxParent = NULL;
1073
1074 /* There is no S/G list for a flush request. */
1075 if ( enmTxDir != VDIOCTXTXDIR_FLUSH
1076 && enmTxDir != VDIOCTXTXDIR_DISCARD)
1077 RTSgBufClone(&pIoCtx->Req.Io.SgBuf, pcSgBuf);
1078 else
1079 memset(&pIoCtx->Req.Io.SgBuf, 0, sizeof(RTSGBUF));
1080}
1081
1082/**
1083 * Internal: Tries to read the desired range from the given cache.
1084 *
1085 * @returns VBox status code.
1086 * @retval VERR_VD_BLOCK_FREE if the block is not in the cache.
1087 * pcbRead will be set to the number of bytes not in the cache.
1088 * Everything thereafter might be in the cache.
1089 * @param pCache The cache to read from.
1090 * @param uOffset Offset of the virtual disk to read.
1091 * @param cbRead How much to read.
1092 * @param pIoCtx The I/O context to read into.
1093 * @param pcbRead Where to store the number of bytes actually read.
1094 * On success this indicates the number of bytes read from the cache.
1095 * If VERR_VD_BLOCK_FREE is returned this gives the number of bytes
1096 * which are not in the cache.
1097 * In both cases everything beyond this value
1098 * might or might not be in the cache.
1099 */
1100static int vdCacheReadHelper(PVDCACHE pCache, uint64_t uOffset,
1101 size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbRead)
1102{
1103 int rc = VINF_SUCCESS;
1104
1105 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbRead=%zu pcbRead=%#p\n",
1106 pCache, uOffset, pIoCtx, cbRead, pcbRead));
1107
1108 AssertPtr(pCache);
1109 AssertPtr(pcbRead);
1110
1111 rc = pCache->Backend->pfnRead(pCache->pBackendData, uOffset, cbRead,
1112 pIoCtx, pcbRead);
1113
1114 LogFlowFunc(("returns rc=%Rrc pcbRead=%zu\n", rc, *pcbRead));
1115 return rc;
1116}
1117
1118/**
1119 * Internal: Writes data for the given block into the cache.
1120 *
1121 * @returns VBox status code.
1122 * @param pCache The cache to write to.
1123 * @param uOffset Offset of the virtual disk to write to the cache.
1124 * @param cbWrite How much to write.
1125 * @param pIoCtx The I/O context to ẃrite from.
1126 * @param pcbWritten How much data could be written, optional.
1127 */
1128static int vdCacheWriteHelper(PVDCACHE pCache, uint64_t uOffset, size_t cbWrite,
1129 PVDIOCTX pIoCtx, size_t *pcbWritten)
1130{
1131 int rc = VINF_SUCCESS;
1132
1133 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbWrite=%zu pcbWritten=%#p\n",
1134 pCache, uOffset, pIoCtx, cbWrite, pcbWritten));
1135
1136 AssertPtr(pCache);
1137 AssertPtr(pIoCtx);
1138 Assert(cbWrite > 0);
1139
1140 if (pcbWritten)
1141 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
1142 pIoCtx, pcbWritten);
1143 else
1144 {
1145 size_t cbWritten = 0;
1146
1147 do
1148 {
1149 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
1150 pIoCtx, &cbWritten);
1151 uOffset += cbWritten;
1152 cbWrite -= cbWritten;
1153 } while ( cbWrite
1154 && ( RT_SUCCESS(rc)
1155 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
1156 }
1157
1158 LogFlowFunc(("returns rc=%Rrc pcbWritten=%zu\n",
1159 rc, pcbWritten ? *pcbWritten : cbWrite));
1160 return rc;
1161}
1162
1163/**
1164 * Creates a new empty discard state.
1165 *
1166 * @returns Pointer to the new discard state or NULL if out of memory.
1167 */
1168static PVDDISCARDSTATE vdDiscardStateCreate(void)
1169{
1170 PVDDISCARDSTATE pDiscard = (PVDDISCARDSTATE)RTMemAllocZ(sizeof(VDDISCARDSTATE));
1171
1172 if (pDiscard)
1173 {
1174 RTListInit(&pDiscard->ListLru);
1175 pDiscard->pTreeBlocks = (PAVLRU64TREE)RTMemAllocZ(sizeof(AVLRU64TREE));
1176 if (!pDiscard->pTreeBlocks)
1177 {
1178 RTMemFree(pDiscard);
1179 pDiscard = NULL;
1180 }
1181 }
1182
1183 return pDiscard;
1184}
1185
1186/**
1187 * Removes the least recently used blocks from the waiting list until
1188 * the new value is reached.
1189 *
1190 * @returns VBox status code.
1191 * @param pDisk VD disk container.
1192 * @param pDiscard The discard state.
1193 * @param cbDiscardingNew How many bytes should be waiting on success.
1194 * The number of bytes waiting can be less.
1195 */
1196static int vdDiscardRemoveBlocks(PVBOXHDD pDisk, PVDDISCARDSTATE pDiscard, size_t cbDiscardingNew)
1197{
1198 int rc = VINF_SUCCESS;
1199
1200 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
1201 pDisk, pDiscard, cbDiscardingNew));
1202
1203 while (pDiscard->cbDiscarding > cbDiscardingNew)
1204 {
1205 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
1206
1207 Assert(!RTListIsEmpty(&pDiscard->ListLru));
1208
1209 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
1210 uint64_t offStart = pBlock->Core.Key;
1211 uint32_t idxStart = 0;
1212 size_t cbLeft = pBlock->cbDiscard;
1213 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
1214 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
1215
1216 while (cbLeft > 0)
1217 {
1218 int32_t idxEnd;
1219 size_t cbThis = cbLeft;
1220
1221 if (fAllocated)
1222 {
1223 /* Check for the first unallocated bit. */
1224 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
1225 if (idxEnd != -1)
1226 {
1227 cbThis = (idxEnd - idxStart) * 512;
1228 fAllocated = false;
1229 }
1230 }
1231 else
1232 {
1233 /* Mark as unused and check for the first set bit. */
1234 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
1235 if (idxEnd != -1)
1236 cbThis = (idxEnd - idxStart) * 512;
1237
1238
1239 VDIOCTX IoCtx;
1240 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_DISCARD, 0, 0, NULL,
1241 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
1242 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData,
1243 &IoCtx, offStart, cbThis, NULL,
1244 NULL, &cbThis, NULL,
1245 VD_DISCARD_MARK_UNUSED);
1246 if (RT_FAILURE(rc))
1247 break;
1248
1249 fAllocated = true;
1250 }
1251
1252 idxStart = idxEnd;
1253 offStart += cbThis;
1254 cbLeft -= cbThis;
1255 }
1256
1257 if (RT_FAILURE(rc))
1258 break;
1259
1260 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
1261 Assert(pBlockRemove == pBlock);
1262 RTListNodeRemove(&pBlock->NodeLru);
1263
1264 pDiscard->cbDiscarding -= pBlock->cbDiscard;
1265 RTMemFree(pBlock->pbmAllocated);
1266 RTMemFree(pBlock);
1267 }
1268
1269 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
1270
1271 LogFlowFunc(("returns rc=%Rrc\n", rc));
1272 return rc;
1273}
1274
1275/**
1276 * Destroys the current discard state, writing any waiting blocks to the image.
1277 *
1278 * @returns VBox status code.
1279 * @param pDisk VD disk container.
1280 */
1281static int vdDiscardStateDestroy(PVBOXHDD pDisk)
1282{
1283 int rc = VINF_SUCCESS;
1284
1285 if (pDisk->pDiscard)
1286 {
1287 rc = vdDiscardRemoveBlocks(pDisk, pDisk->pDiscard, 0 /* Remove all blocks. */);
1288 AssertRC(rc);
1289 RTMemFree(pDisk->pDiscard->pTreeBlocks);
1290 RTMemFree(pDisk->pDiscard);
1291 pDisk->pDiscard = NULL;
1292 }
1293
1294 return rc;
1295}
1296
1297/**
1298 * Marks the given range as allocated in the image.
1299 * Required if there are discards in progress and a write to a block which can get discarded
1300 * is written to.
1301 *
1302 * @returns VBox status code.
1303 * @param pDisk VD container data.
1304 * @param uOffset First byte to mark as allocated.
1305 * @param cbRange Number of bytes to mark as allocated.
1306 */
1307static int vdDiscardSetRangeAllocated(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRange)
1308{
1309 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
1310 int rc = VINF_SUCCESS;
1311
1312 if (pDiscard)
1313 {
1314 do
1315 {
1316 size_t cbThisRange = cbRange;
1317 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64RangeGet(pDiscard->pTreeBlocks, uOffset);
1318
1319 if (pBlock)
1320 {
1321 int32_t idxStart, idxEnd;
1322
1323 Assert(!(cbThisRange % 512));
1324 Assert(!((uOffset - pBlock->Core.Key) % 512));
1325
1326 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.KeyLast - uOffset + 1);
1327
1328 idxStart = (uOffset - pBlock->Core.Key) / 512;
1329 idxEnd = idxStart + (int32_t)(cbThisRange / 512);
1330 ASMBitSetRange(pBlock->pbmAllocated, idxStart, idxEnd);
1331 }
1332 else
1333 {
1334 pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, uOffset, true);
1335 if (pBlock)
1336 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.Key - uOffset);
1337 }
1338
1339 Assert(cbRange >= cbThisRange);
1340
1341 uOffset += cbThisRange;
1342 cbRange -= cbThisRange;
1343 } while (cbRange != 0);
1344 }
1345
1346 return rc;
1347}
1348
1349DECLINLINE(PVDIOCTX) vdIoCtxAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1350 uint64_t uOffset, size_t cbTransfer,
1351 PVDIMAGE pImageStart,PCRTSGBUF pcSgBuf,
1352 void *pvAllocation, PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1353 uint32_t fFlags)
1354{
1355 PVDIOCTX pIoCtx = NULL;
1356
1357 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1358 if (RT_LIKELY(pIoCtx))
1359 {
1360 vdIoCtxInit(pIoCtx, pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1361 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1362 }
1363
1364 return pIoCtx;
1365}
1366
1367DECLINLINE(PVDIOCTX) vdIoCtxRootAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1368 uint64_t uOffset, size_t cbTransfer,
1369 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1370 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1371 void *pvUser1, void *pvUser2,
1372 void *pvAllocation,
1373 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1374 uint32_t fFlags)
1375{
1376 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1377 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1378
1379 if (RT_LIKELY(pIoCtx))
1380 {
1381 pIoCtx->pIoCtxParent = NULL;
1382 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1383 pIoCtx->Type.Root.pvUser1 = pvUser1;
1384 pIoCtx->Type.Root.pvUser2 = pvUser2;
1385 }
1386
1387 LogFlow(("Allocated root I/O context %#p\n", pIoCtx));
1388 return pIoCtx;
1389}
1390
1391DECLINLINE(void) vdIoCtxDiscardInit(PVDIOCTX pIoCtx, PVBOXHDD pDisk, PCRTRANGE paRanges,
1392 unsigned cRanges, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1393 void *pvUser1, void *pvUser2, void *pvAllocation,
1394 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
1395{
1396 pIoCtx->pIoCtxNext = NULL;
1397 pIoCtx->pDisk = pDisk;
1398 pIoCtx->enmTxDir = VDIOCTXTXDIR_DISCARD;
1399 pIoCtx->cDataTransfersPending = 0;
1400 pIoCtx->cMetaTransfersPending = 0;
1401 pIoCtx->fComplete = false;
1402 pIoCtx->fFlags = fFlags;
1403 pIoCtx->pvAllocation = pvAllocation;
1404 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1405 pIoCtx->pfnIoCtxTransferNext = NULL;
1406 pIoCtx->rcReq = VINF_SUCCESS;
1407 pIoCtx->Req.Discard.paRanges = paRanges;
1408 pIoCtx->Req.Discard.cRanges = cRanges;
1409 pIoCtx->Req.Discard.idxRange = 0;
1410 pIoCtx->Req.Discard.cbDiscardLeft = 0;
1411 pIoCtx->Req.Discard.offCur = 0;
1412 pIoCtx->Req.Discard.cbThisDiscard = 0;
1413
1414 pIoCtx->pIoCtxParent = NULL;
1415 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1416 pIoCtx->Type.Root.pvUser1 = pvUser1;
1417 pIoCtx->Type.Root.pvUser2 = pvUser2;
1418}
1419
1420DECLINLINE(PVDIOCTX) vdIoCtxDiscardAlloc(PVBOXHDD pDisk, PCRTRANGE paRanges,
1421 unsigned cRanges,
1422 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1423 void *pvUser1, void *pvUser2,
1424 void *pvAllocation,
1425 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1426 uint32_t fFlags)
1427{
1428 PVDIOCTX pIoCtx = NULL;
1429
1430 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1431 if (RT_LIKELY(pIoCtx))
1432 {
1433 vdIoCtxDiscardInit(pIoCtx, pDisk, paRanges, cRanges, pfnComplete, pvUser1,
1434 pvUser2, pvAllocation, pfnIoCtxTransfer, fFlags);
1435 }
1436
1437 LogFlow(("Allocated discard I/O context %#p\n", pIoCtx));
1438 return pIoCtx;
1439}
1440
1441DECLINLINE(PVDIOCTX) vdIoCtxChildAlloc(PVBOXHDD pDisk, VDIOCTXTXDIR enmTxDir,
1442 uint64_t uOffset, size_t cbTransfer,
1443 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1444 PVDIOCTX pIoCtxParent, size_t cbTransferParent,
1445 size_t cbWriteParent, void *pvAllocation,
1446 PFNVDIOCTXTRANSFER pfnIoCtxTransfer)
1447{
1448 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1449 pcSgBuf, pvAllocation, pfnIoCtxTransfer, pIoCtxParent->fFlags & ~VDIOCTX_FLAGS_DONT_FREE);
1450
1451 AssertPtr(pIoCtxParent);
1452 Assert(!pIoCtxParent->pIoCtxParent);
1453
1454 if (RT_LIKELY(pIoCtx))
1455 {
1456 pIoCtx->pIoCtxParent = pIoCtxParent;
1457 pIoCtx->Type.Child.uOffsetSaved = uOffset;
1458 pIoCtx->Type.Child.cbTransferLeftSaved = cbTransfer;
1459 pIoCtx->Type.Child.cbTransferParent = cbTransferParent;
1460 pIoCtx->Type.Child.cbWriteParent = cbWriteParent;
1461 }
1462
1463 LogFlow(("Allocated child I/O context %#p\n", pIoCtx));
1464 return pIoCtx;
1465}
1466
1467DECLINLINE(PVDIOTASK) vdIoTaskUserAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDIOCTX pIoCtx, uint32_t cbTransfer)
1468{
1469 PVDIOTASK pIoTask = NULL;
1470
1471 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1472 if (pIoTask)
1473 {
1474 pIoTask->pIoStorage = pIoStorage;
1475 pIoTask->pfnComplete = pfnComplete;
1476 pIoTask->pvUser = pvUser;
1477 pIoTask->fMeta = false;
1478 pIoTask->Type.User.cbTransfer = cbTransfer;
1479 pIoTask->Type.User.pIoCtx = pIoCtx;
1480 }
1481
1482 return pIoTask;
1483}
1484
1485DECLINLINE(PVDIOTASK) vdIoTaskMetaAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDMETAXFER pMetaXfer)
1486{
1487 PVDIOTASK pIoTask = NULL;
1488
1489 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1490 if (pIoTask)
1491 {
1492 pIoTask->pIoStorage = pIoStorage;
1493 pIoTask->pfnComplete = pfnComplete;
1494 pIoTask->pvUser = pvUser;
1495 pIoTask->fMeta = true;
1496 pIoTask->Type.Meta.pMetaXfer = pMetaXfer;
1497 }
1498
1499 return pIoTask;
1500}
1501
1502DECLINLINE(void) vdIoCtxFree(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1503{
1504 Log(("Freeing I/O context %#p\n", pIoCtx));
1505
1506 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_FREE))
1507 {
1508 if (pIoCtx->pvAllocation)
1509 RTMemFree(pIoCtx->pvAllocation);
1510#ifdef DEBUG
1511 memset(&pIoCtx->pDisk, 0xff, sizeof(void *));
1512#endif
1513 RTMemCacheFree(pDisk->hMemCacheIoCtx, pIoCtx);
1514 }
1515}
1516
1517DECLINLINE(void) vdIoTaskFree(PVBOXHDD pDisk, PVDIOTASK pIoTask)
1518{
1519#ifdef DEBUG
1520 memset(pIoTask, 0xff, sizeof(VDIOTASK));
1521#endif
1522 RTMemCacheFree(pDisk->hMemCacheIoTask, pIoTask);
1523}
1524
1525DECLINLINE(void) vdIoCtxChildReset(PVDIOCTX pIoCtx)
1526{
1527 AssertPtr(pIoCtx->pIoCtxParent);
1528
1529 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1530 pIoCtx->Req.Io.uOffset = pIoCtx->Type.Child.uOffsetSaved;
1531 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved;
1532 Assert((uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved == pIoCtx->Type.Child.cbTransferLeftSaved);
1533}
1534
1535DECLINLINE(PVDMETAXFER) vdMetaXferAlloc(PVDIOSTORAGE pIoStorage, uint64_t uOffset, size_t cb)
1536{
1537 PVDMETAXFER pMetaXfer = (PVDMETAXFER)RTMemAlloc(RT_OFFSETOF(VDMETAXFER, abData[cb]));
1538
1539 if (RT_LIKELY(pMetaXfer))
1540 {
1541 pMetaXfer->Core.Key = uOffset;
1542 pMetaXfer->Core.KeyLast = uOffset + cb - 1;
1543 pMetaXfer->fFlags = VDMETAXFER_TXDIR_NONE;
1544 pMetaXfer->cbMeta = cb;
1545 pMetaXfer->pIoStorage = pIoStorage;
1546 pMetaXfer->cRefs = 0;
1547 RTListInit(&pMetaXfer->ListIoCtxWaiting);
1548 }
1549 return pMetaXfer;
1550}
1551
1552DECLINLINE(void) vdIoCtxAddToWaitingList(volatile PVDIOCTX *ppList, PVDIOCTX pIoCtx)
1553{
1554 /* Put it on the waiting list. */
1555 PVDIOCTX pNext = ASMAtomicUoReadPtrT(ppList, PVDIOCTX);
1556 PVDIOCTX pHeadOld;
1557 pIoCtx->pIoCtxNext = pNext;
1558 while (!ASMAtomicCmpXchgExPtr(ppList, pIoCtx, pNext, &pHeadOld))
1559 {
1560 pNext = pHeadOld;
1561 Assert(pNext != pIoCtx);
1562 pIoCtx->pIoCtxNext = pNext;
1563 ASMNopPause();
1564 }
1565}
1566
1567DECLINLINE(void) vdIoCtxDefer(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1568{
1569 LogFlowFunc(("Deferring I/O context pIoCtx=%#p\n", pIoCtx));
1570
1571 Assert(!pIoCtx->pIoCtxParent && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED));
1572 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1573 vdIoCtxAddToWaitingList(&pDisk->pIoCtxBlockedHead, pIoCtx);
1574}
1575
1576static size_t vdIoCtxCopy(PVDIOCTX pIoCtxDst, PVDIOCTX pIoCtxSrc, size_t cbData)
1577{
1578 return RTSgBufCopy(&pIoCtxDst->Req.Io.SgBuf, &pIoCtxSrc->Req.Io.SgBuf, cbData);
1579}
1580
1581static int vdIoCtxCmp(PVDIOCTX pIoCtx1, PVDIOCTX pIoCtx2, size_t cbData)
1582{
1583 return RTSgBufCmp(&pIoCtx1->Req.Io.SgBuf, &pIoCtx2->Req.Io.SgBuf, cbData);
1584}
1585
1586static size_t vdIoCtxCopyTo(PVDIOCTX pIoCtx, const uint8_t *pbData, size_t cbData)
1587{
1588 return RTSgBufCopyFromBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1589}
1590
1591static size_t vdIoCtxCopyFrom(PVDIOCTX pIoCtx, uint8_t *pbData, size_t cbData)
1592{
1593 return RTSgBufCopyToBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1594}
1595
1596static size_t vdIoCtxSet(PVDIOCTX pIoCtx, uint8_t ch, size_t cbData)
1597{
1598 return RTSgBufSet(&pIoCtx->Req.Io.SgBuf, ch, cbData);
1599}
1600
1601/**
1602 * Process the I/O context, core method which assumes that the I/O context
1603 * acquired the lock.
1604 *
1605 * @returns VBox status code.
1606 * @param pIoCtx I/O context to process.
1607 */
1608static int vdIoCtxProcessLocked(PVDIOCTX pIoCtx)
1609{
1610 int rc = VINF_SUCCESS;
1611
1612 VD_IS_LOCKED(pIoCtx->pDisk);
1613
1614 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
1615
1616 if ( !pIoCtx->cMetaTransfersPending
1617 && !pIoCtx->cDataTransfersPending
1618 && !pIoCtx->pfnIoCtxTransfer)
1619 {
1620 rc = VINF_VD_ASYNC_IO_FINISHED;
1621 goto out;
1622 }
1623
1624 /*
1625 * We complete the I/O context in case of an error
1626 * if there is no I/O task pending.
1627 */
1628 if ( RT_FAILURE(pIoCtx->rcReq)
1629 && !pIoCtx->cMetaTransfersPending
1630 && !pIoCtx->cDataTransfersPending)
1631 {
1632 rc = VINF_VD_ASYNC_IO_FINISHED;
1633 goto out;
1634 }
1635
1636 /* Don't change anything if there is a metadata transfer pending or we are blocked. */
1637 if ( pIoCtx->cMetaTransfersPending
1638 || (pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1639 {
1640 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1641 goto out;
1642 }
1643
1644 if (pIoCtx->pfnIoCtxTransfer)
1645 {
1646 /* Call the transfer function advancing to the next while there is no error. */
1647 while ( pIoCtx->pfnIoCtxTransfer
1648 && !pIoCtx->cMetaTransfersPending
1649 && RT_SUCCESS(rc))
1650 {
1651 LogFlowFunc(("calling transfer function %#p\n", pIoCtx->pfnIoCtxTransfer));
1652 rc = pIoCtx->pfnIoCtxTransfer(pIoCtx);
1653
1654 /* Advance to the next part of the transfer if the current one succeeded. */
1655 if (RT_SUCCESS(rc))
1656 {
1657 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
1658 pIoCtx->pfnIoCtxTransferNext = NULL;
1659 }
1660 }
1661 }
1662
1663 if ( RT_SUCCESS(rc)
1664 && !pIoCtx->cMetaTransfersPending
1665 && !pIoCtx->cDataTransfersPending
1666 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1667 rc = VINF_VD_ASYNC_IO_FINISHED;
1668 else if ( RT_SUCCESS(rc)
1669 || rc == VERR_VD_NOT_ENOUGH_METADATA
1670 || rc == VERR_VD_IOCTX_HALT)
1671 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1672 else if ( RT_FAILURE(rc)
1673 && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
1674 {
1675 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rc, VINF_SUCCESS);
1676
1677 /*
1678 * The I/O context completed if we have an error and there is no data
1679 * or meta data transfer pending.
1680 */
1681 if ( !pIoCtx->cMetaTransfersPending
1682 && !pIoCtx->cDataTransfersPending)
1683 rc = VINF_VD_ASYNC_IO_FINISHED;
1684 else
1685 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1686 }
1687
1688out:
1689 LogFlowFunc(("pIoCtx=%#p rc=%Rrc cDataTransfersPending=%u cMetaTransfersPending=%u fComplete=%RTbool\n",
1690 pIoCtx, rc, pIoCtx->cDataTransfersPending, pIoCtx->cMetaTransfersPending,
1691 pIoCtx->fComplete));
1692
1693 return rc;
1694}
1695
1696/**
1697 * Processes the list of waiting I/O contexts.
1698 *
1699 * @returns VBox status code, only valid if pIoCtxRc is not NULL, treat as void
1700 * function otherwise.
1701 * @param pDisk The disk structure.
1702 * @param pIoCtxRc An I/O context handle which waits on the list. When processed
1703 * The status code is returned. NULL if there is no I/O context
1704 * to return the status code for.
1705 */
1706static int vdDiskProcessWaitingIoCtx(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
1707{
1708 int rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1709
1710 LogFlowFunc(("pDisk=%#p pIoCtxRc=%#p\n", pDisk, pIoCtxRc));
1711
1712 VD_IS_LOCKED(pDisk);
1713
1714 /* Get the waiting list and process it in FIFO order. */
1715 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHead, NULL, PVDIOCTX);
1716
1717 /* Reverse it. */
1718 PVDIOCTX pCur = pIoCtxHead;
1719 pIoCtxHead = NULL;
1720 while (pCur)
1721 {
1722 PVDIOCTX pInsert = pCur;
1723 pCur = pCur->pIoCtxNext;
1724 pInsert->pIoCtxNext = pIoCtxHead;
1725 pIoCtxHead = pInsert;
1726 }
1727
1728 /* Process now. */
1729 pCur = pIoCtxHead;
1730 while (pCur)
1731 {
1732 int rcTmp;
1733 PVDIOCTX pTmp = pCur;
1734
1735 pCur = pCur->pIoCtxNext;
1736 pTmp->pIoCtxNext = NULL;
1737
1738 /*
1739 * Need to clear the sync flag here if there is a new I/O context
1740 * with it set and the context is not given in pIoCtxRc.
1741 * This happens most likely on a different thread and that one shouldn't
1742 * process the context synchronously.
1743 *
1744 * The thread who issued the context will wait on the event semaphore
1745 * anyway which is signalled when the completion handler is called.
1746 */
1747 if ( pTmp->fFlags & VDIOCTX_FLAGS_SYNC
1748 && pTmp != pIoCtxRc)
1749 pTmp->fFlags &= ~VDIOCTX_FLAGS_SYNC;
1750
1751 rcTmp = vdIoCtxProcessLocked(pTmp);
1752 if (pTmp == pIoCtxRc)
1753 {
1754 if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1755 && RT_SUCCESS(pTmp->rcReq)
1756 && pTmp->enmTxDir == VDIOCTXTXDIR_READ)
1757 {
1758 int rc2 = vdFilterChainApplyRead(pDisk, pTmp->Req.Io.uOffsetXferOrig,
1759 pTmp->Req.Io.cbXferOrig, pTmp);
1760 if (RT_FAILURE(rc2))
1761 rcTmp = rc2;
1762 }
1763
1764 /* The given I/O context was processed, pass the return code to the caller. */
1765 if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1766 && (pTmp->fFlags & VDIOCTX_FLAGS_SYNC))
1767 rc = pTmp->rcReq;
1768 else
1769 rc = rcTmp;
1770 }
1771 else if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1772 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1773 {
1774 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1775 vdThreadFinishWrite(pDisk);
1776 vdIoCtxRootComplete(pDisk, pTmp);
1777 vdIoCtxFree(pDisk, pTmp);
1778 }
1779 }
1780
1781 LogFlowFunc(("returns rc=%Rrc\n", rc));
1782 return rc;
1783}
1784
1785/**
1786 * Processes the list of blocked I/O contexts.
1787 *
1788 * @returns nothing.
1789 * @param pDisk The disk structure.
1790 */
1791static void vdDiskProcessBlockedIoCtx(PVBOXHDD pDisk)
1792{
1793 LogFlowFunc(("pDisk=%#p\n", pDisk));
1794
1795 VD_IS_LOCKED(pDisk);
1796
1797 /* Get the waiting list and process it in FIFO order. */
1798 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxBlockedHead, NULL, PVDIOCTX);
1799
1800 /* Reverse it. */
1801 PVDIOCTX pCur = pIoCtxHead;
1802 pIoCtxHead = NULL;
1803 while (pCur)
1804 {
1805 PVDIOCTX pInsert = pCur;
1806 pCur = pCur->pIoCtxNext;
1807 pInsert->pIoCtxNext = pIoCtxHead;
1808 pIoCtxHead = pInsert;
1809 }
1810
1811 /* Process now. */
1812 pCur = pIoCtxHead;
1813 while (pCur)
1814 {
1815 int rc;
1816 PVDIOCTX pTmp = pCur;
1817
1818 pCur = pCur->pIoCtxNext;
1819 pTmp->pIoCtxNext = NULL;
1820
1821 Assert(!pTmp->pIoCtxParent);
1822 Assert(pTmp->fFlags & VDIOCTX_FLAGS_BLOCKED);
1823 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
1824
1825 rc = vdIoCtxProcessLocked(pTmp);
1826 if ( rc == VINF_VD_ASYNC_IO_FINISHED
1827 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1828 {
1829 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1830 vdThreadFinishWrite(pDisk);
1831 vdIoCtxRootComplete(pDisk, pTmp);
1832 vdIoCtxFree(pDisk, pTmp);
1833 }
1834 }
1835
1836 LogFlowFunc(("returns\n"));
1837}
1838
1839/**
1840 * Processes the I/O context trying to lock the criticial section.
1841 * The context is deferred if the critical section is busy.
1842 *
1843 * @returns VBox status code.
1844 * @param pIoCtx The I/O context to process.
1845 */
1846static int vdIoCtxProcessTryLockDefer(PVDIOCTX pIoCtx)
1847{
1848 int rc = VINF_SUCCESS;
1849 PVBOXHDD pDisk = pIoCtx->pDisk;
1850
1851 Log(("Defer pIoCtx=%#p\n", pIoCtx));
1852
1853 /* Put it on the waiting list first. */
1854 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHead, pIoCtx);
1855
1856 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
1857 {
1858 /* Leave it again, the context will be processed just before leaving the lock. */
1859 LogFlowFunc(("Successfully acquired the lock\n"));
1860 rc = vdDiskUnlock(pDisk, pIoCtx);
1861 }
1862 else
1863 {
1864 LogFlowFunc(("Lock is held\n"));
1865 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1866 }
1867
1868 return rc;
1869}
1870
1871/**
1872 * Process the I/O context in a synchronous manner, waiting
1873 * for it to complete.
1874 *
1875 * @returns VBox status code of the completed request.
1876 * @param pIoCtx The sync I/O context.
1877 * @param hEventComplete Event sempahore to wait on for completion.
1878 */
1879static int vdIoCtxProcessSync(PVDIOCTX pIoCtx, RTSEMEVENT hEventComplete)
1880{
1881 int rc = VINF_SUCCESS;
1882 PVBOXHDD pDisk = pIoCtx->pDisk;
1883
1884 LogFlowFunc(("pIoCtx=%p\n", pIoCtx));
1885
1886 AssertMsg(pIoCtx->fFlags & (VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE),
1887 ("I/O context is not marked as synchronous\n"));
1888
1889 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
1890 if (rc == VINF_VD_ASYNC_IO_FINISHED)
1891 rc = VINF_SUCCESS;
1892
1893 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1894 {
1895 rc = RTSemEventWait(hEventComplete, RT_INDEFINITE_WAIT);
1896 AssertRC(rc);
1897 }
1898
1899 rc = pIoCtx->rcReq;
1900 vdIoCtxFree(pDisk, pIoCtx);
1901
1902 return rc;
1903}
1904
1905DECLINLINE(bool) vdIoCtxIsDiskLockOwner(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1906{
1907 return pDisk->pIoCtxLockOwner == pIoCtx;
1908}
1909
1910static int vdIoCtxLockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
1911{
1912 int rc = VINF_SUCCESS;
1913
1914 VD_IS_LOCKED(pDisk);
1915
1916 LogFlowFunc(("pDisk=%#p pIoCtx=%#p\n", pDisk, pIoCtx));
1917
1918 if (!ASMAtomicCmpXchgPtr(&pDisk->pIoCtxLockOwner, pIoCtx, NIL_VDIOCTX))
1919 {
1920 Assert(pDisk->pIoCtxLockOwner != pIoCtx); /* No nesting allowed. */
1921 vdIoCtxDefer(pDisk, pIoCtx);
1922 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1923 }
1924
1925 LogFlowFunc(("returns -> %Rrc\n", rc));
1926 return rc;
1927}
1928
1929static void vdIoCtxUnlockDisk(PVBOXHDD pDisk, PVDIOCTX pIoCtx, bool fProcessBlockedReqs)
1930{
1931 LogFlowFunc(("pDisk=%#p pIoCtx=%#p fProcessBlockedReqs=%RTbool\n",
1932 pDisk, pIoCtx, fProcessBlockedReqs));
1933
1934 VD_IS_LOCKED(pDisk);
1935
1936 LogFlow(("Unlocking disk lock owner is %#p\n", pDisk->pIoCtxLockOwner));
1937 Assert(pDisk->pIoCtxLockOwner == pIoCtx);
1938 ASMAtomicXchgPtrT(&pDisk->pIoCtxLockOwner, NIL_VDIOCTX, PVDIOCTX);
1939
1940 if (fProcessBlockedReqs)
1941 {
1942 /* Process any blocked writes if the current request didn't caused another growing. */
1943 vdDiskProcessBlockedIoCtx(pDisk);
1944 }
1945
1946 LogFlowFunc(("returns\n"));
1947}
1948
1949/**
1950 * Internal: Reads a given amount of data from the image chain of the disk.
1951 **/
1952static int vdDiskReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1953 uint64_t uOffset, size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbThisRead)
1954{
1955 int rc = VINF_SUCCESS;
1956 size_t cbThisRead = cbRead;
1957
1958 AssertPtr(pcbThisRead);
1959
1960 *pcbThisRead = 0;
1961
1962 /*
1963 * Try to read from the given image.
1964 * If the block is not allocated read from override chain if present.
1965 */
1966 rc = pImage->Backend->pfnRead(pImage->pBackendData,
1967 uOffset, cbThisRead, pIoCtx,
1968 &cbThisRead);
1969
1970 if (rc == VERR_VD_BLOCK_FREE)
1971 {
1972 for (PVDIMAGE pCurrImage = pImageParentOverride ? pImageParentOverride : pImage->pPrev;
1973 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
1974 pCurrImage = pCurrImage->pPrev)
1975 {
1976 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1977 uOffset, cbThisRead, pIoCtx,
1978 &cbThisRead);
1979 }
1980 }
1981
1982 if (RT_SUCCESS(rc) || rc == VERR_VD_BLOCK_FREE)
1983 *pcbThisRead = cbThisRead;
1984
1985 return rc;
1986}
1987
1988/**
1989 * internal: read the specified amount of data in whatever blocks the backend
1990 * will give us - async version.
1991 */
1992static int vdReadHelperAsync(PVDIOCTX pIoCtx)
1993{
1994 int rc;
1995 PVBOXHDD pDisk = pIoCtx->pDisk;
1996 size_t cbToRead = pIoCtx->Req.Io.cbTransfer;
1997 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
1998 PVDIMAGE pCurrImage = pIoCtx->Req.Io.pImageCur;
1999 PVDIMAGE pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
2000 unsigned cImagesRead = pIoCtx->Req.Io.cImagesRead;
2001 size_t cbThisRead;
2002
2003 /*
2004 * Check whether there is a full block write in progress which was not allocated.
2005 * Defer I/O if the range interferes but only if it does not belong to the
2006 * write doing the allocation.
2007 */
2008 if ( pDisk->pIoCtxLockOwner != NIL_VDIOCTX
2009 && uOffset >= pDisk->uOffsetStartLocked
2010 && uOffset < pDisk->uOffsetEndLocked
2011 && ( !pIoCtx->pIoCtxParent
2012 || pIoCtx->pIoCtxParent != pDisk->pIoCtxLockOwner))
2013 {
2014 Log(("Interferring read while allocating a new block => deferring read\n"));
2015 vdIoCtxDefer(pDisk, pIoCtx);
2016 return VERR_VD_ASYNC_IO_IN_PROGRESS;
2017 }
2018
2019 /* Loop until all reads started or we have a backend which needs to read metadata. */
2020 do
2021 {
2022 /* Search for image with allocated block. Do not attempt to read more
2023 * than the previous reads marked as valid. Otherwise this would return
2024 * stale data when different block sizes are used for the images. */
2025 cbThisRead = cbToRead;
2026
2027 if ( pDisk->pCache
2028 && !pImageParentOverride)
2029 {
2030 rc = vdCacheReadHelper(pDisk->pCache, uOffset, cbThisRead,
2031 pIoCtx, &cbThisRead);
2032 if (rc == VERR_VD_BLOCK_FREE)
2033 {
2034 rc = vdDiskReadHelper(pDisk, pCurrImage, NULL, uOffset, cbThisRead,
2035 pIoCtx, &cbThisRead);
2036
2037 /* If the read was successful, write the data back into the cache. */
2038 if ( RT_SUCCESS(rc)
2039 && pIoCtx->fFlags & VDIOCTX_FLAGS_READ_UPDATE_CACHE)
2040 {
2041 rc = vdCacheWriteHelper(pDisk->pCache, uOffset, cbThisRead,
2042 pIoCtx, NULL);
2043 }
2044 }
2045 }
2046 else
2047 {
2048 /*
2049 * Try to read from the given image.
2050 * If the block is not allocated read from override chain if present.
2051 */
2052 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2053 uOffset, cbThisRead, pIoCtx,
2054 &cbThisRead);
2055
2056 if ( rc == VERR_VD_BLOCK_FREE
2057 && cImagesRead != 1)
2058 {
2059 unsigned cImagesToProcess = cImagesRead;
2060
2061 pCurrImage = pImageParentOverride ? pImageParentOverride : pCurrImage->pPrev;
2062 pIoCtx->Req.Io.pImageParentOverride = NULL;
2063
2064 while (pCurrImage && rc == VERR_VD_BLOCK_FREE)
2065 {
2066 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2067 uOffset, cbThisRead,
2068 pIoCtx, &cbThisRead);
2069 if (cImagesToProcess == 1)
2070 break;
2071 else if (cImagesToProcess > 0)
2072 cImagesToProcess--;
2073
2074 if (rc == VERR_VD_BLOCK_FREE)
2075 pCurrImage = pCurrImage->pPrev;
2076 }
2077 }
2078 }
2079
2080 /* The task state will be updated on success already, don't do it here!. */
2081 if (rc == VERR_VD_BLOCK_FREE)
2082 {
2083 /* No image in the chain contains the data for the block. */
2084 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisRead); Assert(cbThisRead == (uint32_t)cbThisRead);
2085
2086 /* Fill the free space with 0 if we are told to do so
2087 * or a previous read returned valid data. */
2088 if (pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS)
2089 vdIoCtxSet(pIoCtx, '\0', cbThisRead);
2090 else
2091 pIoCtx->Req.Io.cbBufClear += cbThisRead;
2092
2093 if (pIoCtx->Req.Io.pImageCur->uOpenFlags & VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS)
2094 rc = VINF_VD_NEW_ZEROED_BLOCK;
2095 else
2096 rc = VINF_SUCCESS;
2097 }
2098 else if (rc == VERR_VD_IOCTX_HALT)
2099 {
2100 uOffset += cbThisRead;
2101 cbToRead -= cbThisRead;
2102 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2103 }
2104 else if ( RT_SUCCESS(rc)
2105 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2106 {
2107 /* First not free block, fill the space before with 0. */
2108 if ( pIoCtx->Req.Io.cbBufClear
2109 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
2110 {
2111 RTSGBUF SgBuf;
2112 RTSgBufClone(&SgBuf, &pIoCtx->Req.Io.SgBuf);
2113 RTSgBufReset(&SgBuf);
2114 RTSgBufSet(&SgBuf, 0, pIoCtx->Req.Io.cbBufClear);
2115 pIoCtx->Req.Io.cbBufClear = 0;
2116 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2117 }
2118 rc = VINF_SUCCESS;
2119 }
2120
2121 if (RT_FAILURE(rc))
2122 break;
2123
2124 cbToRead -= cbThisRead;
2125 uOffset += cbThisRead;
2126 pCurrImage = pIoCtx->Req.Io.pImageStart; /* Start with the highest image in the chain. */
2127 } while (cbToRead != 0 && RT_SUCCESS(rc));
2128
2129 if ( rc == VERR_VD_NOT_ENOUGH_METADATA
2130 || rc == VERR_VD_IOCTX_HALT)
2131 {
2132 /* Save the current state. */
2133 pIoCtx->Req.Io.uOffset = uOffset;
2134 pIoCtx->Req.Io.cbTransfer = cbToRead;
2135 pIoCtx->Req.Io.pImageCur = pCurrImage ? pCurrImage : pIoCtx->Req.Io.pImageStart;
2136 }
2137
2138 return (!(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
2139 ? VERR_VD_BLOCK_FREE
2140 : rc;
2141}
2142
2143/**
2144 * internal: parent image read wrapper for compacting.
2145 */
2146static int vdParentRead(void *pvUser, uint64_t uOffset, void *pvBuf,
2147 size_t cbRead)
2148{
2149 PVDPARENTSTATEDESC pParentState = (PVDPARENTSTATEDESC)pvUser;
2150
2151 /** @todo
2152 * Only used for compaction so far which is not possible to mix with async I/O.
2153 * Needs to be changed if we want to support online compaction of images.
2154 */
2155 bool fLocked = ASMAtomicXchgBool(&pParentState->pDisk->fLocked, true);
2156 AssertMsgReturn(!fLocked,
2157 ("Calling synchronous parent read while another thread holds the disk lock\n"),
2158 VERR_VD_INVALID_STATE);
2159
2160 /* Fake an I/O context. */
2161 RTSGSEG Segment;
2162 RTSGBUF SgBuf;
2163 VDIOCTX IoCtx;
2164
2165 Segment.pvSeg = pvBuf;
2166 Segment.cbSeg = cbRead;
2167 RTSgBufInit(&SgBuf, &Segment, 1);
2168 vdIoCtxInit(&IoCtx, pParentState->pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pParentState->pImage,
2169 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
2170 int rc = vdReadHelperAsync(&IoCtx);
2171 ASMAtomicXchgBool(&pParentState->pDisk->fLocked, false);
2172 return rc;
2173}
2174
2175/**
2176 * Extended version of vdReadHelper(), implementing certain optimizations
2177 * for image cloning.
2178 *
2179 * @returns VBox status code.
2180 * @param pDisk The disk to read from.
2181 * @param pImage The image to start reading from.
2182 * @param pImageParentOverride The parent image to read from
2183 * if the starting image returns a free block.
2184 * If NULL is passed the real parent of the image
2185 * in the chain is used.
2186 * @param uOffset Offset in the disk to start reading from.
2187 * @param pvBuf Where to store the read data.
2188 * @param cbRead How much to read.
2189 * @param fZeroFreeBlocks Flag whether free blocks should be zeroed.
2190 * If false and no image has data for sepcified
2191 * range VERR_VD_BLOCK_FREE is returned.
2192 * Note that unallocated blocks are still zeroed
2193 * if at least one image has valid data for a part
2194 * of the range.
2195 * @param fUpdateCache Flag whether to update the attached cache if
2196 * available.
2197 * @param cImagesRead Number of images in the chain to read until
2198 * the read is cut off. A value of 0 disables the cut off.
2199 */
2200static int vdReadHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
2201 uint64_t uOffset, void *pvBuf, size_t cbRead,
2202 bool fZeroFreeBlocks, bool fUpdateCache, unsigned cImagesRead)
2203{
2204 int rc = VINF_SUCCESS;
2205 uint32_t fFlags = VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2206 RTSGSEG Segment;
2207 RTSGBUF SgBuf;
2208 VDIOCTX IoCtx;
2209 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
2210
2211 rc = RTSemEventCreate(&hEventComplete);
2212 if (RT_FAILURE(rc))
2213 return rc;
2214
2215 if (fZeroFreeBlocks)
2216 fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2217 if (fUpdateCache)
2218 fFlags |= VDIOCTX_FLAGS_READ_UPDATE_CACHE;
2219
2220 Segment.pvSeg = pvBuf;
2221 Segment.cbSeg = cbRead;
2222 RTSgBufInit(&SgBuf, &Segment, 1);
2223 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pImage, &SgBuf,
2224 NULL, vdReadHelperAsync, fFlags);
2225
2226 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2227 IoCtx.Req.Io.cImagesRead = cImagesRead;
2228 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2229 IoCtx.Type.Root.pvUser1 = pDisk;
2230 IoCtx.Type.Root.pvUser2 = hEventComplete;
2231 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
2232 RTSemEventDestroy(hEventComplete);
2233 return rc;
2234}
2235
2236/**
2237 * internal: read the specified amount of data in whatever blocks the backend
2238 * will give us.
2239 */
2240static int vdReadHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
2241 void *pvBuf, size_t cbRead, bool fUpdateCache)
2242{
2243 return vdReadHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbRead,
2244 true /* fZeroFreeBlocks */, fUpdateCache, 0);
2245}
2246
2247/**
2248 * internal: mark the disk as not modified.
2249 */
2250static void vdResetModifiedFlag(PVBOXHDD pDisk)
2251{
2252 if (pDisk->uModified & VD_IMAGE_MODIFIED_FLAG)
2253 {
2254 /* generate new last-modified uuid */
2255 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2256 {
2257 RTUUID Uuid;
2258
2259 RTUuidCreate(&Uuid);
2260 pDisk->pLast->Backend->pfnSetModificationUuid(pDisk->pLast->pBackendData,
2261 &Uuid);
2262
2263 if (pDisk->pCache)
2264 pDisk->pCache->Backend->pfnSetModificationUuid(pDisk->pCache->pBackendData,
2265 &Uuid);
2266 }
2267
2268 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FLAG;
2269 }
2270}
2271
2272/**
2273 * internal: mark the disk as modified.
2274 */
2275static void vdSetModifiedFlag(PVBOXHDD pDisk)
2276{
2277 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2278 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2279 {
2280 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2281
2282 /* First modify, so create a UUID and ensure it's written to disk. */
2283 vdResetModifiedFlag(pDisk);
2284
2285 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2286 {
2287 VDIOCTX IoCtx;
2288 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, NULL,
2289 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2290 pDisk->pLast->Backend->pfnFlush(pDisk->pLast->pBackendData, &IoCtx);
2291 }
2292 }
2293}
2294
2295/**
2296 * internal: write buffer to the image, taking care of block boundaries and
2297 * write optimizations.
2298 */
2299static int vdWriteHelperEx(PVBOXHDD pDisk, PVDIMAGE pImage,
2300 PVDIMAGE pImageParentOverride, uint64_t uOffset,
2301 const void *pvBuf, size_t cbWrite,
2302 uint32_t fFlags, unsigned cImagesRead)
2303{
2304 int rc = VINF_SUCCESS;
2305 RTSGSEG Segment;
2306 RTSGBUF SgBuf;
2307 VDIOCTX IoCtx;
2308 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
2309
2310 rc = RTSemEventCreate(&hEventComplete);
2311 if (RT_FAILURE(rc))
2312 return rc;
2313
2314 fFlags |= VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2315
2316 Segment.pvSeg = (void *)pvBuf;
2317 Segment.cbSeg = cbWrite;
2318 RTSgBufInit(&SgBuf, &Segment, 1);
2319 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_WRITE, uOffset, cbWrite, pImage, &SgBuf,
2320 NULL, vdWriteHelperAsync, fFlags);
2321
2322 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2323 IoCtx.Req.Io.cImagesRead = cImagesRead;
2324 IoCtx.pIoCtxParent = NULL;
2325 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2326 IoCtx.Type.Root.pvUser1 = pDisk;
2327 IoCtx.Type.Root.pvUser2 = hEventComplete;
2328 if (RT_SUCCESS(rc))
2329 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
2330
2331 RTSemEventDestroy(hEventComplete);
2332 return rc;
2333}
2334
2335/**
2336 * internal: write buffer to the image, taking care of block boundaries and
2337 * write optimizations.
2338 */
2339static int vdWriteHelper(PVBOXHDD pDisk, PVDIMAGE pImage, uint64_t uOffset,
2340 const void *pvBuf, size_t cbWrite, uint32_t fFlags)
2341{
2342 return vdWriteHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbWrite,
2343 fFlags, 0);
2344}
2345
2346/**
2347 * Internal: Copies the content of one disk to another one applying optimizations
2348 * to speed up the copy process if possible.
2349 */
2350static int vdCopyHelper(PVBOXHDD pDiskFrom, PVDIMAGE pImageFrom, PVBOXHDD pDiskTo,
2351 uint64_t cbSize, unsigned cImagesFromRead, unsigned cImagesToRead,
2352 bool fSuppressRedundantIo, PVDINTERFACEPROGRESS pIfProgress,
2353 PVDINTERFACEPROGRESS pDstIfProgress)
2354{
2355 int rc = VINF_SUCCESS;
2356 int rc2;
2357 uint64_t uOffset = 0;
2358 uint64_t cbRemaining = cbSize;
2359 void *pvBuf = NULL;
2360 bool fLockReadFrom = false;
2361 bool fLockWriteTo = false;
2362 bool fBlockwiseCopy = fSuppressRedundantIo || (cImagesFromRead > 0);
2363 unsigned uProgressOld = 0;
2364
2365 LogFlowFunc(("pDiskFrom=%#p pImageFrom=%#p pDiskTo=%#p cbSize=%llu cImagesFromRead=%u cImagesToRead=%u fSuppressRedundantIo=%RTbool pIfProgress=%#p pDstIfProgress=%#p\n",
2366 pDiskFrom, pImageFrom, pDiskTo, cbSize, cImagesFromRead, cImagesToRead, fSuppressRedundantIo, pDstIfProgress, pDstIfProgress));
2367
2368 /* Allocate tmp buffer. */
2369 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
2370 if (!pvBuf)
2371 return rc;
2372
2373 do
2374 {
2375 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
2376
2377 /* Note that we don't attempt to synchronize cross-disk accesses.
2378 * It wouldn't be very difficult to do, just the lock order would
2379 * need to be defined somehow to prevent deadlocks. Postpone such
2380 * magic as there is no use case for this. */
2381
2382 rc2 = vdThreadStartRead(pDiskFrom);
2383 AssertRC(rc2);
2384 fLockReadFrom = true;
2385
2386 if (fBlockwiseCopy)
2387 {
2388 RTSGSEG SegmentBuf;
2389 RTSGBUF SgBuf;
2390 VDIOCTX IoCtx;
2391
2392 SegmentBuf.pvSeg = pvBuf;
2393 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
2394 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
2395 vdIoCtxInit(&IoCtx, pDiskFrom, VDIOCTXTXDIR_READ, 0, 0, NULL,
2396 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2397
2398 /* Read the source data. */
2399 rc = pImageFrom->Backend->pfnRead(pImageFrom->pBackendData,
2400 uOffset, cbThisRead, &IoCtx,
2401 &cbThisRead);
2402
2403 if ( rc == VERR_VD_BLOCK_FREE
2404 && cImagesFromRead != 1)
2405 {
2406 unsigned cImagesToProcess = cImagesFromRead;
2407
2408 for (PVDIMAGE pCurrImage = pImageFrom->pPrev;
2409 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
2410 pCurrImage = pCurrImage->pPrev)
2411 {
2412 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2413 uOffset, cbThisRead,
2414 &IoCtx, &cbThisRead);
2415 if (cImagesToProcess == 1)
2416 break;
2417 else if (cImagesToProcess > 0)
2418 cImagesToProcess--;
2419 }
2420 }
2421 }
2422 else
2423 rc = vdReadHelper(pDiskFrom, pImageFrom, uOffset, pvBuf, cbThisRead,
2424 false /* fUpdateCache */);
2425
2426 if (RT_FAILURE(rc) && rc != VERR_VD_BLOCK_FREE)
2427 break;
2428
2429 rc2 = vdThreadFinishRead(pDiskFrom);
2430 AssertRC(rc2);
2431 fLockReadFrom = false;
2432
2433 if (rc != VERR_VD_BLOCK_FREE)
2434 {
2435 rc2 = vdThreadStartWrite(pDiskTo);
2436 AssertRC(rc2);
2437 fLockWriteTo = true;
2438
2439 /* Only do collapsed I/O if we are copying the data blockwise. */
2440 rc = vdWriteHelperEx(pDiskTo, pDiskTo->pLast, NULL, uOffset, pvBuf,
2441 cbThisRead, VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG /* fFlags */,
2442 fBlockwiseCopy ? cImagesToRead : 0);
2443 if (RT_FAILURE(rc))
2444 break;
2445
2446 rc2 = vdThreadFinishWrite(pDiskTo);
2447 AssertRC(rc2);
2448 fLockWriteTo = false;
2449 }
2450 else /* Don't propagate the error to the outside */
2451 rc = VINF_SUCCESS;
2452
2453 uOffset += cbThisRead;
2454 cbRemaining -= cbThisRead;
2455
2456 unsigned uProgressNew = uOffset * 99 / cbSize;
2457 if (uProgressNew != uProgressOld)
2458 {
2459 uProgressOld = uProgressNew;
2460
2461 if (pIfProgress && pIfProgress->pfnProgress)
2462 {
2463 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
2464 uProgressOld);
2465 if (RT_FAILURE(rc))
2466 break;
2467 }
2468 if (pDstIfProgress && pDstIfProgress->pfnProgress)
2469 {
2470 rc = pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser,
2471 uProgressOld);
2472 if (RT_FAILURE(rc))
2473 break;
2474 }
2475 }
2476 } while (uOffset < cbSize);
2477
2478 RTMemFree(pvBuf);
2479
2480 if (fLockReadFrom)
2481 {
2482 rc2 = vdThreadFinishRead(pDiskFrom);
2483 AssertRC(rc2);
2484 }
2485
2486 if (fLockWriteTo)
2487 {
2488 rc2 = vdThreadFinishWrite(pDiskTo);
2489 AssertRC(rc2);
2490 }
2491
2492 LogFlowFunc(("returns rc=%Rrc\n", rc));
2493 return rc;
2494}
2495
2496/**
2497 * Flush helper async version.
2498 */
2499static int vdSetModifiedHelperAsync(PVDIOCTX pIoCtx)
2500{
2501 int rc = VINF_SUCCESS;
2502 PVBOXHDD pDisk = pIoCtx->pDisk;
2503 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2504
2505 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2506 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2507 rc = VINF_SUCCESS;
2508
2509 return rc;
2510}
2511
2512/**
2513 * internal: mark the disk as modified - async version.
2514 */
2515static int vdSetModifiedFlagAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx)
2516{
2517 int rc = VINF_SUCCESS;
2518
2519 VD_IS_LOCKED(pDisk);
2520
2521 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2522 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2523 {
2524 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2525 if (RT_SUCCESS(rc))
2526 {
2527 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2528
2529 /* First modify, so create a UUID and ensure it's written to disk. */
2530 vdResetModifiedFlag(pDisk);
2531
2532 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2533 {
2534 PVDIOCTX pIoCtxFlush = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_FLUSH,
2535 0, 0, pDisk->pLast,
2536 NULL, pIoCtx, 0, 0, NULL,
2537 vdSetModifiedHelperAsync);
2538
2539 if (pIoCtxFlush)
2540 {
2541 rc = vdIoCtxProcessLocked(pIoCtxFlush);
2542 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2543 {
2544 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs */);
2545 vdIoCtxFree(pDisk, pIoCtxFlush);
2546 }
2547 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2548 {
2549 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2550 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2551 }
2552 else /* Another error */
2553 vdIoCtxFree(pDisk, pIoCtxFlush);
2554 }
2555 else
2556 rc = VERR_NO_MEMORY;
2557 }
2558 }
2559 }
2560
2561 return rc;
2562}
2563
2564static int vdWriteHelperCommitAsync(PVDIOCTX pIoCtx)
2565{
2566 int rc = VINF_SUCCESS;
2567 PVDIMAGE pImage = pIoCtx->Req.Io.pImageStart;
2568 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2569 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2570 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2571
2572 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2573 rc = pImage->Backend->pfnWrite(pImage->pBackendData,
2574 pIoCtx->Req.Io.uOffset - cbPreRead,
2575 cbPreRead + cbThisWrite + cbPostRead,
2576 pIoCtx, NULL, &cbPreRead, &cbPostRead, 0);
2577 Assert(rc != VERR_VD_BLOCK_FREE);
2578 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPreRead == 0);
2579 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPostRead == 0);
2580 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2581 rc = VINF_SUCCESS;
2582 else if (rc == VERR_VD_IOCTX_HALT)
2583 {
2584 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2585 rc = VINF_SUCCESS;
2586 }
2587
2588 LogFlowFunc(("returns rc=%Rrc\n", rc));
2589 return rc;
2590}
2591
2592static int vdWriteHelperOptimizedCmpAndWriteAsync(PVDIOCTX pIoCtx)
2593{
2594 int rc = VINF_SUCCESS;
2595 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2596 size_t cbThisWrite = 0;
2597 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2598 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2599 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2600 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2601 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2602 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2603
2604 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2605
2606 AssertPtr(pIoCtxParent);
2607 Assert(!pIoCtxParent->pIoCtxParent);
2608 Assert(!pIoCtx->Req.Io.cbTransferLeft && !pIoCtx->cMetaTransfersPending);
2609
2610 vdIoCtxChildReset(pIoCtx);
2611 cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2612 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2613
2614 /* Check if the write would modify anything in this block. */
2615 if (!RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &pIoCtxParent->Req.Io.SgBuf, cbThisWrite))
2616 {
2617 RTSGBUF SgBufSrcTmp;
2618
2619 RTSgBufClone(&SgBufSrcTmp, &pIoCtxParent->Req.Io.SgBuf);
2620 RTSgBufAdvance(&SgBufSrcTmp, cbThisWrite);
2621 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbThisWrite);
2622
2623 if (!cbWriteCopy || !RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &SgBufSrcTmp, cbWriteCopy))
2624 {
2625 /* Block is completely unchanged, so no need to write anything. */
2626 LogFlowFunc(("Block didn't changed\n"));
2627 ASMAtomicWriteU32(&pIoCtx->Req.Io.cbTransferLeft, 0);
2628 RTSgBufAdvance(&pIoCtxParent->Req.Io.SgBuf, cbThisWrite);
2629 return VINF_VD_ASYNC_IO_FINISHED;
2630 }
2631 }
2632
2633 /* Copy the data to the right place in the buffer. */
2634 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2635 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2636 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2637
2638 /* Handle the data that goes after the write to fill the block. */
2639 if (cbPostRead)
2640 {
2641 /* Now assemble the remaining data. */
2642 if (cbWriteCopy)
2643 {
2644 /*
2645 * The S/G buffer of the parent needs to be cloned because
2646 * it is not allowed to modify the state.
2647 */
2648 RTSGBUF SgBufParentTmp;
2649
2650 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2651 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2652 }
2653
2654 /* Zero out the remainder of this block. Will never be visible, as this
2655 * is beyond the limit of the image. */
2656 if (cbFill)
2657 {
2658 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbReadImage);
2659 vdIoCtxSet(pIoCtx, '\0', cbFill);
2660 }
2661 }
2662
2663 /* Write the full block to the virtual disk. */
2664 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2665 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2666
2667 return rc;
2668}
2669
2670static int vdWriteHelperOptimizedPreReadAsync(PVDIOCTX pIoCtx)
2671{
2672 int rc = VINF_SUCCESS;
2673
2674 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2675
2676 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2677
2678 if ( pIoCtx->Req.Io.cbTransferLeft
2679 && !pIoCtx->cDataTransfersPending)
2680 rc = vdReadHelperAsync(pIoCtx);
2681
2682 if ( ( RT_SUCCESS(rc)
2683 || (rc == VERR_VD_ASYNC_IO_IN_PROGRESS))
2684 && ( pIoCtx->Req.Io.cbTransferLeft
2685 || pIoCtx->cMetaTransfersPending))
2686 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2687 else
2688 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedCmpAndWriteAsync;
2689
2690 return rc;
2691}
2692
2693/**
2694 * internal: write a complete block (only used for diff images), taking the
2695 * remaining data from parent images. This implementation optimizes out writes
2696 * that do not change the data relative to the state as of the parent images.
2697 * All backends which support differential/growing images support this - async version.
2698 */
2699static int vdWriteHelperOptimizedAsync(PVDIOCTX pIoCtx)
2700{
2701 PVBOXHDD pDisk = pIoCtx->pDisk;
2702 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2703 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2704 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2705 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2706 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2707 size_t cbFill = 0;
2708 size_t cbWriteCopy = 0;
2709 size_t cbReadImage = 0;
2710
2711 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2712
2713 AssertPtr(pIoCtx->pIoCtxParent);
2714 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2715
2716 if (cbPostRead)
2717 {
2718 /* Figure out how much we cannot read from the image, because
2719 * the last block to write might exceed the nominal size of the
2720 * image for technical reasons. */
2721 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2722 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2723
2724 /* If we have data to be written, use that instead of reading
2725 * data from the image. */
2726 if (cbWrite > cbThisWrite)
2727 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2728
2729 /* The rest must be read from the image. */
2730 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2731 }
2732
2733 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2734 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2735 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2736
2737 /* Read the entire data of the block so that we can compare whether it will
2738 * be modified by the write or not. */
2739 size_t cbTmp = cbPreRead + cbThisWrite + cbPostRead - cbFill; Assert(cbTmp == (uint32_t)cbTmp);
2740 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTmp;
2741 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2742 pIoCtx->Req.Io.uOffset -= cbPreRead;
2743
2744 /* Next step */
2745 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedPreReadAsync;
2746 return VINF_SUCCESS;
2747}
2748
2749static int vdWriteHelperStandardReadImageAsync(PVDIOCTX pIoCtx)
2750{
2751 int rc = VINF_SUCCESS;
2752
2753 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2754
2755 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2756
2757 if ( pIoCtx->Req.Io.cbTransferLeft
2758 && !pIoCtx->cDataTransfersPending)
2759 rc = vdReadHelperAsync(pIoCtx);
2760
2761 if ( RT_SUCCESS(rc)
2762 && ( pIoCtx->Req.Io.cbTransferLeft
2763 || pIoCtx->cMetaTransfersPending))
2764 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2765 else
2766 {
2767 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2768
2769 /* Zero out the remainder of this block. Will never be visible, as this
2770 * is beyond the limit of the image. */
2771 if (cbFill)
2772 vdIoCtxSet(pIoCtx, '\0', cbFill);
2773
2774 /* Write the full block to the virtual disk. */
2775 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2776
2777 vdIoCtxChildReset(pIoCtx);
2778 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2779 }
2780
2781 return rc;
2782}
2783
2784static int vdWriteHelperStandardAssemble(PVDIOCTX pIoCtx)
2785{
2786 int rc = VINF_SUCCESS;
2787 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2788 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2789 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2790
2791 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2792
2793 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2794 if (cbPostRead)
2795 {
2796 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2797 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2798 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2799
2800 /* Now assemble the remaining data. */
2801 if (cbWriteCopy)
2802 {
2803 /*
2804 * The S/G buffer of the parent needs to be cloned because
2805 * it is not allowed to modify the state.
2806 */
2807 RTSGBUF SgBufParentTmp;
2808
2809 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2810 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2811 }
2812
2813 if (cbReadImage)
2814 {
2815 /* Read remaining data. */
2816 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardReadImageAsync;
2817
2818 /* Read the data that goes before the write to fill the block. */
2819 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbReadImage; Assert(cbReadImage == (uint32_t)cbReadImage);
2820 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2821 pIoCtx->Req.Io.uOffset += cbWriteCopy;
2822 }
2823 else
2824 {
2825 /* Zero out the remainder of this block. Will never be visible, as this
2826 * is beyond the limit of the image. */
2827 if (cbFill)
2828 vdIoCtxSet(pIoCtx, '\0', cbFill);
2829
2830 /* Write the full block to the virtual disk. */
2831 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2832 vdIoCtxChildReset(pIoCtx);
2833 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2834 }
2835 }
2836 else
2837 {
2838 /* Write the full block to the virtual disk. */
2839 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2840 vdIoCtxChildReset(pIoCtx);
2841 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2842 }
2843
2844 return rc;
2845}
2846
2847static int vdWriteHelperStandardPreReadAsync(PVDIOCTX pIoCtx)
2848{
2849 int rc = VINF_SUCCESS;
2850
2851 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2852
2853 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2854
2855 if ( pIoCtx->Req.Io.cbTransferLeft
2856 && !pIoCtx->cDataTransfersPending)
2857 rc = vdReadHelperAsync(pIoCtx);
2858
2859 if ( RT_SUCCESS(rc)
2860 && ( pIoCtx->Req.Io.cbTransferLeft
2861 || pIoCtx->cMetaTransfersPending))
2862 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2863 else
2864 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2865
2866 return rc;
2867}
2868
2869static int vdWriteHelperStandardAsync(PVDIOCTX pIoCtx)
2870{
2871 PVBOXHDD pDisk = pIoCtx->pDisk;
2872 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2873 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2874 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2875 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2876 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2877 size_t cbFill = 0;
2878 size_t cbWriteCopy = 0;
2879 size_t cbReadImage = 0;
2880
2881 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2882
2883 AssertPtr(pIoCtx->pIoCtxParent);
2884 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2885
2886 /* Calculate the amount of data to read that goes after the write to fill the block. */
2887 if (cbPostRead)
2888 {
2889 /* If we have data to be written, use that instead of reading
2890 * data from the image. */
2891 if (cbWrite > cbThisWrite)
2892 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2893 else
2894 cbWriteCopy = 0;
2895
2896 /* Figure out how much we cannot read from the image, because
2897 * the last block to write might exceed the nominal size of the
2898 * image for technical reasons. */
2899 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2900 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2901
2902 /* The rest must be read from the image. */
2903 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2904 }
2905
2906 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2907 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2908 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2909
2910 /* Next step */
2911 if (cbPreRead)
2912 {
2913 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardPreReadAsync;
2914
2915 /* Read the data that goes before the write to fill the block. */
2916 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbPreRead; Assert(cbPreRead == (uint32_t)cbPreRead);
2917 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2918 pIoCtx->Req.Io.uOffset -= cbPreRead;
2919 }
2920 else
2921 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2922
2923 return VINF_SUCCESS;
2924}
2925
2926/**
2927 * internal: write buffer to the image, taking care of block boundaries and
2928 * write optimizations - async version.
2929 */
2930static int vdWriteHelperAsync(PVDIOCTX pIoCtx)
2931{
2932 int rc;
2933 size_t cbWrite = pIoCtx->Req.Io.cbTransfer;
2934 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
2935 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2936 PVBOXHDD pDisk = pIoCtx->pDisk;
2937 unsigned fWrite;
2938 size_t cbThisWrite;
2939 size_t cbPreRead, cbPostRead;
2940
2941 /* Apply write filter chain here if it was not done already. */
2942 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_WRITE_FILTER_APPLIED))
2943 {
2944 rc = vdFilterChainApplyWrite(pDisk, uOffset, cbWrite, pIoCtx);
2945 if (RT_FAILURE(rc))
2946 return rc;
2947 pIoCtx->fFlags |= VDIOCTX_FLAGS_WRITE_FILTER_APPLIED;
2948 }
2949
2950 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG))
2951 {
2952 rc = vdSetModifiedFlagAsync(pDisk, pIoCtx);
2953 if (RT_FAILURE(rc)) /* Includes I/O in progress. */
2954 return rc;
2955 }
2956
2957 rc = vdDiscardSetRangeAllocated(pDisk, uOffset, cbWrite);
2958 if (RT_FAILURE(rc))
2959 return rc;
2960
2961 /* Loop until all written. */
2962 do
2963 {
2964 /* Try to write the possibly partial block to the last opened image.
2965 * This works when the block is already allocated in this image or
2966 * if it is a full-block write (and allocation isn't suppressed below).
2967 * For image formats which don't support zero blocks, it's beneficial
2968 * to avoid unnecessarily allocating unchanged blocks. This prevents
2969 * unwanted expanding of images. VMDK is an example. */
2970 cbThisWrite = cbWrite;
2971
2972 /*
2973 * Check whether there is a full block write in progress which was not allocated.
2974 * Defer I/O if the range interferes.
2975 */
2976 if ( pDisk->pIoCtxLockOwner != NIL_VDIOCTX
2977 && uOffset >= pDisk->uOffsetStartLocked
2978 && uOffset < pDisk->uOffsetEndLocked)
2979 {
2980 Log(("Interferring write while allocating a new block => deferring write\n"));
2981 vdIoCtxDefer(pDisk, pIoCtx);
2982 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2983 break;
2984 }
2985
2986 fWrite = (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2987 ? 0 : VD_WRITE_NO_ALLOC;
2988 rc = pImage->Backend->pfnWrite(pImage->pBackendData, uOffset, cbThisWrite,
2989 pIoCtx, &cbThisWrite, &cbPreRead, &cbPostRead,
2990 fWrite);
2991 if (rc == VERR_VD_BLOCK_FREE)
2992 {
2993 /* Lock the disk .*/
2994 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2995 if (RT_SUCCESS(rc))
2996 {
2997 /*
2998 * Allocate segment and buffer in one go.
2999 * A bit hackish but avoids the need to allocate memory twice.
3000 */
3001 PRTSGBUF pTmp = (PRTSGBUF)RTMemAlloc(cbPreRead + cbThisWrite + cbPostRead + sizeof(RTSGSEG) + sizeof(RTSGBUF));
3002 AssertBreakStmt(VALID_PTR(pTmp), rc = VERR_NO_MEMORY);
3003 PRTSGSEG pSeg = (PRTSGSEG)(pTmp + 1);
3004
3005 pSeg->pvSeg = pSeg + 1;
3006 pSeg->cbSeg = cbPreRead + cbThisWrite + cbPostRead;
3007 RTSgBufInit(pTmp, pSeg, 1);
3008
3009 PVDIOCTX pIoCtxWrite = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_WRITE,
3010 uOffset, pSeg->cbSeg, pImage,
3011 pTmp,
3012 pIoCtx, cbThisWrite,
3013 cbWrite,
3014 pTmp,
3015 (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
3016 ? vdWriteHelperStandardAsync
3017 : vdWriteHelperOptimizedAsync);
3018 if (!VALID_PTR(pIoCtxWrite))
3019 {
3020 RTMemTmpFree(pTmp);
3021 rc = VERR_NO_MEMORY;
3022 break;
3023 }
3024
3025 LogFlowFunc(("Disk is growing because of pIoCtx=%#p pIoCtxWrite=%#p\n",
3026 pIoCtx, pIoCtxWrite));
3027
3028 /* Save the current range for the growing operation to check for intersecting requests later. */
3029 pDisk->uOffsetStartLocked = uOffset - cbPreRead;
3030 pDisk->uOffsetEndLocked = uOffset + cbThisWrite + cbPostRead;
3031
3032 pIoCtxWrite->Type.Child.cbPreRead = cbPreRead;
3033 pIoCtxWrite->Type.Child.cbPostRead = cbPostRead;
3034 pIoCtxWrite->Req.Io.pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
3035
3036 /* Process the write request */
3037 rc = vdIoCtxProcessLocked(pIoCtxWrite);
3038
3039 if (RT_FAILURE(rc) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
3040 {
3041 vdIoCtxFree(pDisk, pIoCtxWrite);
3042 break;
3043 }
3044 else if ( rc == VINF_VD_ASYNC_IO_FINISHED
3045 && ASMAtomicCmpXchgBool(&pIoCtxWrite->fComplete, true, false))
3046 {
3047 LogFlow(("Child write request completed\n"));
3048 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbThisWrite);
3049 Assert(cbThisWrite == (uint32_t)cbThisWrite);
3050 rc = pIoCtxWrite->rcReq;
3051 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisWrite);
3052 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs*/ );
3053 vdIoCtxFree(pDisk, pIoCtxWrite);
3054 }
3055 else
3056 {
3057 LogFlow(("Child write pending\n"));
3058 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
3059 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
3060 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3061 cbWrite -= cbThisWrite;
3062 uOffset += cbThisWrite;
3063 break;
3064 }
3065 }
3066 else
3067 {
3068 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3069 break;
3070 }
3071 }
3072
3073 if (rc == VERR_VD_IOCTX_HALT)
3074 {
3075 cbWrite -= cbThisWrite;
3076 uOffset += cbThisWrite;
3077 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
3078 break;
3079 }
3080 else if (rc == VERR_VD_NOT_ENOUGH_METADATA)
3081 break;
3082
3083 cbWrite -= cbThisWrite;
3084 uOffset += cbThisWrite;
3085 } while (cbWrite != 0 && (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
3086
3087 if ( rc == VERR_VD_ASYNC_IO_IN_PROGRESS
3088 || rc == VERR_VD_NOT_ENOUGH_METADATA
3089 || rc == VERR_VD_IOCTX_HALT)
3090 {
3091 /*
3092 * Tell the caller that we don't need to go back here because all
3093 * writes are initiated.
3094 */
3095 if ( !cbWrite
3096 && rc != VERR_VD_IOCTX_HALT)
3097 rc = VINF_SUCCESS;
3098
3099 pIoCtx->Req.Io.uOffset = uOffset;
3100 pIoCtx->Req.Io.cbTransfer = cbWrite;
3101 }
3102
3103 return rc;
3104}
3105
3106/**
3107 * Flush helper async version.
3108 */
3109static int vdFlushHelperAsync(PVDIOCTX pIoCtx)
3110{
3111 int rc = VINF_SUCCESS;
3112 PVBOXHDD pDisk = pIoCtx->pDisk;
3113 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
3114
3115 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3116 if (RT_SUCCESS(rc))
3117 {
3118 /* Mark the whole disk as locked. */
3119 pDisk->uOffsetStartLocked = 0;
3120 pDisk->uOffsetEndLocked = UINT64_C(0xffffffffffffffff);
3121
3122 vdResetModifiedFlag(pDisk);
3123 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
3124 if ( ( RT_SUCCESS(rc)
3125 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS
3126 || rc == VERR_VD_IOCTX_HALT)
3127 && pDisk->pCache)
3128 {
3129 rc = pDisk->pCache->Backend->pfnFlush(pDisk->pCache->pBackendData, pIoCtx);
3130 if ( RT_SUCCESS(rc)
3131 || ( rc != VERR_VD_ASYNC_IO_IN_PROGRESS
3132 && rc != VERR_VD_IOCTX_HALT))
3133 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
3134 else if (rc != VERR_VD_IOCTX_HALT)
3135 rc = VINF_SUCCESS;
3136 }
3137 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3138 rc = VINF_SUCCESS;
3139 else if (rc != VERR_VD_IOCTX_HALT)/* Some other error. */
3140 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
3141 }
3142
3143 return rc;
3144}
3145
3146/**
3147 * Async discard helper - discards a whole block which is recorded in the block
3148 * tree.
3149 *
3150 * @returns VBox status code.
3151 * @param pIoCtx The I/O context to operate on.
3152 */
3153static int vdDiscardWholeBlockAsync(PVDIOCTX pIoCtx)
3154{
3155 int rc = VINF_SUCCESS;
3156 PVBOXHDD pDisk = pIoCtx->pDisk;
3157 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3158 PVDDISCARDBLOCK pBlock = pIoCtx->Req.Discard.pBlock;
3159 size_t cbPreAllocated, cbPostAllocated, cbActuallyDiscarded;
3160
3161 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3162
3163 AssertPtr(pBlock);
3164
3165 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3166 pBlock->Core.Key, pBlock->cbDiscard,
3167 &cbPreAllocated, &cbPostAllocated,
3168 &cbActuallyDiscarded, NULL, 0);
3169 Assert(rc != VERR_VD_DISCARD_ALIGNMENT_NOT_MET);
3170 Assert(!cbPreAllocated);
3171 Assert(!cbPostAllocated);
3172 Assert(cbActuallyDiscarded == pBlock->cbDiscard || RT_FAILURE(rc));
3173
3174 /* Remove the block on success. */
3175 if ( RT_SUCCESS(rc)
3176 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3177 {
3178 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
3179 Assert(pBlockRemove == pBlock);
3180
3181 pDiscard->cbDiscarding -= pBlock->cbDiscard;
3182 RTListNodeRemove(&pBlock->NodeLru);
3183 RTMemFree(pBlock->pbmAllocated);
3184 RTMemFree(pBlock);
3185 pIoCtx->Req.Discard.pBlock = NULL;/* Safety precaution. */
3186 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
3187 rc = VINF_SUCCESS;
3188 }
3189
3190 LogFlowFunc(("returns rc=%Rrc\n", rc));
3191 return rc;
3192}
3193
3194/**
3195 * Removes the least recently used blocks from the waiting list until
3196 * the new value is reached - version for async I/O.
3197 *
3198 * @returns VBox status code.
3199 * @param pDisk VD disk container.
3200 * @param pDiscard The discard state.
3201 * @param cbDiscardingNew How many bytes should be waiting on success.
3202 * The number of bytes waiting can be less.
3203 */
3204static int vdDiscardRemoveBlocksAsync(PVBOXHDD pDisk, PVDIOCTX pIoCtx, size_t cbDiscardingNew)
3205{
3206 int rc = VINF_SUCCESS;
3207 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3208
3209 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
3210 pDisk, pDiscard, cbDiscardingNew));
3211
3212 while (pDiscard->cbDiscarding > cbDiscardingNew)
3213 {
3214 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
3215
3216 Assert(!RTListIsEmpty(&pDiscard->ListLru));
3217
3218 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
3219 uint64_t offStart = pBlock->Core.Key;
3220 uint32_t idxStart = 0;
3221 size_t cbLeft = pBlock->cbDiscard;
3222 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
3223 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
3224
3225 while (cbLeft > 0)
3226 {
3227 int32_t idxEnd;
3228 size_t cbThis = cbLeft;
3229
3230 if (fAllocated)
3231 {
3232 /* Check for the first unallocated bit. */
3233 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
3234 if (idxEnd != -1)
3235 {
3236 cbThis = (idxEnd - idxStart) * 512;
3237 fAllocated = false;
3238 }
3239 }
3240 else
3241 {
3242 /* Mark as unused and check for the first set bit. */
3243 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
3244 if (idxEnd != -1)
3245 cbThis = (idxEnd - idxStart) * 512;
3246
3247 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3248 offStart, cbThis, NULL, NULL, &cbThis,
3249 NULL, VD_DISCARD_MARK_UNUSED);
3250 if ( RT_FAILURE(rc)
3251 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
3252 break;
3253
3254 fAllocated = true;
3255 }
3256
3257 idxStart = idxEnd;
3258 offStart += cbThis;
3259 cbLeft -= cbThis;
3260 }
3261
3262 if ( RT_FAILURE(rc)
3263 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
3264 break;
3265
3266 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
3267 Assert(pBlockRemove == pBlock);
3268 RTListNodeRemove(&pBlock->NodeLru);
3269
3270 pDiscard->cbDiscarding -= pBlock->cbDiscard;
3271 RTMemFree(pBlock->pbmAllocated);
3272 RTMemFree(pBlock);
3273 }
3274
3275 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3276 rc = VINF_SUCCESS;
3277
3278 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
3279
3280 LogFlowFunc(("returns rc=%Rrc\n", rc));
3281 return rc;
3282}
3283
3284/**
3285 * Async discard helper - discards the current range if there is no matching
3286 * block in the tree.
3287 *
3288 * @returns VBox status code.
3289 * @param pIoCtx The I/O context to operate on.
3290 */
3291static int vdDiscardCurrentRangeAsync(PVDIOCTX pIoCtx)
3292{
3293 PVBOXHDD pDisk = pIoCtx->pDisk;
3294 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3295 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3296 size_t cbThisDiscard = pIoCtx->Req.Discard.cbThisDiscard;
3297 void *pbmAllocated = NULL;
3298 size_t cbPreAllocated, cbPostAllocated;
3299 int rc = VINF_SUCCESS;
3300
3301 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3302
3303 /* No block found, try to discard using the backend first. */
3304 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
3305 offStart, cbThisDiscard, &cbPreAllocated,
3306 &cbPostAllocated, &cbThisDiscard,
3307 &pbmAllocated, 0);
3308 if (rc == VERR_VD_DISCARD_ALIGNMENT_NOT_MET)
3309 {
3310 /* Create new discard block. */
3311 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTMemAllocZ(sizeof(VDDISCARDBLOCK));
3312 if (pBlock)
3313 {
3314 pBlock->Core.Key = offStart - cbPreAllocated;
3315 pBlock->Core.KeyLast = offStart + cbThisDiscard + cbPostAllocated - 1;
3316 pBlock->cbDiscard = cbPreAllocated + cbThisDiscard + cbPostAllocated;
3317 pBlock->pbmAllocated = pbmAllocated;
3318 bool fInserted = RTAvlrU64Insert(pDiscard->pTreeBlocks, &pBlock->Core);
3319 Assert(fInserted);
3320
3321 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3322 pDiscard->cbDiscarding += pBlock->cbDiscard;
3323
3324 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3325 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3326 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3327 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3328
3329 if (pDiscard->cbDiscarding > VD_DISCARD_REMOVE_THRESHOLD)
3330 rc = vdDiscardRemoveBlocksAsync(pDisk, pIoCtx, VD_DISCARD_REMOVE_THRESHOLD);
3331 else
3332 rc = VINF_SUCCESS;
3333
3334 if (RT_SUCCESS(rc))
3335 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
3336 }
3337 else
3338 {
3339 RTMemFree(pbmAllocated);
3340 rc = VERR_NO_MEMORY;
3341 }
3342 }
3343 else if ( RT_SUCCESS(rc)
3344 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS) /* Save state and andvance to next range. */
3345 {
3346 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3347 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3348 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3349 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3350 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3351 rc = VINF_SUCCESS;
3352 }
3353
3354 LogFlowFunc(("returns rc=%Rrc\n", rc));
3355 return rc;
3356}
3357
3358/**
3359 * Async discard helper - entry point.
3360 *
3361 * @returns VBox status code.
3362 * @param pIoCtx The I/O context to operate on.
3363 */
3364static int vdDiscardHelperAsync(PVDIOCTX pIoCtx)
3365{
3366 int rc = VINF_SUCCESS;
3367 PVBOXHDD pDisk = pIoCtx->pDisk;
3368 PCRTRANGE paRanges = pIoCtx->Req.Discard.paRanges;
3369 unsigned cRanges = pIoCtx->Req.Discard.cRanges;
3370 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3371
3372 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3373
3374 /* Check if the I/O context processed all ranges. */
3375 if ( pIoCtx->Req.Discard.idxRange == cRanges
3376 && !pIoCtx->Req.Discard.cbDiscardLeft)
3377 {
3378 LogFlowFunc(("All ranges discarded, completing\n"));
3379 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDeferredReqs*/);
3380 return VINF_SUCCESS;
3381 }
3382
3383 if (pDisk->pIoCtxLockOwner != pIoCtx)
3384 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3385
3386 if (RT_SUCCESS(rc))
3387 {
3388 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3389 size_t cbDiscardLeft = pIoCtx->Req.Discard.cbDiscardLeft;
3390 size_t cbThisDiscard;
3391
3392 pDisk->uOffsetStartLocked = offStart;
3393 pDisk->uOffsetEndLocked = offStart + cbDiscardLeft;
3394
3395 if (RT_UNLIKELY(!pDiscard))
3396 {
3397 pDiscard = vdDiscardStateCreate();
3398 if (!pDiscard)
3399 return VERR_NO_MEMORY;
3400
3401 pDisk->pDiscard = pDiscard;
3402 }
3403
3404 if (!pIoCtx->Req.Discard.cbDiscardLeft)
3405 {
3406 offStart = paRanges[pIoCtx->Req.Discard.idxRange].offStart;
3407 cbDiscardLeft = paRanges[pIoCtx->Req.Discard.idxRange].cbRange;
3408 LogFlowFunc(("New range descriptor loaded (%u) offStart=%llu cbDiscard=%zu\n",
3409 pIoCtx->Req.Discard.idxRange, offStart, cbDiscardLeft));
3410 pIoCtx->Req.Discard.idxRange++;
3411 }
3412
3413 /* Look for a matching block in the AVL tree first. */
3414 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, false);
3415 if (!pBlock || pBlock->Core.KeyLast < offStart)
3416 {
3417 PVDDISCARDBLOCK pBlockAbove = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, true);
3418
3419 /* Clip range to remain in the current block. */
3420 if (pBlockAbove)
3421 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlockAbove->Core.KeyLast - offStart + 1);
3422 else
3423 cbThisDiscard = cbDiscardLeft;
3424
3425 Assert(!(cbThisDiscard % 512));
3426 pIoCtx->Req.Discard.pBlock = NULL;
3427 pIoCtx->pfnIoCtxTransferNext = vdDiscardCurrentRangeAsync;
3428 }
3429 else
3430 {
3431 /* Range lies partly in the block, update allocation bitmap. */
3432 int32_t idxStart, idxEnd;
3433
3434 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlock->Core.KeyLast - offStart + 1);
3435
3436 AssertPtr(pBlock);
3437
3438 Assert(!(cbThisDiscard % 512));
3439 Assert(!((offStart - pBlock->Core.Key) % 512));
3440
3441 idxStart = (offStart - pBlock->Core.Key) / 512;
3442 idxEnd = idxStart + (int32_t)(cbThisDiscard / 512);
3443
3444 ASMBitClearRange(pBlock->pbmAllocated, idxStart, idxEnd);
3445
3446 cbDiscardLeft -= cbThisDiscard;
3447 offStart += cbThisDiscard;
3448
3449 /* Call the backend to discard the block if it is completely unallocated now. */
3450 if (ASMBitFirstSet((volatile void *)pBlock->pbmAllocated, (uint32_t)(pBlock->cbDiscard / 512)) == -1)
3451 {
3452 pIoCtx->Req.Discard.pBlock = pBlock;
3453 pIoCtx->pfnIoCtxTransferNext = vdDiscardWholeBlockAsync;
3454 rc = VINF_SUCCESS;
3455 }
3456 else
3457 {
3458 RTListNodeRemove(&pBlock->NodeLru);
3459 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3460
3461 /* Start with next range. */
3462 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3463 rc = VINF_SUCCESS;
3464 }
3465 }
3466
3467 /* Save state in the context. */
3468 pIoCtx->Req.Discard.offCur = offStart;
3469 pIoCtx->Req.Discard.cbDiscardLeft = cbDiscardLeft;
3470 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3471 }
3472
3473 LogFlowFunc(("returns rc=%Rrc\n", rc));
3474 return rc;
3475}
3476
3477#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3478/**
3479 * @copydoc VDPLUGIN::pfnRegisterImage
3480 */
3481static DECLCALLBACK(int) vdPluginRegisterImage(void *pvUser, PCVBOXHDDBACKEND pBackend)
3482{
3483 int rc = VINF_SUCCESS;
3484
3485 if (pBackend->cbSize == sizeof(VBOXHDDBACKEND))
3486 vdAddBackend(pBackend);
3487 else
3488 {
3489 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3490 rc = VERR_IGNORED;
3491 }
3492
3493 return rc;
3494}
3495
3496/**
3497 * @copydoc VDPLUGIN::pfnRegisterCache
3498 */
3499static DECLCALLBACK(int) vdPluginRegisterCache(void *pvUser, PCVDCACHEBACKEND pBackend)
3500{
3501 int rc = VINF_SUCCESS;
3502
3503 if (pBackend->cbSize == sizeof(VDCACHEBACKEND))
3504 vdAddCacheBackend(pBackend);
3505 else
3506 {
3507 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3508 rc = VERR_IGNORED;
3509 }
3510
3511 return rc;
3512}
3513
3514/**
3515 * @copydoc VDPLUGIN::pfnRegisterFilter
3516 */
3517static DECLCALLBACK(int) vdPluginRegisterFilter(void *pvUser, PCVDFILTERBACKEND pBackend)
3518{
3519 int rc = VINF_SUCCESS;
3520
3521 if (pBackend->cbSize == sizeof(VDFILTERBACKEND))
3522 vdAddFilterBackend(pBackend);
3523 else
3524 {
3525 LogFunc(("ignored plugin: pBackend->cbSize=%d rc=%Rrc\n", pBackend->cbSize));
3526 rc = VERR_IGNORED;
3527 }
3528
3529 return rc;
3530}
3531
3532/**
3533 * Checks whether the given plugin filename was already loaded.
3534 *
3535 * @returns true if the plugin was already loaded, false otherwise.
3536 * @param pszFilename The filename to check.
3537 */
3538static bool vdPluginFind(const char *pszFilename)
3539{
3540 PVDPLUGIN pIt = NULL;
3541
3542 RTListForEach(&g_ListPluginsLoaded, pIt, VDPLUGIN, NodePlugin)
3543 {
3544 if (!RTStrCmp(pIt->pszFilename, pszFilename))
3545 return true;
3546 }
3547
3548 return false;
3549}
3550
3551/**
3552 * Adds a plugin to the list of loaded plugins.
3553 *
3554 * @returns VBox status code.
3555 * @param hPlugin Plugin handle to add.
3556 * @param pszFilename The associated filename, sued for finding duplicates.
3557 */
3558static int vdAddPlugin(RTLDRMOD hPlugin, const char *pszFilename)
3559{
3560 int rc = VINF_SUCCESS;
3561 PVDPLUGIN pPlugin = (PVDPLUGIN)RTMemAllocZ(sizeof(VDPLUGIN));
3562
3563 if (pPlugin)
3564 {
3565 pPlugin->hPlugin = hPlugin;
3566 pPlugin->pszFilename = RTStrDup(pszFilename);
3567 if (pPlugin->pszFilename)
3568 RTListAppend(&g_ListPluginsLoaded, &pPlugin->NodePlugin);
3569 else
3570 {
3571 RTMemFree(pPlugin);
3572 rc = VERR_NO_MEMORY;
3573 }
3574 }
3575 else
3576 rc = VERR_NO_MEMORY;
3577
3578 return rc;
3579}
3580#endif
3581
3582/**
3583 * Worker for VDPluginLoadFromFilename() and vdPluginLoadFromPath().
3584 *
3585 * @returns VBox status code.
3586 * @param pszFilename The plugin filename to load.
3587 */
3588static int vdPluginLoadFromFilename(const char *pszFilename)
3589{
3590#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3591 /* Plugin loaded? Nothing to do. */
3592 if (vdPluginFind(pszFilename))
3593 return VINF_SUCCESS;
3594
3595 RTLDRMOD hPlugin = NIL_RTLDRMOD;
3596 int rc = SUPR3HardenedLdrLoadPlugIn(pszFilename, &hPlugin, NULL);
3597 if (RT_SUCCESS(rc))
3598 {
3599 VDBACKENDREGISTER BackendRegister;
3600 PFNVDPLUGINLOAD pfnVDPluginLoad = NULL;
3601
3602 BackendRegister.pfnRegisterImage = vdPluginRegisterImage;
3603 BackendRegister.pfnRegisterCache = vdPluginRegisterCache;
3604 BackendRegister.pfnRegisterFilter = vdPluginRegisterFilter;
3605
3606 rc = RTLdrGetSymbol(hPlugin, VD_PLUGIN_LOAD_NAME, (void**)&pfnVDPluginLoad);
3607 if (RT_FAILURE(rc) || !pfnVDPluginLoad)
3608 {
3609 LogFunc(("error resolving the entry point %s in plugin %s, rc=%Rrc, pfnVDPluginLoad=%#p\n",
3610 VD_PLUGIN_LOAD_NAME, pszFilename, rc, pfnVDPluginLoad));
3611 if (RT_SUCCESS(rc))
3612 rc = VERR_SYMBOL_NOT_FOUND;
3613 }
3614
3615 if (RT_SUCCESS(rc))
3616 {
3617 /* Get the function table. */
3618 rc = pfnVDPluginLoad(NULL, &BackendRegister);
3619 }
3620 else
3621 LogFunc(("ignored plugin '%s': rc=%Rrc\n", pszFilename, rc));
3622
3623 /* Create a plugin entry on success. */
3624 if (RT_SUCCESS(rc))
3625 vdAddPlugin(hPlugin, pszFilename);
3626 else
3627 RTLdrClose(hPlugin);
3628 }
3629
3630 return rc;
3631#else
3632 return VERR_NOT_IMPLEMENTED;
3633#endif
3634}
3635
3636/**
3637 * Worker for VDPluginLoadFromPath() and vdLoadDynamicBackends().
3638 *
3639 * @returns VBox status code.
3640 * @param pszPath The path to load plugins from.
3641 */
3642static int vdPluginLoadFromPath(const char *pszPath)
3643{
3644#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3645 /* To get all entries with VBoxHDD as prefix. */
3646 char *pszPluginFilter = RTPathJoinA(pszPath, VD_PLUGIN_PREFIX "*");
3647 if (!pszPluginFilter)
3648 return VERR_NO_STR_MEMORY;
3649
3650 PRTDIRENTRYEX pPluginDirEntry = NULL;
3651 PRTDIR pPluginDir = NULL;
3652 size_t cbPluginDirEntry = sizeof(RTDIRENTRYEX);
3653 int rc = RTDirOpenFiltered(&pPluginDir, pszPluginFilter, RTDIRFILTER_WINNT, 0);
3654 if (RT_FAILURE(rc))
3655 {
3656 /* On Windows the above immediately signals that there are no
3657 * files matching, while on other platforms enumerating the
3658 * files below fails. Either way: no plugins. */
3659 goto out;
3660 }
3661
3662 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(sizeof(RTDIRENTRYEX));
3663 if (!pPluginDirEntry)
3664 {
3665 rc = VERR_NO_MEMORY;
3666 goto out;
3667 }
3668
3669 while ((rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK)) != VERR_NO_MORE_FILES)
3670 {
3671 char *pszPluginPath = NULL;
3672
3673 if (rc == VERR_BUFFER_OVERFLOW)
3674 {
3675 /* allocate new buffer. */
3676 RTMemFree(pPluginDirEntry);
3677 pPluginDirEntry = (PRTDIRENTRYEX)RTMemAllocZ(cbPluginDirEntry);
3678 if (!pPluginDirEntry)
3679 {
3680 rc = VERR_NO_MEMORY;
3681 break;
3682 }
3683 /* Retry. */
3684 rc = RTDirReadEx(pPluginDir, pPluginDirEntry, &cbPluginDirEntry, RTFSOBJATTRADD_NOTHING, RTPATH_F_ON_LINK);
3685 if (RT_FAILURE(rc))
3686 break;
3687 }
3688 else if (RT_FAILURE(rc))
3689 break;
3690
3691 /* We got the new entry. */
3692 if (!RTFS_IS_FILE(pPluginDirEntry->Info.Attr.fMode))
3693 continue;
3694
3695 /* Prepend the path to the libraries. */
3696 pszPluginPath = RTPathJoinA(pszPath, pPluginDirEntry->szName);
3697 if (!pszPluginPath)
3698 {
3699 rc = VERR_NO_STR_MEMORY;
3700 break;
3701 }
3702
3703 rc = vdPluginLoadFromFilename(pszPluginPath);
3704 RTStrFree(pszPluginPath);
3705 }
3706out:
3707 if (rc == VERR_NO_MORE_FILES)
3708 rc = VINF_SUCCESS;
3709 RTStrFree(pszPluginFilter);
3710 if (pPluginDirEntry)
3711 RTMemFree(pPluginDirEntry);
3712 if (pPluginDir)
3713 RTDirClose(pPluginDir);
3714 return rc;
3715#else
3716 return VERR_NOT_IMPLEMENTED;
3717#endif
3718}
3719
3720/**
3721 * internal: scans plugin directory and loads found plugins.
3722 */
3723static int vdLoadDynamicBackends()
3724{
3725#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
3726 /*
3727 * Enumerate plugin backends from the application directory where the other
3728 * shared libraries are.
3729 */
3730 char szPath[RTPATH_MAX];
3731 int rc = RTPathAppPrivateArch(szPath, sizeof(szPath));
3732 if (RT_FAILURE(rc))
3733 return rc;
3734
3735 return vdPluginLoadFromPath(szPath);
3736#else
3737 return VINF_SUCCESS;
3738#endif
3739}
3740
3741/**
3742 * VD async I/O interface open callback.
3743 */
3744static int vdIOOpenFallback(void *pvUser, const char *pszLocation,
3745 uint32_t fOpen, PFNVDCOMPLETED pfnCompleted,
3746 void **ppStorage)
3747{
3748 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)RTMemAllocZ(sizeof(VDIIOFALLBACKSTORAGE));
3749
3750 if (!pStorage)
3751 return VERR_NO_MEMORY;
3752
3753 pStorage->pfnCompleted = pfnCompleted;
3754
3755 /* Open the file. */
3756 int rc = RTFileOpen(&pStorage->File, pszLocation, fOpen);
3757 if (RT_SUCCESS(rc))
3758 {
3759 *ppStorage = pStorage;
3760 return VINF_SUCCESS;
3761 }
3762
3763 RTMemFree(pStorage);
3764 return rc;
3765}
3766
3767/**
3768 * VD async I/O interface close callback.
3769 */
3770static int vdIOCloseFallback(void *pvUser, void *pvStorage)
3771{
3772 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3773
3774 RTFileClose(pStorage->File);
3775 RTMemFree(pStorage);
3776 return VINF_SUCCESS;
3777}
3778
3779static int vdIODeleteFallback(void *pvUser, const char *pcszFilename)
3780{
3781 return RTFileDelete(pcszFilename);
3782}
3783
3784static int vdIOMoveFallback(void *pvUser, const char *pcszSrc, const char *pcszDst, unsigned fMove)
3785{
3786 return RTFileMove(pcszSrc, pcszDst, fMove);
3787}
3788
3789static int vdIOGetFreeSpaceFallback(void *pvUser, const char *pcszFilename, int64_t *pcbFreeSpace)
3790{
3791 return RTFsQuerySizes(pcszFilename, NULL, pcbFreeSpace, NULL, NULL);
3792}
3793
3794static int vdIOGetModificationTimeFallback(void *pvUser, const char *pcszFilename, PRTTIMESPEC pModificationTime)
3795{
3796 RTFSOBJINFO info;
3797 int rc = RTPathQueryInfo(pcszFilename, &info, RTFSOBJATTRADD_NOTHING);
3798 if (RT_SUCCESS(rc))
3799 *pModificationTime = info.ModificationTime;
3800 return rc;
3801}
3802
3803/**
3804 * VD async I/O interface callback for retrieving the file size.
3805 */
3806static int vdIOGetSizeFallback(void *pvUser, void *pvStorage, uint64_t *pcbSize)
3807{
3808 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3809
3810 return RTFileGetSize(pStorage->File, pcbSize);
3811}
3812
3813/**
3814 * VD async I/O interface callback for setting the file size.
3815 */
3816static int vdIOSetSizeFallback(void *pvUser, void *pvStorage, uint64_t cbSize)
3817{
3818 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3819
3820 return RTFileSetSize(pStorage->File, cbSize);
3821}
3822
3823/**
3824 * VD async I/O interface callback for a synchronous write to the file.
3825 */
3826static int vdIOWriteSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3827 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
3828{
3829 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3830
3831 return RTFileWriteAt(pStorage->File, uOffset, pvBuf, cbWrite, pcbWritten);
3832}
3833
3834/**
3835 * VD async I/O interface callback for a synchronous read from the file.
3836 */
3837static int vdIOReadSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3838 void *pvBuf, size_t cbRead, size_t *pcbRead)
3839{
3840 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3841
3842 return RTFileReadAt(pStorage->File, uOffset, pvBuf, cbRead, pcbRead);
3843}
3844
3845/**
3846 * VD async I/O interface callback for a synchronous flush of the file data.
3847 */
3848static int vdIOFlushSyncFallback(void *pvUser, void *pvStorage)
3849{
3850 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3851
3852 return RTFileFlush(pStorage->File);
3853}
3854
3855/**
3856 * VD async I/O interface callback for a asynchronous read from the file.
3857 */
3858static int vdIOReadAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3859 PCRTSGSEG paSegments, size_t cSegments,
3860 size_t cbRead, void *pvCompletion,
3861 void **ppTask)
3862{
3863 return VERR_NOT_IMPLEMENTED;
3864}
3865
3866/**
3867 * VD async I/O interface callback for a asynchronous write to the file.
3868 */
3869static int vdIOWriteAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3870 PCRTSGSEG paSegments, size_t cSegments,
3871 size_t cbWrite, void *pvCompletion,
3872 void **ppTask)
3873{
3874 return VERR_NOT_IMPLEMENTED;
3875}
3876
3877/**
3878 * VD async I/O interface callback for a asynchronous flush of the file data.
3879 */
3880static int vdIOFlushAsyncFallback(void *pvUser, void *pStorage,
3881 void *pvCompletion, void **ppTask)
3882{
3883 return VERR_NOT_IMPLEMENTED;
3884}
3885
3886/**
3887 * Internal - Continues an I/O context after
3888 * it was halted because of an active transfer.
3889 */
3890static int vdIoCtxContinue(PVDIOCTX pIoCtx, int rcReq)
3891{
3892 PVBOXHDD pDisk = pIoCtx->pDisk;
3893 int rc = VINF_SUCCESS;
3894
3895 VD_IS_LOCKED(pDisk);
3896
3897 if (RT_FAILURE(rcReq))
3898 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
3899
3900 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
3901 {
3902 /* Continue the transfer */
3903 rc = vdIoCtxProcessLocked(pIoCtx);
3904
3905 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3906 && ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
3907 {
3908 LogFlowFunc(("I/O context completed pIoCtx=%#p\n", pIoCtx));
3909 if (pIoCtx->pIoCtxParent)
3910 {
3911 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
3912
3913 Assert(!pIoCtxParent->pIoCtxParent);
3914 if (RT_FAILURE(pIoCtx->rcReq))
3915 ASMAtomicCmpXchgS32(&pIoCtxParent->rcReq, pIoCtx->rcReq, VINF_SUCCESS);
3916
3917 ASMAtomicDecU32(&pIoCtxParent->cDataTransfersPending);
3918
3919 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE)
3920 {
3921 LogFlowFunc(("I/O context transferred %u bytes for the parent pIoCtxParent=%p\n",
3922 pIoCtx->Type.Child.cbTransferParent, pIoCtxParent));
3923
3924 /* Update the parent state. */
3925 Assert(pIoCtxParent->Req.Io.cbTransferLeft >= pIoCtx->Type.Child.cbTransferParent);
3926 ASMAtomicSubU32(&pIoCtxParent->Req.Io.cbTransferLeft, (uint32_t)pIoCtx->Type.Child.cbTransferParent);
3927 }
3928 else
3929 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH);
3930
3931 /*
3932 * A completed child write means that we finished growing the image.
3933 * We have to process any pending writes now.
3934 */
3935 vdIoCtxUnlockDisk(pDisk, pIoCtxParent, false /* fProcessDeferredReqs */);
3936
3937 /* Unblock the parent */
3938 pIoCtxParent->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3939
3940 rc = vdIoCtxProcessLocked(pIoCtxParent);
3941
3942 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3943 && ASMAtomicCmpXchgBool(&pIoCtxParent->fComplete, true, false))
3944 {
3945 LogFlowFunc(("Parent I/O context completed pIoCtxParent=%#p rcReq=%Rrc\n", pIoCtxParent, pIoCtxParent->rcReq));
3946 vdIoCtxRootComplete(pDisk, pIoCtxParent);
3947 vdThreadFinishWrite(pDisk);
3948 vdIoCtxFree(pDisk, pIoCtxParent);
3949 vdDiskProcessBlockedIoCtx(pDisk);
3950 }
3951 else if (!vdIoCtxIsDiskLockOwner(pDisk, pIoCtx))
3952 {
3953 /* Process any pending writes if the current request didn't caused another growing. */
3954 vdDiskProcessBlockedIoCtx(pDisk);
3955 }
3956 }
3957 else
3958 {
3959 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH)
3960 {
3961 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDerredReqs */);
3962 vdThreadFinishWrite(pDisk);
3963 }
3964 else if ( pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE
3965 || pIoCtx->enmTxDir == VDIOCTXTXDIR_DISCARD)
3966 vdThreadFinishWrite(pDisk);
3967 else
3968 {
3969 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_READ);
3970 vdThreadFinishRead(pDisk);
3971 }
3972
3973 LogFlowFunc(("I/O context completed pIoCtx=%#p rcReq=%Rrc\n", pIoCtx, pIoCtx->rcReq));
3974 vdIoCtxRootComplete(pDisk, pIoCtx);
3975 }
3976
3977 vdIoCtxFree(pDisk, pIoCtx);
3978 }
3979 }
3980
3981 return VINF_SUCCESS;
3982}
3983
3984/**
3985 * Internal - Called when user transfer completed.
3986 */
3987static int vdUserXferCompleted(PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
3988 PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3989 size_t cbTransfer, int rcReq)
3990{
3991 int rc = VINF_SUCCESS;
3992 bool fIoCtxContinue = true;
3993 PVBOXHDD pDisk = pIoCtx->pDisk;
3994
3995 LogFlowFunc(("pIoStorage=%#p pIoCtx=%#p pfnComplete=%#p pvUser=%#p cbTransfer=%zu rcReq=%Rrc\n",
3996 pIoStorage, pIoCtx, pfnComplete, pvUser, cbTransfer, rcReq));
3997
3998 VD_IS_LOCKED(pDisk);
3999
4000 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbTransfer);
4001 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTransfer); Assert(cbTransfer == (uint32_t)cbTransfer);
4002 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4003
4004 if (pfnComplete)
4005 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
4006
4007 if (RT_SUCCESS(rc))
4008 rc = vdIoCtxContinue(pIoCtx, rcReq);
4009 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4010 rc = VINF_SUCCESS;
4011
4012 return rc;
4013}
4014
4015/**
4016 * Internal - Called when a meta transfer completed.
4017 */
4018static int vdMetaXferCompleted(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
4019 PVDMETAXFER pMetaXfer, int rcReq)
4020{
4021 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
4022 RTLISTNODE ListIoCtxWaiting;
4023 bool fFlush;
4024
4025 LogFlowFunc(("pIoStorage=%#p pfnComplete=%#p pvUser=%#p pMetaXfer=%#p rcReq=%Rrc\n",
4026 pIoStorage, pfnComplete, pvUser, pMetaXfer, rcReq));
4027
4028 VD_IS_LOCKED(pDisk);
4029
4030 fFlush = VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_FLUSH;
4031 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4032
4033 if (!fFlush)
4034 {
4035 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
4036
4037 if (RT_FAILURE(rcReq))
4038 {
4039 /* Remove from the AVL tree. */
4040 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4041 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4042 Assert(fRemoved);
4043 RTMemFree(pMetaXfer);
4044 }
4045 else
4046 {
4047 /* Increase the reference counter to make sure it doesn't go away before the last context is processed. */
4048 pMetaXfer->cRefs++;
4049 }
4050 }
4051 else
4052 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
4053
4054 /* Go through the waiting list and continue the I/O contexts. */
4055 while (!RTListIsEmpty(&ListIoCtxWaiting))
4056 {
4057 int rc = VINF_SUCCESS;
4058 bool fContinue = true;
4059 PVDIOCTXDEFERRED pDeferred = RTListGetFirst(&ListIoCtxWaiting, VDIOCTXDEFERRED, NodeDeferred);
4060 PVDIOCTX pIoCtx = pDeferred->pIoCtx;
4061 RTListNodeRemove(&pDeferred->NodeDeferred);
4062
4063 RTMemFree(pDeferred);
4064 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4065
4066 if (pfnComplete)
4067 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
4068
4069 LogFlow(("Completion callback for I/O context %#p returned %Rrc\n", pIoCtx, rc));
4070
4071 if (RT_SUCCESS(rc))
4072 {
4073 rc = vdIoCtxContinue(pIoCtx, rcReq);
4074 AssertRC(rc);
4075 }
4076 else
4077 Assert(rc == VERR_VD_ASYNC_IO_IN_PROGRESS);
4078 }
4079
4080 /* Remove if not used anymore. */
4081 if (RT_SUCCESS(rcReq) && !fFlush)
4082 {
4083 pMetaXfer->cRefs--;
4084 if (!pMetaXfer->cRefs && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting))
4085 {
4086 /* Remove from the AVL tree. */
4087 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4088 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4089 Assert(fRemoved);
4090 RTMemFree(pMetaXfer);
4091 }
4092 }
4093 else if (fFlush)
4094 RTMemFree(pMetaXfer);
4095
4096 return VINF_SUCCESS;
4097}
4098
4099/**
4100 * Processes a list of waiting I/O tasks. The disk lock must be held by caller.
4101 *
4102 * @returns nothing.
4103 * @param pDisk The disk to process the list for.
4104 */
4105static void vdIoTaskProcessWaitingList(PVBOXHDD pDisk)
4106{
4107 LogFlowFunc(("pDisk=%#p\n", pDisk));
4108
4109 VD_IS_LOCKED(pDisk);
4110
4111 PVDIOTASK pHead = ASMAtomicXchgPtrT(&pDisk->pIoTasksPendingHead, NULL, PVDIOTASK);
4112
4113 Log(("I/O task list cleared\n"));
4114
4115 /* Reverse order. */
4116 PVDIOTASK pCur = pHead;
4117 pHead = NULL;
4118 while (pCur)
4119 {
4120 PVDIOTASK pInsert = pCur;
4121 pCur = pCur->pNext;
4122 pInsert->pNext = pHead;
4123 pHead = pInsert;
4124 }
4125
4126 while (pHead)
4127 {
4128 PVDIOSTORAGE pIoStorage = pHead->pIoStorage;
4129
4130 if (!pHead->fMeta)
4131 vdUserXferCompleted(pIoStorage, pHead->Type.User.pIoCtx,
4132 pHead->pfnComplete, pHead->pvUser,
4133 pHead->Type.User.cbTransfer, pHead->rcReq);
4134 else
4135 vdMetaXferCompleted(pIoStorage, pHead->pfnComplete, pHead->pvUser,
4136 pHead->Type.Meta.pMetaXfer, pHead->rcReq);
4137
4138 pCur = pHead;
4139 pHead = pHead->pNext;
4140 vdIoTaskFree(pDisk, pCur);
4141 }
4142}
4143
4144/**
4145 * Process any I/O context on the halted list.
4146 *
4147 * @returns nothing.
4148 * @param pDisk The disk.
4149 */
4150static void vdIoCtxProcessHaltedList(PVBOXHDD pDisk)
4151{
4152 LogFlowFunc(("pDisk=%#p\n", pDisk));
4153
4154 VD_IS_LOCKED(pDisk);
4155
4156 /* Get the waiting list and process it in FIFO order. */
4157 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHaltedHead, NULL, PVDIOCTX);
4158
4159 /* Reverse it. */
4160 PVDIOCTX pCur = pIoCtxHead;
4161 pIoCtxHead = NULL;
4162 while (pCur)
4163 {
4164 PVDIOCTX pInsert = pCur;
4165 pCur = pCur->pIoCtxNext;
4166 pInsert->pIoCtxNext = pIoCtxHead;
4167 pIoCtxHead = pInsert;
4168 }
4169
4170 /* Process now. */
4171 pCur = pIoCtxHead;
4172 while (pCur)
4173 {
4174 PVDIOCTX pTmp = pCur;
4175
4176 pCur = pCur->pIoCtxNext;
4177 pTmp->pIoCtxNext = NULL;
4178
4179 /* Continue */
4180 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
4181 vdIoCtxContinue(pTmp, pTmp->rcReq);
4182 }
4183}
4184
4185/**
4186 * Unlock the disk and process pending tasks.
4187 *
4188 * @returns VBox status code.
4189 * @param pDisk The disk to unlock.
4190 */
4191static int vdDiskUnlock(PVBOXHDD pDisk, PVDIOCTX pIoCtxRc)
4192{
4193 int rc = VINF_SUCCESS;
4194
4195 VD_IS_LOCKED(pDisk);
4196
4197 /*
4198 * Process the list of waiting I/O tasks first
4199 * because they might complete I/O contexts.
4200 * Same for the list of halted I/O contexts.
4201 * Afterwards comes the list of new I/O contexts.
4202 */
4203 vdIoTaskProcessWaitingList(pDisk);
4204 vdIoCtxProcessHaltedList(pDisk);
4205 rc = vdDiskProcessWaitingIoCtx(pDisk, pIoCtxRc);
4206 ASMAtomicXchgBool(&pDisk->fLocked, false);
4207
4208 /*
4209 * Need to check for new I/O tasks and waiting I/O contexts now
4210 * again as other threads might added them while we processed
4211 * previous lists.
4212 */
4213 while ( ASMAtomicUoReadPtrT(&pDisk->pIoCtxHead, PVDIOCTX) != NULL
4214 || ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK) != NULL
4215 || ASMAtomicUoReadPtrT(&pDisk->pIoCtxHaltedHead, PVDIOCTX) != NULL)
4216 {
4217 /* Try lock disk again. */
4218 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4219 {
4220 vdIoTaskProcessWaitingList(pDisk);
4221 vdIoCtxProcessHaltedList(pDisk);
4222 vdDiskProcessWaitingIoCtx(pDisk, NULL);
4223 ASMAtomicXchgBool(&pDisk->fLocked, false);
4224 }
4225 else /* Let the other thread everything when he unlocks the disk. */
4226 break;
4227 }
4228
4229 return rc;
4230}
4231
4232/**
4233 * Try to lock the disk to complete pressing of the I/O task.
4234 * The completion is deferred if the disk is locked already.
4235 *
4236 * @returns nothing.
4237 * @param pIoTask The I/O task to complete.
4238 */
4239static void vdXferTryLockDiskDeferIoTask(PVDIOTASK pIoTask)
4240{
4241 PVDIOSTORAGE pIoStorage = pIoTask->pIoStorage;
4242 PVBOXHDD pDisk = pIoStorage->pVDIo->pDisk;
4243
4244 Log(("Deferring I/O task pIoTask=%p\n", pIoTask));
4245
4246 /* Put it on the waiting list. */
4247 PVDIOTASK pNext = ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK);
4248 PVDIOTASK pHeadOld;
4249 pIoTask->pNext = pNext;
4250 while (!ASMAtomicCmpXchgExPtr(&pDisk->pIoTasksPendingHead, pIoTask, pNext, &pHeadOld))
4251 {
4252 pNext = pHeadOld;
4253 Assert(pNext != pIoTask);
4254 pIoTask->pNext = pNext;
4255 ASMNopPause();
4256 }
4257
4258 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4259 {
4260 /* Release disk lock, it will take care of processing all lists. */
4261 vdDiskUnlock(pDisk, NULL);
4262 }
4263}
4264
4265static int vdIOIntReqCompleted(void *pvUser, int rcReq)
4266{
4267 PVDIOTASK pIoTask = (PVDIOTASK)pvUser;
4268
4269 LogFlowFunc(("Task completed pIoTask=%#p\n", pIoTask));
4270
4271 pIoTask->rcReq = rcReq;
4272 vdXferTryLockDiskDeferIoTask(pIoTask);
4273 return VINF_SUCCESS;
4274}
4275
4276/**
4277 * VD I/O interface callback for opening a file.
4278 */
4279static int vdIOIntOpen(void *pvUser, const char *pszLocation,
4280 unsigned uOpenFlags, PPVDIOSTORAGE ppIoStorage)
4281{
4282 int rc = VINF_SUCCESS;
4283 PVDIO pVDIo = (PVDIO)pvUser;
4284 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
4285
4286 if (!pIoStorage)
4287 return VERR_NO_MEMORY;
4288
4289 /* Create the AVl tree. */
4290 pIoStorage->pTreeMetaXfers = (PAVLRFOFFTREE)RTMemAllocZ(sizeof(AVLRFOFFTREE));
4291 if (pIoStorage->pTreeMetaXfers)
4292 {
4293 rc = pVDIo->pInterfaceIo->pfnOpen(pVDIo->pInterfaceIo->Core.pvUser,
4294 pszLocation, uOpenFlags,
4295 vdIOIntReqCompleted,
4296 &pIoStorage->pStorage);
4297 if (RT_SUCCESS(rc))
4298 {
4299 pIoStorage->pVDIo = pVDIo;
4300 *ppIoStorage = pIoStorage;
4301 return VINF_SUCCESS;
4302 }
4303
4304 RTMemFree(pIoStorage->pTreeMetaXfers);
4305 }
4306 else
4307 rc = VERR_NO_MEMORY;
4308
4309 RTMemFree(pIoStorage);
4310 return rc;
4311}
4312
4313static int vdIOIntTreeMetaXferDestroy(PAVLRFOFFNODECORE pNode, void *pvUser)
4314{
4315 AssertMsgFailed(("Tree should be empty at this point!\n"));
4316 return VINF_SUCCESS;
4317}
4318
4319static int vdIOIntClose(void *pvUser, PVDIOSTORAGE pIoStorage)
4320{
4321 int rc = VINF_SUCCESS;
4322 PVDIO pVDIo = (PVDIO)pvUser;
4323
4324 /* We free everything here, even if closing the file failed for some reason. */
4325 rc = pVDIo->pInterfaceIo->pfnClose(pVDIo->pInterfaceIo->Core.pvUser, pIoStorage->pStorage);
4326 RTAvlrFileOffsetDestroy(pIoStorage->pTreeMetaXfers, vdIOIntTreeMetaXferDestroy, NULL);
4327 RTMemFree(pIoStorage->pTreeMetaXfers);
4328 RTMemFree(pIoStorage);
4329 return rc;
4330}
4331
4332static int vdIOIntDelete(void *pvUser, const char *pcszFilename)
4333{
4334 PVDIO pVDIo = (PVDIO)pvUser;
4335 return pVDIo->pInterfaceIo->pfnDelete(pVDIo->pInterfaceIo->Core.pvUser,
4336 pcszFilename);
4337}
4338
4339static int vdIOIntMove(void *pvUser, const char *pcszSrc, const char *pcszDst,
4340 unsigned fMove)
4341{
4342 PVDIO pVDIo = (PVDIO)pvUser;
4343 return pVDIo->pInterfaceIo->pfnMove(pVDIo->pInterfaceIo->Core.pvUser,
4344 pcszSrc, pcszDst, fMove);
4345}
4346
4347static int vdIOIntGetFreeSpace(void *pvUser, const char *pcszFilename,
4348 int64_t *pcbFreeSpace)
4349{
4350 PVDIO pVDIo = (PVDIO)pvUser;
4351 return pVDIo->pInterfaceIo->pfnGetFreeSpace(pVDIo->pInterfaceIo->Core.pvUser,
4352 pcszFilename, pcbFreeSpace);
4353}
4354
4355static int vdIOIntGetModificationTime(void *pvUser, const char *pcszFilename,
4356 PRTTIMESPEC pModificationTime)
4357{
4358 PVDIO pVDIo = (PVDIO)pvUser;
4359 return pVDIo->pInterfaceIo->pfnGetModificationTime(pVDIo->pInterfaceIo->Core.pvUser,
4360 pcszFilename, pModificationTime);
4361}
4362
4363static int vdIOIntGetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4364 uint64_t *pcbSize)
4365{
4366 PVDIO pVDIo = (PVDIO)pvUser;
4367 return pVDIo->pInterfaceIo->pfnGetSize(pVDIo->pInterfaceIo->Core.pvUser,
4368 pIoStorage->pStorage, pcbSize);
4369}
4370
4371static int vdIOIntSetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
4372 uint64_t cbSize)
4373{
4374 PVDIO pVDIo = (PVDIO)pvUser;
4375 return pVDIo->pInterfaceIo->pfnSetSize(pVDIo->pInterfaceIo->Core.pvUser,
4376 pIoStorage->pStorage, cbSize);
4377}
4378
4379static int vdIOIntReadUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4380 PVDIOCTX pIoCtx, size_t cbRead)
4381{
4382 int rc = VINF_SUCCESS;
4383 PVDIO pVDIo = (PVDIO)pvUser;
4384 PVBOXHDD pDisk = pVDIo->pDisk;
4385
4386 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbRead=%u\n",
4387 pvUser, pIoStorage, uOffset, pIoCtx, cbRead));
4388
4389 /** @todo: Enable check for sync I/O later. */
4390 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4391 VD_IS_LOCKED(pDisk);
4392
4393 Assert(cbRead > 0);
4394
4395 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4396 {
4397 RTSGSEG Seg;
4398 unsigned cSegments = 1;
4399 size_t cbTaskRead = 0;
4400
4401 /* Synchronous I/O contexts only have one buffer segment. */
4402 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4403 ("Invalid number of buffer segments for synchronous I/O context"),
4404 VERR_INVALID_PARAMETER);
4405
4406 cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbRead);
4407 Assert(cbRead == cbTaskRead);
4408 Assert(cSegments == 1);
4409 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4410 pIoStorage->pStorage, uOffset,
4411 Seg.pvSeg, cbRead, NULL);
4412 if (RT_SUCCESS(rc))
4413 {
4414 Assert(cbRead == (uint32_t)cbRead);
4415 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbRead);
4416 }
4417 }
4418 else
4419 {
4420 /* Build the S/G array and spawn a new I/O task */
4421 while (cbRead)
4422 {
4423 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4424 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4425 size_t cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbRead);
4426
4427 Assert(cSegments > 0);
4428 Assert(cbTaskRead > 0);
4429 AssertMsg(cbTaskRead <= cbRead, ("Invalid number of bytes to read\n"));
4430
4431 LogFlow(("Reading %u bytes into %u segments\n", cbTaskRead, cSegments));
4432
4433#ifdef RT_STRICT
4434 for (unsigned i = 0; i < cSegments; i++)
4435 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4436 ("Segment %u is invalid\n", i));
4437#endif
4438
4439 Assert(cbTaskRead == (uint32_t)cbTaskRead);
4440 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, NULL, NULL, pIoCtx, (uint32_t)cbTaskRead);
4441
4442 if (!pIoTask)
4443 return VERR_NO_MEMORY;
4444
4445 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4446
4447 void *pvTask;
4448 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4449 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4450 pIoStorage->pStorage, uOffset,
4451 aSeg, cSegments, cbTaskRead, pIoTask,
4452 &pvTask);
4453 if (RT_SUCCESS(rc))
4454 {
4455 AssertMsg(cbTaskRead <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4456 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskRead);
4457 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4458 vdIoTaskFree(pDisk, pIoTask);
4459 }
4460 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4461 {
4462 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4463 vdIoTaskFree(pDisk, pIoTask);
4464 break;
4465 }
4466
4467 uOffset += cbTaskRead;
4468 cbRead -= cbTaskRead;
4469 }
4470 }
4471
4472 LogFlowFunc(("returns rc=%Rrc\n", rc));
4473 return rc;
4474}
4475
4476static int vdIOIntWriteUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4477 PVDIOCTX pIoCtx, size_t cbWrite, PFNVDXFERCOMPLETED pfnComplete,
4478 void *pvCompleteUser)
4479{
4480 int rc = VINF_SUCCESS;
4481 PVDIO pVDIo = (PVDIO)pvUser;
4482 PVBOXHDD pDisk = pVDIo->pDisk;
4483
4484 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbWrite=%u\n",
4485 pvUser, pIoStorage, uOffset, pIoCtx, cbWrite));
4486
4487 /** @todo: Enable check for sync I/O later. */
4488 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4489 VD_IS_LOCKED(pDisk);
4490
4491 Assert(cbWrite > 0);
4492
4493 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4494 {
4495 RTSGSEG Seg;
4496 unsigned cSegments = 1;
4497 size_t cbTaskWrite = 0;
4498
4499 /* Synchronous I/O contexts only have one buffer segment. */
4500 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4501 ("Invalid number of buffer segments for synchronous I/O context"),
4502 VERR_INVALID_PARAMETER);
4503
4504 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbWrite);
4505 Assert(cbWrite == cbTaskWrite);
4506 Assert(cSegments == 1);
4507 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4508 pIoStorage->pStorage, uOffset,
4509 Seg.pvSeg, cbWrite, NULL);
4510 if (RT_SUCCESS(rc))
4511 {
4512 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbWrite);
4513 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbWrite);
4514 }
4515 }
4516 else
4517 {
4518 /* Build the S/G array and spawn a new I/O task */
4519 while (cbWrite)
4520 {
4521 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4522 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4523 size_t cbTaskWrite = 0;
4524
4525 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbWrite);
4526
4527 Assert(cSegments > 0);
4528 Assert(cbTaskWrite > 0);
4529 AssertMsg(cbTaskWrite <= cbWrite, ("Invalid number of bytes to write\n"));
4530
4531 LogFlow(("Writing %u bytes from %u segments\n", cbTaskWrite, cSegments));
4532
4533#ifdef DEBUG
4534 for (unsigned i = 0; i < cSegments; i++)
4535 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4536 ("Segment %u is invalid\n", i));
4537#endif
4538
4539 Assert(cbTaskWrite == (uint32_t)cbTaskWrite);
4540 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, pfnComplete, pvCompleteUser, pIoCtx, (uint32_t)cbTaskWrite);
4541
4542 if (!pIoTask)
4543 return VERR_NO_MEMORY;
4544
4545 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4546
4547 void *pvTask;
4548 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4549 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4550 pIoStorage->pStorage,
4551 uOffset, aSeg, cSegments,
4552 cbTaskWrite, pIoTask, &pvTask);
4553 if (RT_SUCCESS(rc))
4554 {
4555 AssertMsg(cbTaskWrite <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4556 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskWrite);
4557 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4558 vdIoTaskFree(pDisk, pIoTask);
4559 }
4560 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4561 {
4562 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4563 vdIoTaskFree(pDisk, pIoTask);
4564 break;
4565 }
4566
4567 uOffset += cbTaskWrite;
4568 cbWrite -= cbTaskWrite;
4569 }
4570 }
4571
4572 LogFlowFunc(("returns rc=%Rrc\n", rc));
4573 return rc;
4574}
4575
4576static int vdIOIntReadMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4577 void *pvBuf, size_t cbRead, PVDIOCTX pIoCtx,
4578 PPVDMETAXFER ppMetaXfer, PFNVDXFERCOMPLETED pfnComplete,
4579 void *pvCompleteUser)
4580{
4581 PVDIO pVDIo = (PVDIO)pvUser;
4582 PVBOXHDD pDisk = pVDIo->pDisk;
4583 int rc = VINF_SUCCESS;
4584 RTSGSEG Seg;
4585 PVDIOTASK pIoTask;
4586 PVDMETAXFER pMetaXfer = NULL;
4587 void *pvTask = NULL;
4588
4589 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbRead=%u\n",
4590 pvUser, pIoStorage, uOffset, pvBuf, cbRead));
4591
4592 AssertMsgReturn( pIoCtx
4593 || (!ppMetaXfer && !pfnComplete && !pvCompleteUser),
4594 ("A synchronous metadata read is requested but the parameters are wrong\n"),
4595 VERR_INVALID_POINTER);
4596
4597 /** @todo: Enable check for sync I/O later. */
4598 if ( pIoCtx
4599 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4600 VD_IS_LOCKED(pDisk);
4601
4602 if ( !pIoCtx
4603 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4604 {
4605 /* Handle synchronous metadata I/O. */
4606 /** @todo: Integrate with metadata transfers below. */
4607 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4608 pIoStorage->pStorage, uOffset,
4609 pvBuf, cbRead, NULL);
4610 if (ppMetaXfer)
4611 *ppMetaXfer = NULL;
4612 }
4613 else
4614 {
4615 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4616 if (!pMetaXfer)
4617 {
4618#ifdef RT_STRICT
4619 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGetBestFit(pIoStorage->pTreeMetaXfers, uOffset, false /* fAbove */);
4620 AssertMsg(!pMetaXfer || (pMetaXfer->Core.Key + (RTFOFF)pMetaXfer->cbMeta <= (RTFOFF)uOffset),
4621 ("Overlapping meta transfers!\n"));
4622#endif
4623
4624 /* Allocate a new meta transfer. */
4625 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbRead);
4626 if (!pMetaXfer)
4627 return VERR_NO_MEMORY;
4628
4629 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4630 if (!pIoTask)
4631 {
4632 RTMemFree(pMetaXfer);
4633 return VERR_NO_MEMORY;
4634 }
4635
4636 Seg.cbSeg = cbRead;
4637 Seg.pvSeg = pMetaXfer->abData;
4638
4639 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_READ);
4640 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4641 pIoStorage->pStorage,
4642 uOffset, &Seg, 1,
4643 cbRead, pIoTask, &pvTask);
4644
4645 if (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4646 {
4647 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4648 Assert(fInserted);
4649 }
4650 else
4651 RTMemFree(pMetaXfer);
4652
4653 if (RT_SUCCESS(rc))
4654 {
4655 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4656 vdIoTaskFree(pDisk, pIoTask);
4657 }
4658 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS && !pfnComplete)
4659 rc = VERR_VD_NOT_ENOUGH_METADATA;
4660 }
4661
4662 Assert(VALID_PTR(pMetaXfer) || RT_FAILURE(rc));
4663
4664 if (RT_SUCCESS(rc) || rc == VERR_VD_NOT_ENOUGH_METADATA || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4665 {
4666 /* If it is pending add the request to the list. */
4667 if (VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_READ)
4668 {
4669 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4670 AssertPtr(pDeferred);
4671
4672 RTListInit(&pDeferred->NodeDeferred);
4673 pDeferred->pIoCtx = pIoCtx;
4674
4675 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4676 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4677 rc = VERR_VD_NOT_ENOUGH_METADATA;
4678 }
4679 else
4680 {
4681 /* Transfer the data. */
4682 pMetaXfer->cRefs++;
4683 Assert(pMetaXfer->cbMeta >= cbRead);
4684 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4685 memcpy(pvBuf, pMetaXfer->abData, cbRead);
4686 *ppMetaXfer = pMetaXfer;
4687 }
4688 }
4689 }
4690
4691 LogFlowFunc(("returns rc=%Rrc\n", rc));
4692 return rc;
4693}
4694
4695static int vdIOIntWriteMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4696 const void *pvBuf, size_t cbWrite, PVDIOCTX pIoCtx,
4697 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4698{
4699 PVDIO pVDIo = (PVDIO)pvUser;
4700 PVBOXHDD pDisk = pVDIo->pDisk;
4701 int rc = VINF_SUCCESS;
4702 RTSGSEG Seg;
4703 PVDIOTASK pIoTask;
4704 PVDMETAXFER pMetaXfer = NULL;
4705 bool fInTree = false;
4706 void *pvTask = NULL;
4707
4708 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbWrite=%u\n",
4709 pvUser, pIoStorage, uOffset, pvBuf, cbWrite));
4710
4711 AssertMsgReturn( pIoCtx
4712 || (!pfnComplete && !pvCompleteUser),
4713 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4714 VERR_INVALID_POINTER);
4715
4716 /** @todo: Enable check for sync I/O later. */
4717 if ( pIoCtx
4718 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4719 VD_IS_LOCKED(pDisk);
4720
4721 if ( !pIoCtx
4722 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4723 {
4724 /* Handle synchronous metadata I/O. */
4725 /** @todo: Integrate with metadata transfers below. */
4726 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4727 pIoStorage->pStorage, uOffset,
4728 pvBuf, cbWrite, NULL);
4729 }
4730 else
4731 {
4732 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4733 if (!pMetaXfer)
4734 {
4735 /* Allocate a new meta transfer. */
4736 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbWrite);
4737 if (!pMetaXfer)
4738 return VERR_NO_MEMORY;
4739 }
4740 else
4741 {
4742 Assert(pMetaXfer->cbMeta >= cbWrite);
4743 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4744 fInTree = true;
4745 }
4746
4747 Assert(VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE);
4748
4749 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4750 if (!pIoTask)
4751 {
4752 RTMemFree(pMetaXfer);
4753 return VERR_NO_MEMORY;
4754 }
4755
4756 memcpy(pMetaXfer->abData, pvBuf, cbWrite);
4757 Seg.cbSeg = cbWrite;
4758 Seg.pvSeg = pMetaXfer->abData;
4759
4760 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4761
4762 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_WRITE);
4763 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4764 pIoStorage->pStorage,
4765 uOffset, &Seg, 1, cbWrite, pIoTask,
4766 &pvTask);
4767 if (RT_SUCCESS(rc))
4768 {
4769 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4770 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4771 vdIoTaskFree(pDisk, pIoTask);
4772 if (fInTree && !pMetaXfer->cRefs)
4773 {
4774 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4775 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4776 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4777 RTMemFree(pMetaXfer);
4778 pMetaXfer = NULL;
4779 }
4780 }
4781 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4782 {
4783 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4784 AssertPtr(pDeferred);
4785
4786 RTListInit(&pDeferred->NodeDeferred);
4787 pDeferred->pIoCtx = pIoCtx;
4788
4789 if (!fInTree)
4790 {
4791 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4792 Assert(fInserted);
4793 }
4794
4795 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4796 }
4797 else
4798 {
4799 RTMemFree(pMetaXfer);
4800 pMetaXfer = NULL;
4801 }
4802 }
4803
4804 LogFlowFunc(("returns rc=%Rrc\n", rc));
4805 return rc;
4806}
4807
4808static void vdIOIntMetaXferRelease(void *pvUser, PVDMETAXFER pMetaXfer)
4809{
4810 PVDIO pVDIo = (PVDIO)pvUser;
4811 PVBOXHDD pDisk = pVDIo->pDisk;
4812 PVDIOSTORAGE pIoStorage;
4813
4814 /*
4815 * It is possible that we get called with a NULL metadata xfer handle
4816 * for synchronous I/O. Just exit.
4817 */
4818 if (!pMetaXfer)
4819 return;
4820
4821 pIoStorage = pMetaXfer->pIoStorage;
4822
4823 VD_IS_LOCKED(pDisk);
4824
4825 Assert( VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE
4826 || VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
4827 Assert(pMetaXfer->cRefs > 0);
4828
4829 pMetaXfer->cRefs--;
4830 if ( !pMetaXfer->cRefs
4831 && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting)
4832 && VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
4833 {
4834 /* Free the meta data entry. */
4835 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4836 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4837 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n"));
4838
4839 RTMemFree(pMetaXfer);
4840 }
4841}
4842
4843static int vdIOIntFlush(void *pvUser, PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
4844 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4845{
4846 PVDIO pVDIo = (PVDIO)pvUser;
4847 PVBOXHDD pDisk = pVDIo->pDisk;
4848 int rc = VINF_SUCCESS;
4849 PVDIOTASK pIoTask;
4850 PVDMETAXFER pMetaXfer = NULL;
4851 void *pvTask = NULL;
4852
4853 LogFlowFunc(("pvUser=%#p pIoStorage=%#p pIoCtx=%#p\n",
4854 pvUser, pIoStorage, pIoCtx));
4855
4856 AssertMsgReturn( pIoCtx
4857 || (!pfnComplete && !pvCompleteUser),
4858 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4859 VERR_INVALID_POINTER);
4860
4861 /** @todo: Enable check for sync I/O later. */
4862 if ( pIoCtx
4863 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4864 VD_IS_LOCKED(pDisk);
4865
4866 if (pVDIo->fIgnoreFlush)
4867 return VINF_SUCCESS;
4868
4869 if ( !pIoCtx
4870 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4871 {
4872 /* Handle synchronous flushes. */
4873 /** @todo: Integrate with metadata transfers below. */
4874 rc = pVDIo->pInterfaceIo->pfnFlushSync(pVDIo->pInterfaceIo->Core.pvUser,
4875 pIoStorage->pStorage);
4876 }
4877 else
4878 {
4879 /* Allocate a new meta transfer. */
4880 pMetaXfer = vdMetaXferAlloc(pIoStorage, 0, 0);
4881 if (!pMetaXfer)
4882 return VERR_NO_MEMORY;
4883
4884 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvUser, pMetaXfer);
4885 if (!pIoTask)
4886 {
4887 RTMemFree(pMetaXfer);
4888 return VERR_NO_MEMORY;
4889 }
4890
4891 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4892
4893 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4894 AssertPtr(pDeferred);
4895
4896 RTListInit(&pDeferred->NodeDeferred);
4897 pDeferred->pIoCtx = pIoCtx;
4898
4899 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4900 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_FLUSH);
4901 rc = pVDIo->pInterfaceIo->pfnFlushAsync(pVDIo->pInterfaceIo->Core.pvUser,
4902 pIoStorage->pStorage,
4903 pIoTask, &pvTask);
4904 if (RT_SUCCESS(rc))
4905 {
4906 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4907 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4908 vdIoTaskFree(pDisk, pIoTask);
4909 RTMemFree(pDeferred);
4910 RTMemFree(pMetaXfer);
4911 }
4912 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4913 RTMemFree(pMetaXfer);
4914 }
4915
4916 LogFlowFunc(("returns rc=%Rrc\n", rc));
4917 return rc;
4918}
4919
4920static size_t vdIOIntIoCtxCopyTo(void *pvUser, PVDIOCTX pIoCtx,
4921 const void *pvBuf, size_t cbBuf)
4922{
4923 PVDIO pVDIo = (PVDIO)pvUser;
4924 PVBOXHDD pDisk = pVDIo->pDisk;
4925 size_t cbCopied = 0;
4926
4927 /** @todo: Enable check for sync I/O later. */
4928 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4929 VD_IS_LOCKED(pDisk);
4930
4931 cbCopied = vdIoCtxCopyTo(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4932 Assert(cbCopied == cbBuf);
4933
4934 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCopied); - triggers with vdCopyHelper/dmgRead.
4935 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4936
4937 return cbCopied;
4938}
4939
4940static size_t vdIOIntIoCtxCopyFrom(void *pvUser, PVDIOCTX pIoCtx,
4941 void *pvBuf, size_t cbBuf)
4942{
4943 PVDIO pVDIo = (PVDIO)pvUser;
4944 PVBOXHDD pDisk = pVDIo->pDisk;
4945 size_t cbCopied = 0;
4946
4947 /** @todo: Enable check for sync I/O later. */
4948 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4949 VD_IS_LOCKED(pDisk);
4950
4951 cbCopied = vdIoCtxCopyFrom(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4952 Assert(cbCopied == cbBuf);
4953
4954 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft > cbCopied); - triggers with vdCopyHelper/dmgRead.
4955 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4956
4957 return cbCopied;
4958}
4959
4960static size_t vdIOIntIoCtxSet(void *pvUser, PVDIOCTX pIoCtx, int ch, size_t cb)
4961{
4962 PVDIO pVDIo = (PVDIO)pvUser;
4963 PVBOXHDD pDisk = pVDIo->pDisk;
4964 size_t cbSet = 0;
4965
4966 /** @todo: Enable check for sync I/O later. */
4967 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4968 VD_IS_LOCKED(pDisk);
4969
4970 cbSet = vdIoCtxSet(pIoCtx, ch, cb);
4971 Assert(cbSet == cb);
4972
4973 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbSet); - triggers with vdCopyHelper/dmgRead.
4974 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbSet);
4975
4976 return cbSet;
4977}
4978
4979static size_t vdIOIntIoCtxSegArrayCreate(void *pvUser, PVDIOCTX pIoCtx,
4980 PRTSGSEG paSeg, unsigned *pcSeg,
4981 size_t cbData)
4982{
4983 PVDIO pVDIo = (PVDIO)pvUser;
4984 PVBOXHDD pDisk = pVDIo->pDisk;
4985 size_t cbCreated = 0;
4986
4987 /** @todo: It is possible that this gets called from a filter plugin
4988 * outside of the disk lock. Refine assertion or remove completely. */
4989#if 0
4990 /** @todo: Enable check for sync I/O later. */
4991 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4992 VD_IS_LOCKED(pDisk);
4993#endif
4994
4995 cbCreated = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, paSeg, pcSeg, cbData);
4996 Assert(!paSeg || cbData == cbCreated);
4997
4998 return cbCreated;
4999}
5000
5001static void vdIOIntIoCtxCompleted(void *pvUser, PVDIOCTX pIoCtx, int rcReq,
5002 size_t cbCompleted)
5003{
5004 PVDIO pVDIo = (PVDIO)pvUser;
5005 PVBOXHDD pDisk = pVDIo->pDisk;
5006
5007 LogFlowFunc(("pvUser=%#p pIoCtx=%#p rcReq=%Rrc cbCompleted=%zu\n",
5008 pvUser, pIoCtx, rcReq, cbCompleted));
5009
5010 /*
5011 * Grab the disk critical section to avoid races with other threads which
5012 * might still modify the I/O context.
5013 * Example is that iSCSI is doing an asynchronous write but calls us already
5014 * while the other thread is still hanging in vdWriteHelperAsync and couldn't update
5015 * the blocked state yet.
5016 * It can overwrite the state to true before we call vdIoCtxContinue and the
5017 * the request would hang indefinite.
5018 */
5019 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
5020 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCompleted);
5021 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCompleted);
5022
5023 /* Set next transfer function if the current one finished.
5024 * @todo: Find a better way to prevent vdIoCtxContinue from calling the current helper again. */
5025 if (!pIoCtx->Req.Io.cbTransferLeft)
5026 {
5027 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
5028 pIoCtx->pfnIoCtxTransferNext = NULL;
5029 }
5030
5031 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHaltedHead, pIoCtx);
5032 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
5033 {
5034 /* Immediately drop the lock again, it will take care of processing the list. */
5035 vdDiskUnlock(pDisk, NULL);
5036 }
5037}
5038
5039static DECLCALLBACK(bool) vdIOIntIoCtxIsSynchronous(void *pvUser, PVDIOCTX pIoCtx)
5040{
5041 NOREF(pvUser);
5042 return !!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC);
5043}
5044
5045static DECLCALLBACK(bool) vdIOIntIoCtxIsZero(void *pvUser, PVDIOCTX pIoCtx, size_t cbCheck,
5046 bool fAdvance)
5047{
5048 NOREF(pvUser);
5049
5050 bool fIsZero = RTSgBufIsZero(&pIoCtx->Req.Io.SgBuf, cbCheck);
5051 if (fIsZero && fAdvance)
5052 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbCheck);
5053
5054 return fIsZero;
5055}
5056
5057static DECLCALLBACK(size_t) vdIOIntIoCtxGetDataUnitSize(void *pvUser, PVDIOCTX pIoCtx)
5058{
5059 PVDIO pVDIo = (PVDIO)pvUser;
5060 PVBOXHDD pDisk = pVDIo->pDisk;
5061
5062 PVDIMAGE pImage = vdGetImageByNumber(pDisk, VD_LAST_IMAGE);
5063 AssertPtrReturn(pImage, 0);
5064 return pImage->Backend->pfnGetSectorSize(pImage->pBackendData);
5065}
5066
5067/**
5068 * VD I/O interface callback for opening a file (limited version for VDGetFormat).
5069 */
5070static int vdIOIntOpenLimited(void *pvUser, const char *pszLocation,
5071 uint32_t fOpen, PPVDIOSTORAGE ppIoStorage)
5072{
5073 int rc = VINF_SUCCESS;
5074 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5075 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
5076
5077 if (!pIoStorage)
5078 return VERR_NO_MEMORY;
5079
5080 rc = pInterfaceIo->pfnOpen(NULL, pszLocation, fOpen, NULL, &pIoStorage->pStorage);
5081 if (RT_SUCCESS(rc))
5082 *ppIoStorage = pIoStorage;
5083 else
5084 RTMemFree(pIoStorage);
5085
5086 return rc;
5087}
5088
5089static int vdIOIntCloseLimited(void *pvUser, PVDIOSTORAGE pIoStorage)
5090{
5091 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5092 int rc = pInterfaceIo->pfnClose(NULL, pIoStorage->pStorage);
5093
5094 RTMemFree(pIoStorage);
5095 return rc;
5096}
5097
5098static int vdIOIntDeleteLimited(void *pvUser, const char *pcszFilename)
5099{
5100 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5101 return pInterfaceIo->pfnDelete(NULL, pcszFilename);
5102}
5103
5104static int vdIOIntMoveLimited(void *pvUser, const char *pcszSrc,
5105 const char *pcszDst, unsigned fMove)
5106{
5107 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5108 return pInterfaceIo->pfnMove(NULL, pcszSrc, pcszDst, fMove);
5109}
5110
5111static int vdIOIntGetFreeSpaceLimited(void *pvUser, const char *pcszFilename,
5112 int64_t *pcbFreeSpace)
5113{
5114 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5115 return pInterfaceIo->pfnGetFreeSpace(NULL, pcszFilename, pcbFreeSpace);
5116}
5117
5118static int vdIOIntGetModificationTimeLimited(void *pvUser,
5119 const char *pcszFilename,
5120 PRTTIMESPEC pModificationTime)
5121{
5122 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5123 return pInterfaceIo->pfnGetModificationTime(NULL, pcszFilename, pModificationTime);
5124}
5125
5126static int vdIOIntGetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
5127 uint64_t *pcbSize)
5128{
5129 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5130 return pInterfaceIo->pfnGetSize(NULL, pIoStorage->pStorage, pcbSize);
5131}
5132
5133static int vdIOIntSetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
5134 uint64_t cbSize)
5135{
5136 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5137 return pInterfaceIo->pfnSetSize(NULL, pIoStorage->pStorage, cbSize);
5138}
5139
5140static int vdIOIntWriteUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
5141 uint64_t uOffset, PVDIOCTX pIoCtx,
5142 size_t cbWrite,
5143 PFNVDXFERCOMPLETED pfnComplete,
5144 void *pvCompleteUser)
5145{
5146 NOREF(pvUser);
5147 NOREF(pStorage);
5148 NOREF(uOffset);
5149 NOREF(pIoCtx);
5150 NOREF(cbWrite);
5151 NOREF(pfnComplete);
5152 NOREF(pvCompleteUser);
5153 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
5154}
5155
5156static int vdIOIntReadUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
5157 uint64_t uOffset, PVDIOCTX pIoCtx,
5158 size_t cbRead)
5159{
5160 NOREF(pvUser);
5161 NOREF(pStorage);
5162 NOREF(uOffset);
5163 NOREF(pIoCtx);
5164 NOREF(cbRead);
5165 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
5166}
5167
5168static int vdIOIntWriteMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
5169 uint64_t uOffset, const void *pvBuffer,
5170 size_t cbBuffer, PVDIOCTX pIoCtx,
5171 PFNVDXFERCOMPLETED pfnComplete,
5172 void *pvCompleteUser)
5173{
5174 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5175
5176 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
5177 ("Async I/O not implemented for the limited interface"),
5178 VERR_NOT_SUPPORTED);
5179
5180 return pInterfaceIo->pfnWriteSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
5181}
5182
5183static int vdIOIntReadMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
5184 uint64_t uOffset, void *pvBuffer,
5185 size_t cbBuffer, PVDIOCTX pIoCtx,
5186 PPVDMETAXFER ppMetaXfer,
5187 PFNVDXFERCOMPLETED pfnComplete,
5188 void *pvCompleteUser)
5189{
5190 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5191
5192 AssertMsgReturn(!pIoCtx && !ppMetaXfer && !pfnComplete && !pvCompleteUser,
5193 ("Async I/O not implemented for the limited interface"),
5194 VERR_NOT_SUPPORTED);
5195
5196 return pInterfaceIo->pfnReadSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
5197}
5198
5199static int vdIOIntMetaXferReleaseLimited(void *pvUser, PVDMETAXFER pMetaXfer)
5200{
5201 /* This is a NOP in this case. */
5202 NOREF(pvUser);
5203 NOREF(pMetaXfer);
5204 return VINF_SUCCESS;
5205}
5206
5207static int vdIOIntFlushLimited(void *pvUser, PVDIOSTORAGE pStorage,
5208 PVDIOCTX pIoCtx,
5209 PFNVDXFERCOMPLETED pfnComplete,
5210 void *pvCompleteUser)
5211{
5212 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
5213
5214 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
5215 ("Async I/O not implemented for the limited interface"),
5216 VERR_NOT_SUPPORTED);
5217
5218 return pInterfaceIo->pfnFlushSync(NULL, pStorage->pStorage);
5219}
5220
5221/**
5222 * internal: send output to the log (unconditionally).
5223 */
5224int vdLogMessage(void *pvUser, const char *pszFormat, va_list args)
5225{
5226 NOREF(pvUser);
5227 RTLogPrintfV(pszFormat, args);
5228 return VINF_SUCCESS;
5229}
5230
5231DECLINLINE(int) vdMessageWrapper(PVBOXHDD pDisk, const char *pszFormat, ...)
5232{
5233 va_list va;
5234 va_start(va, pszFormat);
5235 int rc = pDisk->pInterfaceError->pfnMessage(pDisk->pInterfaceError->Core.pvUser,
5236 pszFormat, va);
5237 va_end(va);
5238 return rc;
5239}
5240
5241
5242/**
5243 * internal: adjust PCHS geometry
5244 */
5245static void vdFixupPCHSGeometry(PVDGEOMETRY pPCHS, uint64_t cbSize)
5246{
5247 /* Fix broken PCHS geometry. Can happen for two reasons: either the backend
5248 * mixes up PCHS and LCHS, or the application used to create the source
5249 * image has put garbage in it. Additionally, if the PCHS geometry covers
5250 * more than the image size, set it back to the default. */
5251 if ( pPCHS->cHeads > 16
5252 || pPCHS->cSectors > 63
5253 || pPCHS->cCylinders == 0
5254 || (uint64_t)pPCHS->cHeads * pPCHS->cSectors * pPCHS->cCylinders * 512 > cbSize)
5255 {
5256 Assert(!(RT_MIN(cbSize / 512 / 16 / 63, 16383) - (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383)));
5257 pPCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383);
5258 pPCHS->cHeads = 16;
5259 pPCHS->cSectors = 63;
5260 }
5261}
5262
5263/**
5264 * internal: adjust PCHS geometry
5265 */
5266static void vdFixupLCHSGeometry(PVDGEOMETRY pLCHS, uint64_t cbSize)
5267{
5268 /* Fix broken LCHS geometry. Can happen for two reasons: either the backend
5269 * mixes up PCHS and LCHS, or the application used to create the source
5270 * image has put garbage in it. The fix in this case is to clear the LCHS
5271 * geometry to trigger autodetection when it is used next. If the geometry
5272 * already says "please autodetect" (cylinders=0) keep it. */
5273 if ( ( pLCHS->cHeads > 255
5274 || pLCHS->cHeads == 0
5275 || pLCHS->cSectors > 63
5276 || pLCHS->cSectors == 0)
5277 && pLCHS->cCylinders != 0)
5278 {
5279 pLCHS->cCylinders = 0;
5280 pLCHS->cHeads = 0;
5281 pLCHS->cSectors = 0;
5282 }
5283 /* Always recompute the number of cylinders stored in the LCHS
5284 * geometry if it isn't set to "autotedetect" at the moment.
5285 * This is very useful if the destination image size is
5286 * larger or smaller than the source image size. Do not modify
5287 * the number of heads and sectors. Windows guests hate it. */
5288 if ( pLCHS->cCylinders != 0
5289 && pLCHS->cHeads != 0 /* paranoia */
5290 && pLCHS->cSectors != 0 /* paranoia */)
5291 {
5292 Assert(!(RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024) - (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024)));
5293 pLCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024);
5294 }
5295}
5296
5297/**
5298 * Sets the I/O callbacks of the given interface to the fallback methods
5299 *
5300 * @returns nothing.
5301 * @param pIfIo The I/O interface to setup.
5302 */
5303static void vdIfIoFallbackCallbacksSetup(PVDINTERFACEIO pIfIo)
5304{
5305 pIfIo->pfnOpen = vdIOOpenFallback;
5306 pIfIo->pfnClose = vdIOCloseFallback;
5307 pIfIo->pfnDelete = vdIODeleteFallback;
5308 pIfIo->pfnMove = vdIOMoveFallback;
5309 pIfIo->pfnGetFreeSpace = vdIOGetFreeSpaceFallback;
5310 pIfIo->pfnGetModificationTime = vdIOGetModificationTimeFallback;
5311 pIfIo->pfnGetSize = vdIOGetSizeFallback;
5312 pIfIo->pfnSetSize = vdIOSetSizeFallback;
5313 pIfIo->pfnReadSync = vdIOReadSyncFallback;
5314 pIfIo->pfnWriteSync = vdIOWriteSyncFallback;
5315 pIfIo->pfnFlushSync = vdIOFlushSyncFallback;
5316 pIfIo->pfnReadAsync = vdIOReadAsyncFallback;
5317 pIfIo->pfnWriteAsync = vdIOWriteAsyncFallback;
5318 pIfIo->pfnFlushAsync = vdIOFlushAsyncFallback;
5319}
5320
5321/**
5322 * Sets the internal I/O callbacks of the given interface.
5323 *
5324 * @returns nothing.
5325 * @param pIfIoInt The internal I/O interface to setup.
5326 */
5327static void vdIfIoIntCallbacksSetup(PVDINTERFACEIOINT pIfIoInt)
5328{
5329 pIfIoInt->pfnOpen = vdIOIntOpen;
5330 pIfIoInt->pfnClose = vdIOIntClose;
5331 pIfIoInt->pfnDelete = vdIOIntDelete;
5332 pIfIoInt->pfnMove = vdIOIntMove;
5333 pIfIoInt->pfnGetFreeSpace = vdIOIntGetFreeSpace;
5334 pIfIoInt->pfnGetModificationTime = vdIOIntGetModificationTime;
5335 pIfIoInt->pfnGetSize = vdIOIntGetSize;
5336 pIfIoInt->pfnSetSize = vdIOIntSetSize;
5337 pIfIoInt->pfnReadUser = vdIOIntReadUser;
5338 pIfIoInt->pfnWriteUser = vdIOIntWriteUser;
5339 pIfIoInt->pfnReadMeta = vdIOIntReadMeta;
5340 pIfIoInt->pfnWriteMeta = vdIOIntWriteMeta;
5341 pIfIoInt->pfnMetaXferRelease = vdIOIntMetaXferRelease;
5342 pIfIoInt->pfnFlush = vdIOIntFlush;
5343 pIfIoInt->pfnIoCtxCopyFrom = vdIOIntIoCtxCopyFrom;
5344 pIfIoInt->pfnIoCtxCopyTo = vdIOIntIoCtxCopyTo;
5345 pIfIoInt->pfnIoCtxSet = vdIOIntIoCtxSet;
5346 pIfIoInt->pfnIoCtxSegArrayCreate = vdIOIntIoCtxSegArrayCreate;
5347 pIfIoInt->pfnIoCtxCompleted = vdIOIntIoCtxCompleted;
5348 pIfIoInt->pfnIoCtxIsSynchronous = vdIOIntIoCtxIsSynchronous;
5349 pIfIoInt->pfnIoCtxIsZero = vdIOIntIoCtxIsZero;
5350 pIfIoInt->pfnIoCtxGetDataUnitSize = vdIOIntIoCtxGetDataUnitSize;
5351}
5352
5353/**
5354 * Internally used completion handler for synchronous I/O contexts.
5355 */
5356static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq)
5357{
5358 PVBOXHDD pDisk = (PVBOXHDD)pvUser1;
5359 RTSEMEVENT hEvent = (RTSEMEVENT)pvUser2;
5360
5361 RTSemEventSignal(hEvent);
5362}
5363
5364/**
5365 * Initializes HDD backends.
5366 *
5367 * @returns VBox status code.
5368 */
5369VBOXDDU_DECL(int) VDInit(void)
5370{
5371 int rc = vdAddBackends(aStaticBackends, RT_ELEMENTS(aStaticBackends));
5372 if (RT_SUCCESS(rc))
5373 {
5374 rc = vdAddCacheBackends(aStaticCacheBackends, RT_ELEMENTS(aStaticCacheBackends));
5375 if (RT_SUCCESS(rc))
5376 {
5377 RTListInit(&g_ListPluginsLoaded);
5378 rc = vdLoadDynamicBackends();
5379 }
5380 }
5381 LogRel(("VDInit finished\n"));
5382 return rc;
5383}
5384
5385/**
5386 * Destroys loaded HDD backends.
5387 *
5388 * @returns VBox status code.
5389 */
5390VBOXDDU_DECL(int) VDShutdown(void)
5391{
5392 PCVBOXHDDBACKEND *pBackends = g_apBackends;
5393 PCVDCACHEBACKEND *pCacheBackends = g_apCacheBackends;
5394 unsigned cBackends = g_cBackends;
5395
5396 if (!g_apBackends)
5397 return VERR_INTERNAL_ERROR;
5398
5399 if (g_apCacheBackends)
5400 RTMemFree(g_apCacheBackends);
5401 RTMemFree(g_apBackends);
5402
5403 g_cBackends = 0;
5404 g_apBackends = NULL;
5405
5406 /* Clear the supported cache backends. */
5407 g_cCacheBackends = 0;
5408 g_apCacheBackends = NULL;
5409
5410#ifndef VBOX_HDD_NO_DYNAMIC_BACKENDS
5411 PVDPLUGIN pPlugin, pPluginNext;
5412
5413 RTListForEachSafe(&g_ListPluginsLoaded, pPlugin, pPluginNext, VDPLUGIN, NodePlugin)
5414 {
5415 RTLdrClose(pPlugin->hPlugin);
5416 RTStrFree(pPlugin->pszFilename);
5417 RTListNodeRemove(&pPlugin->NodePlugin);
5418 RTMemFree(pPlugin);
5419 }
5420#endif
5421
5422 return VINF_SUCCESS;
5423}
5424
5425/**
5426 * Loads a single plugin given by filename.
5427 *
5428 * @returns VBox status code.
5429 * @param pszFilename The plugin filename to load.
5430 */
5431VBOXDDU_DECL(int) VDPluginLoadFromFilename(const char *pszFilename)
5432{
5433 if (!g_apBackends)
5434 {
5435 int rc = VDInit();
5436 if (RT_FAILURE(rc))
5437 return rc;
5438 }
5439
5440 return vdPluginLoadFromFilename(pszFilename);
5441}
5442
5443/**
5444 * Load all plugins from a given path.
5445 *
5446 * @returns VBox statuse code.
5447 * @param pszPath The path to load plugins from.
5448 */
5449VBOXDDU_DECL(int) VDPluginLoadFromPath(const char *pszPath)
5450{
5451 if (!g_apBackends)
5452 {
5453 int rc = VDInit();
5454 if (RT_FAILURE(rc))
5455 return rc;
5456 }
5457
5458 return vdPluginLoadFromPath(pszPath);
5459}
5460
5461/**
5462 * Lists all HDD backends and their capabilities in a caller-provided buffer.
5463 *
5464 * @returns VBox status code.
5465 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5466 * @param cEntriesAlloc Number of list entries available.
5467 * @param pEntries Pointer to array for the entries.
5468 * @param pcEntriesUsed Number of entries returned.
5469 */
5470VBOXDDU_DECL(int) VDBackendInfo(unsigned cEntriesAlloc, PVDBACKENDINFO pEntries,
5471 unsigned *pcEntriesUsed)
5472{
5473 int rc = VINF_SUCCESS;
5474 PRTDIR pPluginDir = NULL;
5475 unsigned cEntries = 0;
5476
5477 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5478 /* Check arguments. */
5479 AssertMsgReturn(cEntriesAlloc,
5480 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5481 VERR_INVALID_PARAMETER);
5482 AssertMsgReturn(VALID_PTR(pEntries),
5483 ("pEntries=%#p\n", pEntries),
5484 VERR_INVALID_PARAMETER);
5485 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5486 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5487 VERR_INVALID_PARAMETER);
5488 if (!g_apBackends)
5489 VDInit();
5490
5491 if (cEntriesAlloc < g_cBackends)
5492 {
5493 *pcEntriesUsed = g_cBackends;
5494 return VERR_BUFFER_OVERFLOW;
5495 }
5496
5497 for (unsigned i = 0; i < g_cBackends; i++)
5498 {
5499 pEntries[i].pszBackend = g_apBackends[i]->pszBackendName;
5500 pEntries[i].uBackendCaps = g_apBackends[i]->uBackendCaps;
5501 pEntries[i].paFileExtensions = g_apBackends[i]->paFileExtensions;
5502 pEntries[i].paConfigInfo = g_apBackends[i]->paConfigInfo;
5503 pEntries[i].pfnComposeLocation = g_apBackends[i]->pfnComposeLocation;
5504 pEntries[i].pfnComposeName = g_apBackends[i]->pfnComposeName;
5505 }
5506
5507 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cEntries));
5508 *pcEntriesUsed = g_cBackends;
5509 return rc;
5510}
5511
5512/**
5513 * Lists the capabilities of a backend identified by its name.
5514 *
5515 * @returns VBox status code.
5516 * @param pszBackend The backend name.
5517 * @param pEntries Pointer to an entry.
5518 */
5519VBOXDDU_DECL(int) VDBackendInfoOne(const char *pszBackend, PVDBACKENDINFO pEntry)
5520{
5521 LogFlowFunc(("pszBackend=%#p pEntry=%#p\n", pszBackend, pEntry));
5522 /* Check arguments. */
5523 AssertMsgReturn(VALID_PTR(pszBackend),
5524 ("pszBackend=%#p\n", pszBackend),
5525 VERR_INVALID_PARAMETER);
5526 AssertMsgReturn(VALID_PTR(pEntry),
5527 ("pEntry=%#p\n", pEntry),
5528 VERR_INVALID_PARAMETER);
5529 if (!g_apBackends)
5530 VDInit();
5531
5532 /* Go through loaded backends. */
5533 for (unsigned i = 0; i < g_cBackends; i++)
5534 {
5535 if (!RTStrICmp(pszBackend, g_apBackends[i]->pszBackendName))
5536 {
5537 pEntry->pszBackend = g_apBackends[i]->pszBackendName;
5538 pEntry->uBackendCaps = g_apBackends[i]->uBackendCaps;
5539 pEntry->paFileExtensions = g_apBackends[i]->paFileExtensions;
5540 pEntry->paConfigInfo = g_apBackends[i]->paConfigInfo;
5541 return VINF_SUCCESS;
5542 }
5543 }
5544
5545 return VERR_NOT_FOUND;
5546}
5547
5548/**
5549 * Lists all filters and their capabilities in a caller-provided buffer.
5550 *
5551 * @return VBox status code.
5552 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5553 * @param cEntriesAlloc Number of list entries available.
5554 * @param pEntries Pointer to array for the entries.
5555 * @param pcEntriesUsed Number of entries returned.
5556 */
5557VBOXDDU_DECL(int) VDFilterInfo(unsigned cEntriesAlloc, PVDFILTERINFO pEntries,
5558 unsigned *pcEntriesUsed)
5559{
5560 int rc = VINF_SUCCESS;
5561 unsigned cEntries = 0;
5562
5563 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5564 /* Check arguments. */
5565 AssertMsgReturn(cEntriesAlloc,
5566 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5567 VERR_INVALID_PARAMETER);
5568 AssertMsgReturn(VALID_PTR(pEntries),
5569 ("pEntries=%#p\n", pEntries),
5570 VERR_INVALID_PARAMETER);
5571 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5572 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5573 VERR_INVALID_PARAMETER);
5574 if (!g_apBackends)
5575 VDInit();
5576
5577 if (cEntriesAlloc < g_cFilterBackends)
5578 {
5579 *pcEntriesUsed = g_cFilterBackends;
5580 return VERR_BUFFER_OVERFLOW;
5581 }
5582
5583 for (unsigned i = 0; i < g_cFilterBackends; i++)
5584 {
5585 pEntries[i].pszFilter = g_apFilterBackends[i]->pszBackendName;
5586 pEntries[i].paConfigInfo = g_apFilterBackends[i]->paConfigInfo;
5587 }
5588
5589 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cEntries));
5590 *pcEntriesUsed = g_cFilterBackends;
5591 return rc;
5592}
5593
5594/**
5595 * Lists the capabilities of a filter identified by its name.
5596 *
5597 * @return VBox status code.
5598 * @param pszFilter The filter name (case insensitive).
5599 * @param pEntries Pointer to an entry.
5600 */
5601VBOXDDU_DECL(int) VDFilterInfoOne(const char *pszFilter, PVDFILTERINFO pEntry)
5602{
5603 LogFlowFunc(("pszFilter=%#p pEntry=%#p\n", pszFilter, pEntry));
5604 /* Check arguments. */
5605 AssertMsgReturn(VALID_PTR(pszFilter),
5606 ("pszFilter=%#p\n", pszFilter),
5607 VERR_INVALID_PARAMETER);
5608 AssertMsgReturn(VALID_PTR(pEntry),
5609 ("pEntry=%#p\n", pEntry),
5610 VERR_INVALID_PARAMETER);
5611 if (!g_apBackends)
5612 VDInit();
5613
5614 /* Go through loaded backends. */
5615 for (unsigned i = 0; i < g_cFilterBackends; i++)
5616 {
5617 if (!RTStrICmp(pszFilter, g_apFilterBackends[i]->pszBackendName))
5618 {
5619 pEntry->pszFilter = g_apFilterBackends[i]->pszBackendName;
5620 pEntry->paConfigInfo = g_apFilterBackends[i]->paConfigInfo;
5621 return VINF_SUCCESS;
5622 }
5623 }
5624
5625 return VERR_NOT_FOUND;
5626}
5627
5628/**
5629 * Allocates and initializes an empty HDD container.
5630 * No image files are opened.
5631 *
5632 * @returns VBox status code.
5633 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5634 * @param enmType Type of the image container.
5635 * @param ppDisk Where to store the reference to HDD container.
5636 */
5637VBOXDDU_DECL(int) VDCreate(PVDINTERFACE pVDIfsDisk, VDTYPE enmType, PVBOXHDD *ppDisk)
5638{
5639 int rc = VINF_SUCCESS;
5640 PVBOXHDD pDisk = NULL;
5641
5642 LogFlowFunc(("pVDIfsDisk=%#p\n", pVDIfsDisk));
5643 do
5644 {
5645 /* Check arguments. */
5646 AssertMsgBreakStmt(VALID_PTR(ppDisk),
5647 ("ppDisk=%#p\n", ppDisk),
5648 rc = VERR_INVALID_PARAMETER);
5649
5650 pDisk = (PVBOXHDD)RTMemAllocZ(sizeof(VBOXHDD));
5651 if (pDisk)
5652 {
5653 pDisk->u32Signature = VBOXHDDDISK_SIGNATURE;
5654 pDisk->enmType = enmType;
5655 pDisk->cImages = 0;
5656 pDisk->pBase = NULL;
5657 pDisk->pLast = NULL;
5658 pDisk->cbSize = 0;
5659 pDisk->PCHSGeometry.cCylinders = 0;
5660 pDisk->PCHSGeometry.cHeads = 0;
5661 pDisk->PCHSGeometry.cSectors = 0;
5662 pDisk->LCHSGeometry.cCylinders = 0;
5663 pDisk->LCHSGeometry.cHeads = 0;
5664 pDisk->LCHSGeometry.cSectors = 0;
5665 pDisk->pVDIfsDisk = pVDIfsDisk;
5666 pDisk->pInterfaceError = NULL;
5667 pDisk->pInterfaceThreadSync = NULL;
5668 pDisk->pIoCtxLockOwner = NULL;
5669 pDisk->pIoCtxHead = NULL;
5670 pDisk->fLocked = false;
5671 pDisk->hMemCacheIoCtx = NIL_RTMEMCACHE;
5672 pDisk->hMemCacheIoTask = NIL_RTMEMCACHE;
5673 pDisk->pFilterHead = NULL;
5674 pDisk->pFilterTail = NULL;
5675
5676 /* Create the I/O ctx cache */
5677 rc = RTMemCacheCreate(&pDisk->hMemCacheIoCtx, sizeof(VDIOCTX), 0, UINT32_MAX,
5678 NULL, NULL, NULL, 0);
5679 if (RT_FAILURE(rc))
5680 break;
5681
5682 /* Create the I/O task cache */
5683 rc = RTMemCacheCreate(&pDisk->hMemCacheIoTask, sizeof(VDIOTASK), 0, UINT32_MAX,
5684 NULL, NULL, NULL, 0);
5685 if (RT_FAILURE(rc))
5686 break;
5687
5688 pDisk->pInterfaceError = VDIfErrorGet(pVDIfsDisk);
5689 pDisk->pInterfaceThreadSync = VDIfThreadSyncGet(pVDIfsDisk);
5690
5691 *ppDisk = pDisk;
5692 }
5693 else
5694 {
5695 rc = VERR_NO_MEMORY;
5696 break;
5697 }
5698 } while (0);
5699
5700 if ( RT_FAILURE(rc)
5701 && pDisk)
5702 {
5703 if (pDisk->hMemCacheIoCtx != NIL_RTMEMCACHE)
5704 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5705 if (pDisk->hMemCacheIoTask != NIL_RTMEMCACHE)
5706 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5707 }
5708
5709 LogFlowFunc(("returns %Rrc (pDisk=%#p)\n", rc, pDisk));
5710 return rc;
5711}
5712
5713/**
5714 * Destroys HDD container.
5715 * If container has opened image files they will be closed.
5716 *
5717 * @returns VBox status code.
5718 * @param pDisk Pointer to HDD container.
5719 */
5720VBOXDDU_DECL(int) VDDestroy(PVBOXHDD pDisk)
5721{
5722 int rc = VINF_SUCCESS;
5723 LogFlowFunc(("pDisk=%#p\n", pDisk));
5724 do
5725 {
5726 /* sanity check */
5727 AssertPtrBreak(pDisk);
5728 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5729 Assert(!pDisk->fLocked);
5730
5731 rc = VDCloseAll(pDisk);
5732 int rc2 = VDFilterRemoveAll(pDisk);
5733 if (RT_SUCCESS(rc))
5734 rc = rc2;
5735
5736 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5737 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5738 RTMemFree(pDisk);
5739 } while (0);
5740 LogFlowFunc(("returns %Rrc\n", rc));
5741 return rc;
5742}
5743
5744/**
5745 * Try to get the backend name which can use this image.
5746 *
5747 * @returns VBox status code.
5748 * VINF_SUCCESS if a plugin was found.
5749 * ppszFormat contains the string which can be used as backend name.
5750 * VERR_NOT_SUPPORTED if no backend was found.
5751 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5752 * @param pVDIfsImage Pointer to the per-image VD interface list.
5753 * @param pszFilename Name of the image file for which the backend is queried.
5754 * @param ppszFormat Receives pointer of the UTF-8 string which contains the format name.
5755 * The returned pointer must be freed using RTStrFree().
5756 */
5757VBOXDDU_DECL(int) VDGetFormat(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
5758 const char *pszFilename, char **ppszFormat, VDTYPE *penmType)
5759{
5760 int rc = VERR_NOT_SUPPORTED;
5761 VDINTERFACEIOINT VDIfIoInt;
5762 VDINTERFACEIO VDIfIoFallback;
5763 PVDINTERFACEIO pInterfaceIo;
5764
5765 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
5766 /* Check arguments. */
5767 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
5768 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5769 VERR_INVALID_PARAMETER);
5770 AssertMsgReturn(VALID_PTR(ppszFormat),
5771 ("ppszFormat=%#p\n", ppszFormat),
5772 VERR_INVALID_PARAMETER);
5773 AssertMsgReturn(VALID_PTR(penmType),
5774 ("penmType=%#p\n", penmType),
5775 VERR_INVALID_PARAMETER);
5776
5777 if (!g_apBackends)
5778 VDInit();
5779
5780 pInterfaceIo = VDIfIoGet(pVDIfsImage);
5781 if (!pInterfaceIo)
5782 {
5783 /*
5784 * Caller doesn't provide an I/O interface, create our own using the
5785 * native file API.
5786 */
5787 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
5788 pInterfaceIo = &VDIfIoFallback;
5789 }
5790
5791 /* Set up the internal I/O interface. */
5792 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
5793 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
5794 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
5795 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
5796 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
5797 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
5798 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
5799 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
5800 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
5801 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
5802 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
5803 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
5804 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
5805 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
5806 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5807 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
5808 AssertRC(rc);
5809
5810 /* Find the backend supporting this file format. */
5811 for (unsigned i = 0; i < g_cBackends; i++)
5812 {
5813 if (g_apBackends[i]->pfnCheckIfValid)
5814 {
5815 rc = g_apBackends[i]->pfnCheckIfValid(pszFilename, pVDIfsDisk,
5816 pVDIfsImage, penmType);
5817 if ( RT_SUCCESS(rc)
5818 /* The correct backend has been found, but there is a small
5819 * incompatibility so that the file cannot be used. Stop here
5820 * and signal success - the actual open will of course fail,
5821 * but that will create a really sensible error message. */
5822 || ( rc != VERR_VD_GEN_INVALID_HEADER
5823 && rc != VERR_VD_VDI_INVALID_HEADER
5824 && rc != VERR_VD_VMDK_INVALID_HEADER
5825 && rc != VERR_VD_ISCSI_INVALID_HEADER
5826 && rc != VERR_VD_VHD_INVALID_HEADER
5827 && rc != VERR_VD_RAW_INVALID_HEADER
5828 && rc != VERR_VD_PARALLELS_INVALID_HEADER
5829 && rc != VERR_VD_DMG_INVALID_HEADER))
5830 {
5831 /* Copy the name into the new string. */
5832 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5833 if (!pszFormat)
5834 {
5835 rc = VERR_NO_MEMORY;
5836 break;
5837 }
5838 *ppszFormat = pszFormat;
5839 /* Do not consider the typical file access errors as success,
5840 * which allows the caller to deal with such issues. */
5841 if ( rc != VERR_ACCESS_DENIED
5842 && rc != VERR_PATH_NOT_FOUND
5843 && rc != VERR_FILE_NOT_FOUND)
5844 rc = VINF_SUCCESS;
5845 break;
5846 }
5847 rc = VERR_NOT_SUPPORTED;
5848 }
5849 }
5850
5851 /* Try the cache backends. */
5852 if (rc == VERR_NOT_SUPPORTED)
5853 {
5854 for (unsigned i = 0; i < g_cCacheBackends; i++)
5855 {
5856 if (g_apCacheBackends[i]->pfnProbe)
5857 {
5858 rc = g_apCacheBackends[i]->pfnProbe(pszFilename, pVDIfsDisk,
5859 pVDIfsImage);
5860 if ( RT_SUCCESS(rc)
5861 || (rc != VERR_VD_GEN_INVALID_HEADER))
5862 {
5863 /* Copy the name into the new string. */
5864 char *pszFormat = RTStrDup(g_apBackends[i]->pszBackendName);
5865 if (!pszFormat)
5866 {
5867 rc = VERR_NO_MEMORY;
5868 break;
5869 }
5870 *ppszFormat = pszFormat;
5871 rc = VINF_SUCCESS;
5872 break;
5873 }
5874 rc = VERR_NOT_SUPPORTED;
5875 }
5876 }
5877 }
5878
5879 LogFlowFunc(("returns %Rrc *ppszFormat=\"%s\"\n", rc, *ppszFormat));
5880 return rc;
5881}
5882
5883/**
5884 * Opens an image file.
5885 *
5886 * The first opened image file in HDD container must have a base image type,
5887 * others (next opened images) must be a differencing or undo images.
5888 * Linkage is checked for differencing image to be in consistence with the previously opened image.
5889 * When another differencing image is opened and the last image was opened in read/write access
5890 * mode, then the last image is reopened in read-only with deny write sharing mode. This allows
5891 * other processes to use images in read-only mode too.
5892 *
5893 * Note that the image is opened in read-only mode if a read/write open is not possible.
5894 * Use VDIsReadOnly to check open mode.
5895 *
5896 * @returns VBox status code.
5897 * @param pDisk Pointer to HDD container.
5898 * @param pszBackend Name of the image file backend to use.
5899 * @param pszFilename Name of the image file to open.
5900 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5901 * @param pVDIfsImage Pointer to the per-image VD interface list.
5902 */
5903VBOXDDU_DECL(int) VDOpen(PVBOXHDD pDisk, const char *pszBackend,
5904 const char *pszFilename, unsigned uOpenFlags,
5905 PVDINTERFACE pVDIfsImage)
5906{
5907 int rc = VINF_SUCCESS;
5908 int rc2;
5909 bool fLockWrite = false;
5910 PVDIMAGE pImage = NULL;
5911
5912 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsImage=%#p\n",
5913 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsImage));
5914
5915 do
5916 {
5917 /* sanity check */
5918 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5919 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5920
5921 /* Check arguments. */
5922 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5923 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5924 rc = VERR_INVALID_PARAMETER);
5925 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5926 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5927 rc = VERR_INVALID_PARAMETER);
5928 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5929 ("uOpenFlags=%#x\n", uOpenFlags),
5930 rc = VERR_INVALID_PARAMETER);
5931 AssertMsgBreakStmt( !(uOpenFlags & VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS)
5932 || (uOpenFlags & VD_OPEN_FLAGS_READONLY),
5933 ("uOpenFlags=%#x\n", uOpenFlags),
5934 rc = VERR_INVALID_PARAMETER);
5935
5936 /*
5937 * Destroy the current discard state first which might still have pending blocks
5938 * for the currently opened image which will be switched to readonly mode.
5939 */
5940 /* Lock disk for writing, as we modify pDisk information below. */
5941 rc2 = vdThreadStartWrite(pDisk);
5942 AssertRC(rc2);
5943 fLockWrite = true;
5944 rc = vdDiscardStateDestroy(pDisk);
5945 if (RT_FAILURE(rc))
5946 break;
5947 rc2 = vdThreadFinishWrite(pDisk);
5948 AssertRC(rc2);
5949 fLockWrite = false;
5950
5951 /* Set up image descriptor. */
5952 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
5953 if (!pImage)
5954 {
5955 rc = VERR_NO_MEMORY;
5956 break;
5957 }
5958 pImage->pszFilename = RTStrDup(pszFilename);
5959 if (!pImage->pszFilename)
5960 {
5961 rc = VERR_NO_MEMORY;
5962 break;
5963 }
5964
5965 pImage->VDIo.pDisk = pDisk;
5966 pImage->pVDIfsImage = pVDIfsImage;
5967
5968 rc = vdFindBackend(pszBackend, &pImage->Backend);
5969 if (RT_FAILURE(rc))
5970 break;
5971 if (!pImage->Backend)
5972 {
5973 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5974 N_("VD: unknown backend name '%s'"), pszBackend);
5975 break;
5976 }
5977
5978 /*
5979 * Fail if the backend can't do async I/O but the
5980 * flag is set.
5981 */
5982 if ( !(pImage->Backend->uBackendCaps & VD_CAP_ASYNC)
5983 && (uOpenFlags & VD_OPEN_FLAGS_ASYNC_IO))
5984 {
5985 rc = vdError(pDisk, VERR_NOT_SUPPORTED, RT_SRC_POS,
5986 N_("VD: Backend '%s' does not support async I/O"), pszBackend);
5987 break;
5988 }
5989
5990 /*
5991 * Fail if the backend doesn't support the discard operation but the
5992 * flag is set.
5993 */
5994 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DISCARD)
5995 && (uOpenFlags & VD_OPEN_FLAGS_DISCARD))
5996 {
5997 rc = vdError(pDisk, VERR_VD_DISCARD_NOT_SUPPORTED, RT_SRC_POS,
5998 N_("VD: Backend '%s' does not support discard"), pszBackend);
5999 break;
6000 }
6001
6002 /* Set up the I/O interface. */
6003 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6004 if (!pImage->VDIo.pInterfaceIo)
6005 {
6006 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6007 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6008 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6009 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6010 }
6011
6012 /* Set up the internal I/O interface. */
6013 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6014 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6015 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6016 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6017 AssertRC(rc);
6018
6019 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
6020 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6021 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
6022 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
6023 pDisk->pVDIfsDisk,
6024 pImage->pVDIfsImage,
6025 pDisk->enmType,
6026 &pImage->pBackendData);
6027 /*
6028 * If the image is corrupted and there is a repair method try to repair it
6029 * first if it was openend in read-write mode and open again afterwards.
6030 */
6031 if ( RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED)
6032 && !(uOpenFlags & VD_OPEN_FLAGS_READONLY)
6033 && pImage->Backend->pfnRepair)
6034 {
6035 rc = pImage->Backend->pfnRepair(pszFilename, pDisk->pVDIfsDisk, pImage->pVDIfsImage, 0 /* fFlags */);
6036 if (RT_SUCCESS(rc))
6037 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
6038 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
6039 pDisk->pVDIfsDisk,
6040 pImage->pVDIfsImage,
6041 pDisk->enmType,
6042 &pImage->pBackendData);
6043 else
6044 {
6045 rc = vdError(pDisk, rc, RT_SRC_POS,
6046 N_("VD: error %Rrc repairing corrupted image file '%s'"), rc, pszFilename);
6047 break;
6048 }
6049 }
6050 else if (RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED))
6051 {
6052 rc = vdError(pDisk, rc, RT_SRC_POS,
6053 N_("VD: Image file '%s' is corrupted and can't be opened"), pszFilename);
6054 break;
6055 }
6056
6057 /* If the open in read-write mode failed, retry in read-only mode. */
6058 if (RT_FAILURE(rc))
6059 {
6060 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
6061 && ( rc == VERR_ACCESS_DENIED
6062 || rc == VERR_PERMISSION_DENIED
6063 || rc == VERR_WRITE_PROTECT
6064 || rc == VERR_SHARING_VIOLATION
6065 || rc == VERR_FILE_LOCK_FAILED))
6066 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
6067 (uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS))
6068 | VD_OPEN_FLAGS_READONLY,
6069 pDisk->pVDIfsDisk,
6070 pImage->pVDIfsImage,
6071 pDisk->enmType,
6072 &pImage->pBackendData);
6073 if (RT_FAILURE(rc))
6074 {
6075 rc = vdError(pDisk, rc, RT_SRC_POS,
6076 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
6077 break;
6078 }
6079 }
6080
6081 /* Lock disk for writing, as we modify pDisk information below. */
6082 rc2 = vdThreadStartWrite(pDisk);
6083 AssertRC(rc2);
6084 fLockWrite = true;
6085
6086 pImage->VDIo.pBackendData = pImage->pBackendData;
6087
6088 /* Check image type. As the image itself has only partial knowledge
6089 * whether it's a base image or not, this info is derived here. The
6090 * base image can be fixed or normal, all others must be normal or
6091 * diff images. Some image formats don't distinguish between normal
6092 * and diff images, so this must be corrected here. */
6093 unsigned uImageFlags;
6094 uImageFlags = pImage->Backend->pfnGetImageFlags(pImage->pBackendData);
6095 if (RT_FAILURE(rc))
6096 uImageFlags = VD_IMAGE_FLAGS_NONE;
6097 if ( RT_SUCCESS(rc)
6098 && !(uOpenFlags & VD_OPEN_FLAGS_INFO))
6099 {
6100 if ( pDisk->cImages == 0
6101 && (uImageFlags & VD_IMAGE_FLAGS_DIFF))
6102 {
6103 rc = VERR_VD_INVALID_TYPE;
6104 break;
6105 }
6106 else if (pDisk->cImages != 0)
6107 {
6108 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6109 {
6110 rc = VERR_VD_INVALID_TYPE;
6111 break;
6112 }
6113 else
6114 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6115 }
6116 }
6117
6118 /* Ensure we always get correct diff information, even if the backend
6119 * doesn't actually have a stored flag for this. It must not return
6120 * bogus information for the parent UUID if it is not a diff image. */
6121 RTUUID parentUuid;
6122 RTUuidClear(&parentUuid);
6123 rc2 = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, &parentUuid);
6124 if (RT_SUCCESS(rc2) && !RTUuidIsNull(&parentUuid))
6125 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6126
6127 pImage->uImageFlags = uImageFlags;
6128
6129 /* Force sane optimization settings. It's not worth avoiding writes
6130 * to fixed size images. The overhead would have almost no payback. */
6131 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6132 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
6133
6134 /** @todo optionally check UUIDs */
6135
6136 /* Cache disk information. */
6137 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
6138
6139 /* Cache PCHS geometry. */
6140 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
6141 &pDisk->PCHSGeometry);
6142 if (RT_FAILURE(rc2))
6143 {
6144 pDisk->PCHSGeometry.cCylinders = 0;
6145 pDisk->PCHSGeometry.cHeads = 0;
6146 pDisk->PCHSGeometry.cSectors = 0;
6147 }
6148 else
6149 {
6150 /* Make sure the PCHS geometry is properly clipped. */
6151 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
6152 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
6153 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
6154 }
6155
6156 /* Cache LCHS geometry. */
6157 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
6158 &pDisk->LCHSGeometry);
6159 if (RT_FAILURE(rc2))
6160 {
6161 pDisk->LCHSGeometry.cCylinders = 0;
6162 pDisk->LCHSGeometry.cHeads = 0;
6163 pDisk->LCHSGeometry.cSectors = 0;
6164 }
6165 else
6166 {
6167 /* Make sure the LCHS geometry is properly clipped. */
6168 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
6169 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
6170 }
6171
6172 if (pDisk->cImages != 0)
6173 {
6174 /* Switch previous image to read-only mode. */
6175 unsigned uOpenFlagsPrevImg;
6176 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
6177 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
6178 {
6179 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
6180 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
6181 }
6182 }
6183
6184 if (RT_SUCCESS(rc))
6185 {
6186 /* Image successfully opened, make it the last image. */
6187 vdAddImageToList(pDisk, pImage);
6188 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6189 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6190 }
6191 else
6192 {
6193 /* Error detected, but image opened. Close image. */
6194 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
6195 AssertRC(rc2);
6196 pImage->pBackendData = NULL;
6197 }
6198 } while (0);
6199
6200 if (RT_UNLIKELY(fLockWrite))
6201 {
6202 rc2 = vdThreadFinishWrite(pDisk);
6203 AssertRC(rc2);
6204 }
6205
6206 if (RT_FAILURE(rc))
6207 {
6208 if (pImage)
6209 {
6210 if (pImage->pszFilename)
6211 RTStrFree(pImage->pszFilename);
6212 RTMemFree(pImage);
6213 }
6214 }
6215
6216 LogFlowFunc(("returns %Rrc\n", rc));
6217 return rc;
6218}
6219
6220/**
6221 * Opens a cache image.
6222 *
6223 * @return VBox status code.
6224 * @param pDisk Pointer to the HDD container which should use the cache image.
6225 * @param pszBackend Name of the cache file backend to use (case insensitive).
6226 * @param pszFilename Name of the cache image to open.
6227 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6228 * @param pVDIfsCache Pointer to the per-cache VD interface list.
6229 */
6230VBOXDDU_DECL(int) VDCacheOpen(PVBOXHDD pDisk, const char *pszBackend,
6231 const char *pszFilename, unsigned uOpenFlags,
6232 PVDINTERFACE pVDIfsCache)
6233{
6234 int rc = VINF_SUCCESS;
6235 int rc2;
6236 bool fLockWrite = false;
6237 PVDCACHE pCache = NULL;
6238
6239 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsCache=%#p\n",
6240 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsCache));
6241
6242 do
6243 {
6244 /* sanity check */
6245 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6246 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6247
6248 /* Check arguments. */
6249 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6250 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6251 rc = VERR_INVALID_PARAMETER);
6252 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6253 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6254 rc = VERR_INVALID_PARAMETER);
6255 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6256 ("uOpenFlags=%#x\n", uOpenFlags),
6257 rc = VERR_INVALID_PARAMETER);
6258
6259 /* Set up image descriptor. */
6260 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
6261 if (!pCache)
6262 {
6263 rc = VERR_NO_MEMORY;
6264 break;
6265 }
6266 pCache->pszFilename = RTStrDup(pszFilename);
6267 if (!pCache->pszFilename)
6268 {
6269 rc = VERR_NO_MEMORY;
6270 break;
6271 }
6272
6273 pCache->VDIo.pDisk = pDisk;
6274 pCache->pVDIfsCache = pVDIfsCache;
6275
6276 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
6277 if (RT_FAILURE(rc))
6278 break;
6279 if (!pCache->Backend)
6280 {
6281 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6282 N_("VD: unknown backend name '%s'"), pszBackend);
6283 break;
6284 }
6285
6286 /* Set up the I/O interface. */
6287 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
6288 if (!pCache->VDIo.pInterfaceIo)
6289 {
6290 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
6291 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6292 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
6293 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
6294 }
6295
6296 /* Set up the internal I/O interface. */
6297 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
6298 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
6299 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6300 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
6301 AssertRC(rc);
6302
6303 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6304 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
6305 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6306 pDisk->pVDIfsDisk,
6307 pCache->pVDIfsCache,
6308 &pCache->pBackendData);
6309 /* If the open in read-write mode failed, retry in read-only mode. */
6310 if (RT_FAILURE(rc))
6311 {
6312 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
6313 && ( rc == VERR_ACCESS_DENIED
6314 || rc == VERR_PERMISSION_DENIED
6315 || rc == VERR_WRITE_PROTECT
6316 || rc == VERR_SHARING_VIOLATION
6317 || rc == VERR_FILE_LOCK_FAILED))
6318 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
6319 (uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME)
6320 | VD_OPEN_FLAGS_READONLY,
6321 pDisk->pVDIfsDisk,
6322 pCache->pVDIfsCache,
6323 &pCache->pBackendData);
6324 if (RT_FAILURE(rc))
6325 {
6326 rc = vdError(pDisk, rc, RT_SRC_POS,
6327 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
6328 break;
6329 }
6330 }
6331
6332 /* Lock disk for writing, as we modify pDisk information below. */
6333 rc2 = vdThreadStartWrite(pDisk);
6334 AssertRC(rc2);
6335 fLockWrite = true;
6336
6337 /*
6338 * Check that the modification UUID of the cache and last image
6339 * match. If not the image was modified in-between without the cache.
6340 * The cache might contain stale data.
6341 */
6342 RTUUID UuidImage, UuidCache;
6343
6344 rc = pCache->Backend->pfnGetModificationUuid(pCache->pBackendData,
6345 &UuidCache);
6346 if (RT_SUCCESS(rc))
6347 {
6348 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6349 &UuidImage);
6350 if (RT_SUCCESS(rc))
6351 {
6352 if (RTUuidCompare(&UuidImage, &UuidCache))
6353 rc = VERR_VD_CACHE_NOT_UP_TO_DATE;
6354 }
6355 }
6356
6357 /*
6358 * We assume that the user knows what he is doing if one of the images
6359 * doesn't support the modification uuid.
6360 */
6361 if (rc == VERR_NOT_SUPPORTED)
6362 rc = VINF_SUCCESS;
6363
6364 if (RT_SUCCESS(rc))
6365 {
6366 /* Cache successfully opened, make it the current one. */
6367 if (!pDisk->pCache)
6368 pDisk->pCache = pCache;
6369 else
6370 rc = VERR_VD_CACHE_ALREADY_EXISTS;
6371 }
6372
6373 if (RT_FAILURE(rc))
6374 {
6375 /* Error detected, but image opened. Close image. */
6376 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
6377 AssertRC(rc2);
6378 pCache->pBackendData = NULL;
6379 }
6380 } while (0);
6381
6382 if (RT_UNLIKELY(fLockWrite))
6383 {
6384 rc2 = vdThreadFinishWrite(pDisk);
6385 AssertRC(rc2);
6386 }
6387
6388 if (RT_FAILURE(rc))
6389 {
6390 if (pCache)
6391 {
6392 if (pCache->pszFilename)
6393 RTStrFree(pCache->pszFilename);
6394 RTMemFree(pCache);
6395 }
6396 }
6397
6398 LogFlowFunc(("returns %Rrc\n", rc));
6399 return rc;
6400}
6401
6402/**
6403 * Adds a filter to the disk.
6404 *
6405 * @returns VBox status code.
6406 * @param pDisk Pointer to the HDD container which should use the filter.
6407 * @param pszFilter Name of the filter backend to use (case insensitive).
6408 * @param pVDIfsFilter Pointer to the per-filter VD interface list.
6409 */
6410VBOXDDU_DECL(int) VDFilterAdd(PVBOXHDD pDisk, const char *pszFilter,
6411 PVDINTERFACE pVDIfsFilter)
6412{
6413 int rc = VINF_SUCCESS;
6414 int rc2;
6415 bool fLockWrite = false;
6416 PVDFILTER pFilter = NULL;
6417
6418 LogFlowFunc(("pDisk=%#p pszFilter=\"%s\" pVDIfsFilter=%#p\n",
6419 pDisk, pszFilter, pVDIfsFilter));
6420
6421 do
6422 {
6423 /* sanity check */
6424 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6425 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6426
6427 /* Check arguments. */
6428 AssertMsgBreakStmt(VALID_PTR(pszFilter) && *pszFilter,
6429 ("pszFilter=%#p \"%s\"\n", pszFilter, pszFilter),
6430 rc = VERR_INVALID_PARAMETER);
6431
6432 /* Set up image descriptor. */
6433 pFilter = (PVDFILTER)RTMemAllocZ(sizeof(VDFILTER));
6434 if (!pFilter)
6435 {
6436 rc = VERR_NO_MEMORY;
6437 break;
6438 }
6439
6440 rc = vdFindFilterBackend(pszFilter, &pFilter->pBackend);
6441 if (RT_FAILURE(rc))
6442 break;
6443 if (!pFilter->pBackend)
6444 {
6445 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6446 N_("VD: unknown filter backend name '%s'"), pszFilter);
6447 break;
6448 }
6449
6450 pFilter->VDIo.pDisk = pDisk;
6451 pFilter->pVDIfsFilter = pVDIfsFilter;
6452
6453 /* Set up the internal I/O interface. */
6454 AssertBreakStmt(!VDIfIoIntGet(pVDIfsFilter), rc = VERR_INVALID_PARAMETER);
6455 vdIfIoIntCallbacksSetup(&pFilter->VDIo.VDIfIoInt);
6456 rc = VDInterfaceAdd(&pFilter->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6457 &pFilter->VDIo, sizeof(VDINTERFACEIOINT), &pFilter->pVDIfsFilter);
6458 AssertRC(rc);
6459
6460 rc = pFilter->pBackend->pfnCreate(pDisk->pVDIfsDisk, pFilter->pVDIfsFilter,
6461 &pFilter->pvBackendData);
6462
6463 /* If the open in read-write mode failed, retry in read-only mode. */
6464 if (RT_FAILURE(rc))
6465 {
6466 rc = vdError(pDisk, rc, RT_SRC_POS,
6467 N_("VD: error %Rrc creating filter '%s'"), rc, pszFilter);
6468 break;
6469 }
6470
6471 /* Lock disk for writing, as we modify pDisk information below. */
6472 rc2 = vdThreadStartWrite(pDisk);
6473 AssertRC(rc2);
6474 fLockWrite = true;
6475
6476 /* Add filter to chain. */
6477 vdAddFilterToList(pDisk, pFilter);
6478 } while (0);
6479
6480 if (RT_UNLIKELY(fLockWrite))
6481 {
6482 rc2 = vdThreadFinishWrite(pDisk);
6483 AssertRC(rc2);
6484 }
6485
6486 if (RT_FAILURE(rc))
6487 {
6488 if (pFilter)
6489 RTMemFree(pFilter);
6490 }
6491
6492 LogFlowFunc(("returns %Rrc\n", rc));
6493 return rc;
6494}
6495
6496/**
6497 * Creates and opens a new base image file.
6498 *
6499 * @returns VBox status code.
6500 * @param pDisk Pointer to HDD container.
6501 * @param pszBackend Name of the image file backend to use.
6502 * @param pszFilename Name of the image file to create.
6503 * @param cbSize Image size in bytes.
6504 * @param uImageFlags Flags specifying special image features.
6505 * @param pszComment Pointer to image comment. NULL is ok.
6506 * @param pPCHSGeometry Pointer to physical disk geometry <= (16383,16,63). Not NULL.
6507 * @param pLCHSGeometry Pointer to logical disk geometry <= (x,255,63). Not NULL.
6508 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6509 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6510 * @param pVDIfsImage Pointer to the per-image VD interface list.
6511 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6512 */
6513VBOXDDU_DECL(int) VDCreateBase(PVBOXHDD pDisk, const char *pszBackend,
6514 const char *pszFilename, uint64_t cbSize,
6515 unsigned uImageFlags, const char *pszComment,
6516 PCVDGEOMETRY pPCHSGeometry,
6517 PCVDGEOMETRY pLCHSGeometry,
6518 PCRTUUID pUuid, unsigned uOpenFlags,
6519 PVDINTERFACE pVDIfsImage,
6520 PVDINTERFACE pVDIfsOperation)
6521{
6522 int rc = VINF_SUCCESS;
6523 int rc2;
6524 bool fLockWrite = false, fLockRead = false;
6525 PVDIMAGE pImage = NULL;
6526 RTUUID uuid;
6527
6528 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" PCHS=%u/%u/%u LCHS=%u/%u/%u Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6529 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment,
6530 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6531 pPCHSGeometry->cSectors, pLCHSGeometry->cCylinders,
6532 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors, pUuid,
6533 uOpenFlags, pVDIfsImage, pVDIfsOperation));
6534
6535 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6536
6537 do
6538 {
6539 /* sanity check */
6540 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6541 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6542
6543 /* Check arguments. */
6544 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6545 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6546 rc = VERR_INVALID_PARAMETER);
6547 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6548 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6549 rc = VERR_INVALID_PARAMETER);
6550 AssertMsgBreakStmt(cbSize,
6551 ("cbSize=%llu\n", cbSize),
6552 rc = VERR_INVALID_PARAMETER);
6553 AssertMsgBreakStmt( ((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0)
6554 || ((uImageFlags & (VD_IMAGE_FLAGS_FIXED | VD_IMAGE_FLAGS_DIFF)) != VD_IMAGE_FLAGS_FIXED),
6555 ("uImageFlags=%#x\n", uImageFlags),
6556 rc = VERR_INVALID_PARAMETER);
6557 /* The PCHS geometry fields may be 0 to leave it for later. */
6558 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
6559 && pPCHSGeometry->cHeads <= 16
6560 && pPCHSGeometry->cSectors <= 63,
6561 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
6562 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6563 pPCHSGeometry->cSectors),
6564 rc = VERR_INVALID_PARAMETER);
6565 /* The LCHS geometry fields may be 0 to leave it to later autodetection. */
6566 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
6567 && pLCHSGeometry->cHeads <= 255
6568 && pLCHSGeometry->cSectors <= 63,
6569 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
6570 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
6571 pLCHSGeometry->cSectors),
6572 rc = VERR_INVALID_PARAMETER);
6573 /* The UUID may be NULL. */
6574 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6575 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6576 rc = VERR_INVALID_PARAMETER);
6577 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6578 ("uOpenFlags=%#x\n", uOpenFlags),
6579 rc = VERR_INVALID_PARAMETER);
6580
6581 /* Check state. Needs a temporary read lock. Holding the write lock
6582 * all the time would be blocking other activities for too long. */
6583 rc2 = vdThreadStartRead(pDisk);
6584 AssertRC(rc2);
6585 fLockRead = true;
6586 AssertMsgBreakStmt(pDisk->cImages == 0,
6587 ("Create base image cannot be done with other images open\n"),
6588 rc = VERR_VD_INVALID_STATE);
6589 rc2 = vdThreadFinishRead(pDisk);
6590 AssertRC(rc2);
6591 fLockRead = false;
6592
6593 /* Set up image descriptor. */
6594 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6595 if (!pImage)
6596 {
6597 rc = VERR_NO_MEMORY;
6598 break;
6599 }
6600 pImage->pszFilename = RTStrDup(pszFilename);
6601 if (!pImage->pszFilename)
6602 {
6603 rc = VERR_NO_MEMORY;
6604 break;
6605 }
6606 pImage->VDIo.pDisk = pDisk;
6607 pImage->pVDIfsImage = pVDIfsImage;
6608
6609 /* Set up the I/O interface. */
6610 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6611 if (!pImage->VDIo.pInterfaceIo)
6612 {
6613 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6614 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6615 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6616 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6617 }
6618
6619 /* Set up the internal I/O interface. */
6620 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6621 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6622 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6623 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6624 AssertRC(rc);
6625
6626 rc = vdFindBackend(pszBackend, &pImage->Backend);
6627 if (RT_FAILURE(rc))
6628 break;
6629 if (!pImage->Backend)
6630 {
6631 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6632 N_("VD: unknown backend name '%s'"), pszBackend);
6633 break;
6634 }
6635 if (!(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6636 | VD_CAP_CREATE_DYNAMIC)))
6637 {
6638 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6639 N_("VD: backend '%s' cannot create base images"), pszBackend);
6640 break;
6641 }
6642
6643 /* Create UUID if the caller didn't specify one. */
6644 if (!pUuid)
6645 {
6646 rc = RTUuidCreate(&uuid);
6647 if (RT_FAILURE(rc))
6648 {
6649 rc = vdError(pDisk, rc, RT_SRC_POS,
6650 N_("VD: cannot generate UUID for image '%s'"),
6651 pszFilename);
6652 break;
6653 }
6654 pUuid = &uuid;
6655 }
6656
6657 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6658 uImageFlags &= ~VD_IMAGE_FLAGS_DIFF;
6659 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6660 rc = pImage->Backend->pfnCreate(pImage->pszFilename, cbSize,
6661 uImageFlags, pszComment, pPCHSGeometry,
6662 pLCHSGeometry, pUuid,
6663 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6664 0, 99,
6665 pDisk->pVDIfsDisk,
6666 pImage->pVDIfsImage,
6667 pVDIfsOperation,
6668 &pImage->pBackendData);
6669
6670 if (RT_SUCCESS(rc))
6671 {
6672 pImage->VDIo.pBackendData = pImage->pBackendData;
6673 pImage->uImageFlags = uImageFlags;
6674
6675 /* Force sane optimization settings. It's not worth avoiding writes
6676 * to fixed size images. The overhead would have almost no payback. */
6677 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6678 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
6679
6680 /* Lock disk for writing, as we modify pDisk information below. */
6681 rc2 = vdThreadStartWrite(pDisk);
6682 AssertRC(rc2);
6683 fLockWrite = true;
6684
6685 /** @todo optionally check UUIDs */
6686
6687 /* Re-check state, as the lock wasn't held and another image
6688 * creation call could have been done by another thread. */
6689 AssertMsgStmt(pDisk->cImages == 0,
6690 ("Create base image cannot be done with other images open\n"),
6691 rc = VERR_VD_INVALID_STATE);
6692 }
6693
6694 if (RT_SUCCESS(rc))
6695 {
6696 /* Cache disk information. */
6697 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
6698
6699 /* Cache PCHS geometry. */
6700 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
6701 &pDisk->PCHSGeometry);
6702 if (RT_FAILURE(rc2))
6703 {
6704 pDisk->PCHSGeometry.cCylinders = 0;
6705 pDisk->PCHSGeometry.cHeads = 0;
6706 pDisk->PCHSGeometry.cSectors = 0;
6707 }
6708 else
6709 {
6710 /* Make sure the CHS geometry is properly clipped. */
6711 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
6712 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
6713 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
6714 }
6715
6716 /* Cache LCHS geometry. */
6717 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
6718 &pDisk->LCHSGeometry);
6719 if (RT_FAILURE(rc2))
6720 {
6721 pDisk->LCHSGeometry.cCylinders = 0;
6722 pDisk->LCHSGeometry.cHeads = 0;
6723 pDisk->LCHSGeometry.cSectors = 0;
6724 }
6725 else
6726 {
6727 /* Make sure the CHS geometry is properly clipped. */
6728 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
6729 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
6730 }
6731
6732 /* Image successfully opened, make it the last image. */
6733 vdAddImageToList(pDisk, pImage);
6734 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6735 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6736 }
6737 else
6738 {
6739 /* Error detected, image may or may not be opened. Close and delete
6740 * image if it was opened. */
6741 if (pImage->pBackendData)
6742 {
6743 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6744 AssertRC(rc2);
6745 pImage->pBackendData = NULL;
6746 }
6747 }
6748 } while (0);
6749
6750 if (RT_UNLIKELY(fLockWrite))
6751 {
6752 rc2 = vdThreadFinishWrite(pDisk);
6753 AssertRC(rc2);
6754 }
6755 else if (RT_UNLIKELY(fLockRead))
6756 {
6757 rc2 = vdThreadFinishRead(pDisk);
6758 AssertRC(rc2);
6759 }
6760
6761 if (RT_FAILURE(rc))
6762 {
6763 if (pImage)
6764 {
6765 if (pImage->pszFilename)
6766 RTStrFree(pImage->pszFilename);
6767 RTMemFree(pImage);
6768 }
6769 }
6770
6771 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6772 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6773
6774 LogFlowFunc(("returns %Rrc\n", rc));
6775 return rc;
6776}
6777
6778/**
6779 * Creates and opens a new differencing image file in HDD container.
6780 * See comments for VDOpen function about differencing images.
6781 *
6782 * @returns VBox status code.
6783 * @param pDisk Pointer to HDD container.
6784 * @param pszBackend Name of the image file backend to use.
6785 * @param pszFilename Name of the differencing image file to create.
6786 * @param uImageFlags Flags specifying special image features.
6787 * @param pszComment Pointer to image comment. NULL is ok.
6788 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6789 * @param pParentUuid New parent UUID of the image. If NULL, the UUID is queried automatically.
6790 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6791 * @param pVDIfsImage Pointer to the per-image VD interface list.
6792 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6793 */
6794VBOXDDU_DECL(int) VDCreateDiff(PVBOXHDD pDisk, const char *pszBackend,
6795 const char *pszFilename, unsigned uImageFlags,
6796 const char *pszComment, PCRTUUID pUuid,
6797 PCRTUUID pParentUuid, unsigned uOpenFlags,
6798 PVDINTERFACE pVDIfsImage,
6799 PVDINTERFACE pVDIfsOperation)
6800{
6801 int rc = VINF_SUCCESS;
6802 int rc2;
6803 bool fLockWrite = false, fLockRead = false;
6804 PVDIMAGE pImage = NULL;
6805 RTUUID uuid;
6806
6807 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6808 pDisk, pszBackend, pszFilename, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsImage, pVDIfsOperation));
6809
6810 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6811
6812 do
6813 {
6814 /* sanity check */
6815 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6816 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6817
6818 /* Check arguments. */
6819 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6820 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6821 rc = VERR_INVALID_PARAMETER);
6822 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6823 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6824 rc = VERR_INVALID_PARAMETER);
6825 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6826 ("uImageFlags=%#x\n", uImageFlags),
6827 rc = VERR_INVALID_PARAMETER);
6828 /* The UUID may be NULL. */
6829 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6830 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6831 rc = VERR_INVALID_PARAMETER);
6832 /* The parent UUID may be NULL. */
6833 AssertMsgBreakStmt(pParentUuid == NULL || VALID_PTR(pParentUuid),
6834 ("pParentUuid=%#p ParentUUID=%RTuuid\n", pParentUuid, pParentUuid),
6835 rc = VERR_INVALID_PARAMETER);
6836 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6837 ("uOpenFlags=%#x\n", uOpenFlags),
6838 rc = VERR_INVALID_PARAMETER);
6839
6840 /* Check state. Needs a temporary read lock. Holding the write lock
6841 * all the time would be blocking other activities for too long. */
6842 rc2 = vdThreadStartRead(pDisk);
6843 AssertRC(rc2);
6844 fLockRead = true;
6845 AssertMsgBreakStmt(pDisk->cImages != 0,
6846 ("Create diff image cannot be done without other images open\n"),
6847 rc = VERR_VD_INVALID_STATE);
6848 rc2 = vdThreadFinishRead(pDisk);
6849 AssertRC(rc2);
6850 fLockRead = false;
6851
6852 /*
6853 * Destroy the current discard state first which might still have pending blocks
6854 * for the currently opened image which will be switched to readonly mode.
6855 */
6856 /* Lock disk for writing, as we modify pDisk information below. */
6857 rc2 = vdThreadStartWrite(pDisk);
6858 AssertRC(rc2);
6859 fLockWrite = true;
6860 rc = vdDiscardStateDestroy(pDisk);
6861 if (RT_FAILURE(rc))
6862 break;
6863 rc2 = vdThreadFinishWrite(pDisk);
6864 AssertRC(rc2);
6865 fLockWrite = false;
6866
6867 /* Set up image descriptor. */
6868 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6869 if (!pImage)
6870 {
6871 rc = VERR_NO_MEMORY;
6872 break;
6873 }
6874 pImage->pszFilename = RTStrDup(pszFilename);
6875 if (!pImage->pszFilename)
6876 {
6877 rc = VERR_NO_MEMORY;
6878 break;
6879 }
6880
6881 rc = vdFindBackend(pszBackend, &pImage->Backend);
6882 if (RT_FAILURE(rc))
6883 break;
6884 if (!pImage->Backend)
6885 {
6886 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6887 N_("VD: unknown backend name '%s'"), pszBackend);
6888 break;
6889 }
6890 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DIFF)
6891 || !(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6892 | VD_CAP_CREATE_DYNAMIC)))
6893 {
6894 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6895 N_("VD: backend '%s' cannot create diff images"), pszBackend);
6896 break;
6897 }
6898
6899 pImage->VDIo.pDisk = pDisk;
6900 pImage->pVDIfsImage = pVDIfsImage;
6901
6902 /* Set up the I/O interface. */
6903 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6904 if (!pImage->VDIo.pInterfaceIo)
6905 {
6906 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6907 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6908 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6909 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6910 }
6911
6912 /* Set up the internal I/O interface. */
6913 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6914 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6915 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6916 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6917 AssertRC(rc);
6918
6919 /* Create UUID if the caller didn't specify one. */
6920 if (!pUuid)
6921 {
6922 rc = RTUuidCreate(&uuid);
6923 if (RT_FAILURE(rc))
6924 {
6925 rc = vdError(pDisk, rc, RT_SRC_POS,
6926 N_("VD: cannot generate UUID for image '%s'"),
6927 pszFilename);
6928 break;
6929 }
6930 pUuid = &uuid;
6931 }
6932
6933 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6934 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6935 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6936 rc = pImage->Backend->pfnCreate(pImage->pszFilename, pDisk->cbSize,
6937 uImageFlags | VD_IMAGE_FLAGS_DIFF,
6938 pszComment, &pDisk->PCHSGeometry,
6939 &pDisk->LCHSGeometry, pUuid,
6940 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6941 0, 99,
6942 pDisk->pVDIfsDisk,
6943 pImage->pVDIfsImage,
6944 pVDIfsOperation,
6945 &pImage->pBackendData);
6946
6947 if (RT_SUCCESS(rc))
6948 {
6949 pImage->VDIo.pBackendData = pImage->pBackendData;
6950 pImage->uImageFlags = uImageFlags;
6951
6952 /* Lock disk for writing, as we modify pDisk information below. */
6953 rc2 = vdThreadStartWrite(pDisk);
6954 AssertRC(rc2);
6955 fLockWrite = true;
6956
6957 /* Switch previous image to read-only mode. */
6958 unsigned uOpenFlagsPrevImg;
6959 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
6960 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
6961 {
6962 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
6963 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
6964 }
6965
6966 /** @todo optionally check UUIDs */
6967
6968 /* Re-check state, as the lock wasn't held and another image
6969 * creation call could have been done by another thread. */
6970 AssertMsgStmt(pDisk->cImages != 0,
6971 ("Create diff image cannot be done without other images open\n"),
6972 rc = VERR_VD_INVALID_STATE);
6973 }
6974
6975 if (RT_SUCCESS(rc))
6976 {
6977 RTUUID Uuid;
6978 RTTIMESPEC ts;
6979
6980 if (pParentUuid && !RTUuidIsNull(pParentUuid))
6981 {
6982 Uuid = *pParentUuid;
6983 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6984 }
6985 else
6986 {
6987 rc2 = pDisk->pLast->Backend->pfnGetUuid(pDisk->pLast->pBackendData,
6988 &Uuid);
6989 if (RT_SUCCESS(rc2))
6990 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6991 }
6992 rc2 = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6993 &Uuid);
6994 if (RT_SUCCESS(rc2))
6995 pImage->Backend->pfnSetParentModificationUuid(pImage->pBackendData,
6996 &Uuid);
6997 if (pDisk->pLast->Backend->pfnGetTimeStamp)
6998 rc2 = pDisk->pLast->Backend->pfnGetTimeStamp(pDisk->pLast->pBackendData,
6999 &ts);
7000 else
7001 rc2 = VERR_NOT_IMPLEMENTED;
7002 if (RT_SUCCESS(rc2) && pImage->Backend->pfnSetParentTimeStamp)
7003 pImage->Backend->pfnSetParentTimeStamp(pImage->pBackendData, &ts);
7004
7005 if (pImage->Backend->pfnSetParentFilename)
7006 rc2 = pImage->Backend->pfnSetParentFilename(pImage->pBackendData, pDisk->pLast->pszFilename);
7007 }
7008
7009 if (RT_SUCCESS(rc))
7010 {
7011 /* Image successfully opened, make it the last image. */
7012 vdAddImageToList(pDisk, pImage);
7013 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
7014 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
7015 }
7016 else
7017 {
7018 /* Error detected, but image opened. Close and delete image. */
7019 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
7020 AssertRC(rc2);
7021 pImage->pBackendData = NULL;
7022 }
7023 } while (0);
7024
7025 if (RT_UNLIKELY(fLockWrite))
7026 {
7027 rc2 = vdThreadFinishWrite(pDisk);
7028 AssertRC(rc2);
7029 }
7030 else if (RT_UNLIKELY(fLockRead))
7031 {
7032 rc2 = vdThreadFinishRead(pDisk);
7033 AssertRC(rc2);
7034 }
7035
7036 if (RT_FAILURE(rc))
7037 {
7038 if (pImage)
7039 {
7040 if (pImage->pszFilename)
7041 RTStrFree(pImage->pszFilename);
7042 RTMemFree(pImage);
7043 }
7044 }
7045
7046 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7047 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7048
7049 LogFlowFunc(("returns %Rrc\n", rc));
7050 return rc;
7051}
7052
7053
7054/**
7055 * Creates and opens new cache image file in HDD container.
7056 *
7057 * @return VBox status code.
7058 * @param pDisk Name of the cache file backend to use (case insensitive).
7059 * @param pszFilename Name of the differencing cache file to create.
7060 * @param cbSize Maximum size of the cache.
7061 * @param uImageFlags Flags specifying special cache features.
7062 * @param pszComment Pointer to image comment. NULL is ok.
7063 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
7064 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7065 * @param pVDIfsCache Pointer to the per-cache VD interface list.
7066 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7067 */
7068VBOXDDU_DECL(int) VDCreateCache(PVBOXHDD pDisk, const char *pszBackend,
7069 const char *pszFilename, uint64_t cbSize,
7070 unsigned uImageFlags, const char *pszComment,
7071 PCRTUUID pUuid, unsigned uOpenFlags,
7072 PVDINTERFACE pVDIfsCache, PVDINTERFACE pVDIfsOperation)
7073{
7074 int rc = VINF_SUCCESS;
7075 int rc2;
7076 bool fLockWrite = false, fLockRead = false;
7077 PVDCACHE pCache = NULL;
7078 RTUUID uuid;
7079
7080 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
7081 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsCache, pVDIfsOperation));
7082
7083 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7084
7085 do
7086 {
7087 /* sanity check */
7088 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7089 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7090
7091 /* Check arguments. */
7092 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
7093 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
7094 rc = VERR_INVALID_PARAMETER);
7095 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
7096 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
7097 rc = VERR_INVALID_PARAMETER);
7098 AssertMsgBreakStmt(cbSize,
7099 ("cbSize=%llu\n", cbSize),
7100 rc = VERR_INVALID_PARAMETER);
7101 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
7102 ("uImageFlags=%#x\n", uImageFlags),
7103 rc = VERR_INVALID_PARAMETER);
7104 /* The UUID may be NULL. */
7105 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
7106 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
7107 rc = VERR_INVALID_PARAMETER);
7108 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
7109 ("uOpenFlags=%#x\n", uOpenFlags),
7110 rc = VERR_INVALID_PARAMETER);
7111
7112 /* Check state. Needs a temporary read lock. Holding the write lock
7113 * all the time would be blocking other activities for too long. */
7114 rc2 = vdThreadStartRead(pDisk);
7115 AssertRC(rc2);
7116 fLockRead = true;
7117 AssertMsgBreakStmt(!pDisk->pCache,
7118 ("Create cache image cannot be done with a cache already attached\n"),
7119 rc = VERR_VD_CACHE_ALREADY_EXISTS);
7120 rc2 = vdThreadFinishRead(pDisk);
7121 AssertRC(rc2);
7122 fLockRead = false;
7123
7124 /* Set up image descriptor. */
7125 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
7126 if (!pCache)
7127 {
7128 rc = VERR_NO_MEMORY;
7129 break;
7130 }
7131 pCache->pszFilename = RTStrDup(pszFilename);
7132 if (!pCache->pszFilename)
7133 {
7134 rc = VERR_NO_MEMORY;
7135 break;
7136 }
7137
7138 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
7139 if (RT_FAILURE(rc))
7140 break;
7141 if (!pCache->Backend)
7142 {
7143 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
7144 N_("VD: unknown backend name '%s'"), pszBackend);
7145 break;
7146 }
7147
7148 pCache->VDIo.pDisk = pDisk;
7149 pCache->pVDIfsCache = pVDIfsCache;
7150
7151 /* Set up the I/O interface. */
7152 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
7153 if (!pCache->VDIo.pInterfaceIo)
7154 {
7155 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
7156 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
7157 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
7158 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
7159 }
7160
7161 /* Set up the internal I/O interface. */
7162 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
7163 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
7164 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
7165 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
7166 AssertRC(rc);
7167
7168 /* Create UUID if the caller didn't specify one. */
7169 if (!pUuid)
7170 {
7171 rc = RTUuidCreate(&uuid);
7172 if (RT_FAILURE(rc))
7173 {
7174 rc = vdError(pDisk, rc, RT_SRC_POS,
7175 N_("VD: cannot generate UUID for image '%s'"),
7176 pszFilename);
7177 break;
7178 }
7179 pUuid = &uuid;
7180 }
7181
7182 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
7183 pCache->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
7184 rc = pCache->Backend->pfnCreate(pCache->pszFilename, cbSize,
7185 uImageFlags,
7186 pszComment, pUuid,
7187 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
7188 0, 99,
7189 pDisk->pVDIfsDisk,
7190 pCache->pVDIfsCache,
7191 pVDIfsOperation,
7192 &pCache->pBackendData);
7193
7194 if (RT_SUCCESS(rc))
7195 {
7196 /* Lock disk for writing, as we modify pDisk information below. */
7197 rc2 = vdThreadStartWrite(pDisk);
7198 AssertRC(rc2);
7199 fLockWrite = true;
7200
7201 pCache->VDIo.pBackendData = pCache->pBackendData;
7202
7203 /* Re-check state, as the lock wasn't held and another image
7204 * creation call could have been done by another thread. */
7205 AssertMsgStmt(!pDisk->pCache,
7206 ("Create cache image cannot be done with another cache open\n"),
7207 rc = VERR_VD_CACHE_ALREADY_EXISTS);
7208 }
7209
7210 if ( RT_SUCCESS(rc)
7211 && pDisk->pLast)
7212 {
7213 RTUUID UuidModification;
7214
7215 /* Set same modification Uuid as the last image. */
7216 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
7217 &UuidModification);
7218 if (RT_SUCCESS(rc))
7219 {
7220 rc = pCache->Backend->pfnSetModificationUuid(pCache->pBackendData,
7221 &UuidModification);
7222 }
7223
7224 if (rc == VERR_NOT_SUPPORTED)
7225 rc = VINF_SUCCESS;
7226 }
7227
7228 if (RT_SUCCESS(rc))
7229 {
7230 /* Cache successfully created. */
7231 pDisk->pCache = pCache;
7232 }
7233 else
7234 {
7235 /* Error detected, but image opened. Close and delete image. */
7236 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, true);
7237 AssertRC(rc2);
7238 pCache->pBackendData = NULL;
7239 }
7240 } while (0);
7241
7242 if (RT_UNLIKELY(fLockWrite))
7243 {
7244 rc2 = vdThreadFinishWrite(pDisk);
7245 AssertRC(rc2);
7246 }
7247 else if (RT_UNLIKELY(fLockRead))
7248 {
7249 rc2 = vdThreadFinishRead(pDisk);
7250 AssertRC(rc2);
7251 }
7252
7253 if (RT_FAILURE(rc))
7254 {
7255 if (pCache)
7256 {
7257 if (pCache->pszFilename)
7258 RTStrFree(pCache->pszFilename);
7259 RTMemFree(pCache);
7260 }
7261 }
7262
7263 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7264 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7265
7266 LogFlowFunc(("returns %Rrc\n", rc));
7267 return rc;
7268}
7269
7270/**
7271 * Merges two images (not necessarily with direct parent/child relationship).
7272 * As a side effect the source image and potentially the other images which
7273 * are also merged to the destination are deleted from both the disk and the
7274 * images in the HDD container.
7275 *
7276 * @returns VBox status code.
7277 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7278 * @param pDisk Pointer to HDD container.
7279 * @param nImageFrom Name of the image file to merge from.
7280 * @param nImageTo Name of the image file to merge to.
7281 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7282 */
7283VBOXDDU_DECL(int) VDMerge(PVBOXHDD pDisk, unsigned nImageFrom,
7284 unsigned nImageTo, PVDINTERFACE pVDIfsOperation)
7285{
7286 int rc = VINF_SUCCESS;
7287 int rc2;
7288 bool fLockWrite = false, fLockRead = false;
7289 void *pvBuf = NULL;
7290
7291 LogFlowFunc(("pDisk=%#p nImageFrom=%u nImageTo=%u pVDIfsOperation=%#p\n",
7292 pDisk, nImageFrom, nImageTo, pVDIfsOperation));
7293
7294 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7295
7296 do
7297 {
7298 /* sanity check */
7299 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
7300 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
7301
7302 /* For simplicity reasons lock for writing as the image reopen below
7303 * might need it. After all the reopen is usually needed. */
7304 rc2 = vdThreadStartWrite(pDisk);
7305 AssertRC(rc2);
7306 fLockWrite = true;
7307 PVDIMAGE pImageFrom = vdGetImageByNumber(pDisk, nImageFrom);
7308 PVDIMAGE pImageTo = vdGetImageByNumber(pDisk, nImageTo);
7309 if (!pImageFrom || !pImageTo)
7310 {
7311 rc = VERR_VD_IMAGE_NOT_FOUND;
7312 break;
7313 }
7314 AssertBreakStmt(pImageFrom != pImageTo, rc = VERR_INVALID_PARAMETER);
7315
7316 /* Make sure destination image is writable. */
7317 unsigned uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7318 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
7319 {
7320 /*
7321 * Clear skip consistency checks because the image is made writable now and
7322 * skipping consistency checks is only possible for readonly images.
7323 */
7324 uOpenFlags &= ~(VD_OPEN_FLAGS_READONLY | VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS);
7325 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7326 uOpenFlags);
7327 if (RT_FAILURE(rc))
7328 break;
7329 }
7330
7331 /* Get size of destination image. */
7332 uint64_t cbSize = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
7333 rc2 = vdThreadFinishWrite(pDisk);
7334 AssertRC(rc2);
7335 fLockWrite = false;
7336
7337 /* Allocate tmp buffer. */
7338 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
7339 if (!pvBuf)
7340 {
7341 rc = VERR_NO_MEMORY;
7342 break;
7343 }
7344
7345 /* Merging is done directly on the images itself. This potentially
7346 * causes trouble if the disk is full in the middle of operation. */
7347 if (nImageFrom < nImageTo)
7348 {
7349 /* Merge parent state into child. This means writing all not
7350 * allocated blocks in the destination image which are allocated in
7351 * the images to be merged. */
7352 uint64_t uOffset = 0;
7353 uint64_t cbRemaining = cbSize;
7354 do
7355 {
7356 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7357 RTSGSEG SegmentBuf;
7358 RTSGBUF SgBuf;
7359 VDIOCTX IoCtx;
7360
7361 SegmentBuf.pvSeg = pvBuf;
7362 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7363 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7364 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7365 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7366
7367 /* Need to hold the write lock during a read-write operation. */
7368 rc2 = vdThreadStartWrite(pDisk);
7369 AssertRC(rc2);
7370 fLockWrite = true;
7371
7372 rc = pImageTo->Backend->pfnRead(pImageTo->pBackendData,
7373 uOffset, cbThisRead,
7374 &IoCtx, &cbThisRead);
7375 if (rc == VERR_VD_BLOCK_FREE)
7376 {
7377 /* Search for image with allocated block. Do not attempt to
7378 * read more than the previous reads marked as valid.
7379 * Otherwise this would return stale data when different
7380 * block sizes are used for the images. */
7381 for (PVDIMAGE pCurrImage = pImageTo->pPrev;
7382 pCurrImage != NULL && pCurrImage != pImageFrom->pPrev && rc == VERR_VD_BLOCK_FREE;
7383 pCurrImage = pCurrImage->pPrev)
7384 {
7385 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7386 uOffset, cbThisRead,
7387 &IoCtx, &cbThisRead);
7388 }
7389
7390 if (rc != VERR_VD_BLOCK_FREE)
7391 {
7392 if (RT_FAILURE(rc))
7393 break;
7394 /* Updating the cache is required because this might be a live merge. */
7395 rc = vdWriteHelperEx(pDisk, pImageTo, pImageFrom->pPrev,
7396 uOffset, pvBuf, cbThisRead,
7397 VDIOCTX_FLAGS_READ_UPDATE_CACHE, 0);
7398 if (RT_FAILURE(rc))
7399 break;
7400 }
7401 else
7402 rc = VINF_SUCCESS;
7403 }
7404 else if (RT_FAILURE(rc))
7405 break;
7406
7407 rc2 = vdThreadFinishWrite(pDisk);
7408 AssertRC(rc2);
7409 fLockWrite = false;
7410
7411 uOffset += cbThisRead;
7412 cbRemaining -= cbThisRead;
7413
7414 if (pIfProgress && pIfProgress->pfnProgress)
7415 {
7416 /** @todo r=klaus: this can update the progress to the same
7417 * percentage over and over again if the image format makes
7418 * relatively small increments. */
7419 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7420 uOffset * 99 / cbSize);
7421 if (RT_FAILURE(rc))
7422 break;
7423 }
7424 } while (uOffset < cbSize);
7425 }
7426 else
7427 {
7428 /*
7429 * We may need to update the parent uuid of the child coming after
7430 * the last image to be merged. We have to reopen it read/write.
7431 *
7432 * This is done before we do the actual merge to prevent an
7433 * inconsistent chain if the mode change fails for some reason.
7434 */
7435 if (pImageFrom->pNext)
7436 {
7437 PVDIMAGE pImageChild = pImageFrom->pNext;
7438
7439 /* Take the write lock. */
7440 rc2 = vdThreadStartWrite(pDisk);
7441 AssertRC(rc2);
7442 fLockWrite = true;
7443
7444 /* We need to open the image in read/write mode. */
7445 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7446
7447 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
7448 {
7449 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
7450 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7451 uOpenFlags);
7452 if (RT_FAILURE(rc))
7453 break;
7454 }
7455
7456 rc2 = vdThreadFinishWrite(pDisk);
7457 AssertRC(rc2);
7458 fLockWrite = false;
7459 }
7460
7461 /* If the merge is from the last image we have to relay all writes
7462 * to the merge destination as well, so that concurrent writes
7463 * (in case of a live merge) are handled correctly. */
7464 if (!pImageFrom->pNext)
7465 {
7466 /* Take the write lock. */
7467 rc2 = vdThreadStartWrite(pDisk);
7468 AssertRC(rc2);
7469 fLockWrite = true;
7470
7471 pDisk->pImageRelay = pImageTo;
7472
7473 rc2 = vdThreadFinishWrite(pDisk);
7474 AssertRC(rc2);
7475 fLockWrite = false;
7476 }
7477
7478 /* Merge child state into parent. This means writing all blocks
7479 * which are allocated in the image up to the source image to the
7480 * destination image. */
7481 uint64_t uOffset = 0;
7482 uint64_t cbRemaining = cbSize;
7483 do
7484 {
7485 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7486 RTSGSEG SegmentBuf;
7487 RTSGBUF SgBuf;
7488 VDIOCTX IoCtx;
7489
7490 rc = VERR_VD_BLOCK_FREE;
7491
7492 SegmentBuf.pvSeg = pvBuf;
7493 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7494 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7495 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7496 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7497
7498 /* Need to hold the write lock during a read-write operation. */
7499 rc2 = vdThreadStartWrite(pDisk);
7500 AssertRC(rc2);
7501 fLockWrite = true;
7502
7503 /* Search for image with allocated block. Do not attempt to
7504 * read more than the previous reads marked as valid. Otherwise
7505 * this would return stale data when different block sizes are
7506 * used for the images. */
7507 for (PVDIMAGE pCurrImage = pImageFrom;
7508 pCurrImage != NULL && pCurrImage != pImageTo && rc == VERR_VD_BLOCK_FREE;
7509 pCurrImage = pCurrImage->pPrev)
7510 {
7511 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7512 uOffset, cbThisRead,
7513 &IoCtx, &cbThisRead);
7514 }
7515
7516 if (rc != VERR_VD_BLOCK_FREE)
7517 {
7518 if (RT_FAILURE(rc))
7519 break;
7520 rc = vdWriteHelper(pDisk, pImageTo, uOffset, pvBuf,
7521 cbThisRead, VDIOCTX_FLAGS_READ_UPDATE_CACHE);
7522 if (RT_FAILURE(rc))
7523 break;
7524 }
7525 else
7526 rc = VINF_SUCCESS;
7527
7528 rc2 = vdThreadFinishWrite(pDisk);
7529 AssertRC(rc2);
7530 fLockWrite = false;
7531
7532 uOffset += cbThisRead;
7533 cbRemaining -= cbThisRead;
7534
7535 if (pIfProgress && pIfProgress->pfnProgress)
7536 {
7537 /** @todo r=klaus: this can update the progress to the same
7538 * percentage over and over again if the image format makes
7539 * relatively small increments. */
7540 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7541 uOffset * 99 / cbSize);
7542 if (RT_FAILURE(rc))
7543 break;
7544 }
7545 } while (uOffset < cbSize);
7546
7547 /* In case we set up a "write proxy" image above we must clear
7548 * this again now to prevent stray writes. Failure or not. */
7549 if (!pImageFrom->pNext)
7550 {
7551 /* Take the write lock. */
7552 rc2 = vdThreadStartWrite(pDisk);
7553 AssertRC(rc2);
7554 fLockWrite = true;
7555
7556 pDisk->pImageRelay = NULL;
7557
7558 rc2 = vdThreadFinishWrite(pDisk);
7559 AssertRC(rc2);
7560 fLockWrite = false;
7561 }
7562 }
7563
7564 /*
7565 * Leave in case of an error to avoid corrupted data in the image chain
7566 * (includes cancelling the operation by the user).
7567 */
7568 if (RT_FAILURE(rc))
7569 break;
7570
7571 /* Need to hold the write lock while finishing the merge. */
7572 rc2 = vdThreadStartWrite(pDisk);
7573 AssertRC(rc2);
7574 fLockWrite = true;
7575
7576 /* Update parent UUID so that image chain is consistent.
7577 * The two attempts work around the problem that some backends
7578 * (e.g. iSCSI) do not support UUIDs, so we exploit the fact that
7579 * so far there can only be one such image in the chain. */
7580 /** @todo needs a better long-term solution, passing the UUID
7581 * knowledge from the caller or some such */
7582 RTUUID Uuid;
7583 PVDIMAGE pImageChild = NULL;
7584 if (nImageFrom < nImageTo)
7585 {
7586 if (pImageFrom->pPrev)
7587 {
7588 /* plan A: ask the parent itself for its UUID */
7589 rc = pImageFrom->pPrev->Backend->pfnGetUuid(pImageFrom->pPrev->pBackendData,
7590 &Uuid);
7591 if (RT_FAILURE(rc))
7592 {
7593 /* plan B: ask the child of the parent for parent UUID */
7594 rc = pImageFrom->Backend->pfnGetParentUuid(pImageFrom->pBackendData,
7595 &Uuid);
7596 }
7597 AssertRC(rc);
7598 }
7599 else
7600 RTUuidClear(&Uuid);
7601 rc = pImageTo->Backend->pfnSetParentUuid(pImageTo->pBackendData,
7602 &Uuid);
7603 AssertRC(rc);
7604 }
7605 else
7606 {
7607 /* Update the parent uuid of the child of the last merged image. */
7608 if (pImageFrom->pNext)
7609 {
7610 /* plan A: ask the parent itself for its UUID */
7611 rc = pImageTo->Backend->pfnGetUuid(pImageTo->pBackendData,
7612 &Uuid);
7613 if (RT_FAILURE(rc))
7614 {
7615 /* plan B: ask the child of the parent for parent UUID */
7616 rc = pImageTo->pNext->Backend->pfnGetParentUuid(pImageTo->pNext->pBackendData,
7617 &Uuid);
7618 }
7619 AssertRC(rc);
7620
7621 rc = pImageFrom->Backend->pfnSetParentUuid(pImageFrom->pNext->pBackendData,
7622 &Uuid);
7623 AssertRC(rc);
7624
7625 pImageChild = pImageFrom->pNext;
7626 }
7627 }
7628
7629 /* Delete the no longer needed images. */
7630 PVDIMAGE pImg = pImageFrom, pTmp;
7631 while (pImg != pImageTo)
7632 {
7633 if (nImageFrom < nImageTo)
7634 pTmp = pImg->pNext;
7635 else
7636 pTmp = pImg->pPrev;
7637 vdRemoveImageFromList(pDisk, pImg);
7638 pImg->Backend->pfnClose(pImg->pBackendData, true);
7639 RTMemFree(pImg->pszFilename);
7640 RTMemFree(pImg);
7641 pImg = pTmp;
7642 }
7643
7644 /* Make sure destination image is back to read only if necessary. */
7645 if (pImageTo != pDisk->pLast)
7646 {
7647 uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7648 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7649 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7650 uOpenFlags);
7651 if (RT_FAILURE(rc))
7652 break;
7653 }
7654
7655 /*
7656 * Make sure the child is readonly
7657 * for the child -> parent merge direction
7658 * if necessary.
7659 */
7660 if ( nImageFrom > nImageTo
7661 && pImageChild
7662 && pImageChild != pDisk->pLast)
7663 {
7664 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7665 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7666 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7667 uOpenFlags);
7668 if (RT_FAILURE(rc))
7669 break;
7670 }
7671 } while (0);
7672
7673 if (RT_UNLIKELY(fLockWrite))
7674 {
7675 rc2 = vdThreadFinishWrite(pDisk);
7676 AssertRC(rc2);
7677 }
7678 else if (RT_UNLIKELY(fLockRead))
7679 {
7680 rc2 = vdThreadFinishRead(pDisk);
7681 AssertRC(rc2);
7682 }
7683
7684 if (pvBuf)
7685 RTMemTmpFree(pvBuf);
7686
7687 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7688 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7689
7690 LogFlowFunc(("returns %Rrc\n", rc));
7691 return rc;
7692}
7693
7694/**
7695 * Copies an image from one HDD container to another - extended version.
7696 * The copy is opened in the target HDD container.
7697 * It is possible to convert between different image formats, because the
7698 * backend for the destination may be different from the source.
7699 * If both the source and destination reference the same HDD container,
7700 * then the image is moved (by copying/deleting or renaming) to the new location.
7701 * The source container is unchanged if the move operation fails, otherwise
7702 * the image at the new location is opened in the same way as the old one was.
7703 *
7704 * @note The read/write accesses across disks are not synchronized, just the
7705 * accesses to each disk. Once there is a use case which requires a defined
7706 * read/write behavior in this situation this needs to be extended.
7707 *
7708 * @return VBox status code.
7709 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7710 * @param pDiskFrom Pointer to source HDD container.
7711 * @param nImage Image number, counts from 0. 0 is always base image of container.
7712 * @param pDiskTo Pointer to destination HDD container.
7713 * @param pszBackend Name of the image file backend to use (may be NULL to use the same as the source, case insensitive).
7714 * @param pszFilename New name of the image (may be NULL to specify that the
7715 * copy destination is the destination container, or
7716 * if pDiskFrom == pDiskTo, i.e. when moving).
7717 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7718 * @param cbSize New image size (0 means leave unchanged).
7719 * @param nImageSameFrom todo
7720 * @param nImageSameTo todo
7721 * @param uImageFlags Flags specifying special destination image features.
7722 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7723 * This parameter is used if and only if a true copy is created.
7724 * In all rename/move cases or copy to existing image cases the modification UUIDs are copied over.
7725 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7726 * Only used if the destination image is created.
7727 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7728 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7729 * destination image.
7730 * @param pDstVDIfsOperation Pointer to the per-operation VD interface list,
7731 * for the destination operation.
7732 */
7733VBOXDDU_DECL(int) VDCopyEx(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
7734 const char *pszBackend, const char *pszFilename,
7735 bool fMoveByRename, uint64_t cbSize,
7736 unsigned nImageFromSame, unsigned nImageToSame,
7737 unsigned uImageFlags, PCRTUUID pDstUuid,
7738 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7739 PVDINTERFACE pDstVDIfsImage,
7740 PVDINTERFACE pDstVDIfsOperation)
7741{
7742 int rc = VINF_SUCCESS;
7743 int rc2;
7744 bool fLockReadFrom = false, fLockWriteFrom = false, fLockWriteTo = false;
7745 PVDIMAGE pImageTo = NULL;
7746
7747 LogFlowFunc(("pDiskFrom=%#p nImage=%u pDiskTo=%#p pszBackend=\"%s\" pszFilename=\"%s\" fMoveByRename=%d cbSize=%llu nImageFromSame=%u nImageToSame=%u uImageFlags=%#x pDstUuid=%#p uOpenFlags=%#x pVDIfsOperation=%#p pDstVDIfsImage=%#p pDstVDIfsOperation=%#p\n",
7748 pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename, cbSize, nImageFromSame, nImageToSame, uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation, pDstVDIfsImage, pDstVDIfsOperation));
7749
7750 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7751 PVDINTERFACEPROGRESS pDstIfProgress = VDIfProgressGet(pDstVDIfsOperation);
7752
7753 do {
7754 /* Check arguments. */
7755 AssertMsgBreakStmt(VALID_PTR(pDiskFrom), ("pDiskFrom=%#p\n", pDiskFrom),
7756 rc = VERR_INVALID_PARAMETER);
7757 AssertMsg(pDiskFrom->u32Signature == VBOXHDDDISK_SIGNATURE,
7758 ("u32Signature=%08x\n", pDiskFrom->u32Signature));
7759
7760 rc2 = vdThreadStartRead(pDiskFrom);
7761 AssertRC(rc2);
7762 fLockReadFrom = true;
7763 PVDIMAGE pImageFrom = vdGetImageByNumber(pDiskFrom, nImage);
7764 AssertPtrBreakStmt(pImageFrom, rc = VERR_VD_IMAGE_NOT_FOUND);
7765 AssertMsgBreakStmt(VALID_PTR(pDiskTo), ("pDiskTo=%#p\n", pDiskTo),
7766 rc = VERR_INVALID_PARAMETER);
7767 AssertMsg(pDiskTo->u32Signature == VBOXHDDDISK_SIGNATURE,
7768 ("u32Signature=%08x\n", pDiskTo->u32Signature));
7769 AssertMsgBreakStmt( (nImageFromSame < nImage || nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7770 && (nImageToSame < pDiskTo->cImages || nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7771 && ( (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN && nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7772 || (nImageFromSame != VD_IMAGE_CONTENT_UNKNOWN && nImageToSame != VD_IMAGE_CONTENT_UNKNOWN)),
7773 ("nImageFromSame=%u nImageToSame=%u\n", nImageFromSame, nImageToSame),
7774 rc = VERR_INVALID_PARAMETER);
7775
7776 /* Move the image. */
7777 if (pDiskFrom == pDiskTo)
7778 {
7779 /* Rename only works when backends are the same, are file based
7780 * and the rename method is implemented. */
7781 if ( fMoveByRename
7782 && !RTStrICmp(pszBackend, pImageFrom->Backend->pszBackendName)
7783 && pImageFrom->Backend->uBackendCaps & VD_CAP_FILE
7784 && pImageFrom->Backend->pfnRename)
7785 {
7786 rc2 = vdThreadFinishRead(pDiskFrom);
7787 AssertRC(rc2);
7788 fLockReadFrom = false;
7789
7790 rc2 = vdThreadStartWrite(pDiskFrom);
7791 AssertRC(rc2);
7792 fLockWriteFrom = true;
7793 rc = pImageFrom->Backend->pfnRename(pImageFrom->pBackendData, pszFilename ? pszFilename : pImageFrom->pszFilename);
7794 break;
7795 }
7796
7797 /** @todo Moving (including shrinking/growing) of the image is
7798 * requested, but the rename attempt failed or it wasn't possible.
7799 * Must now copy image to temp location. */
7800 AssertReleaseMsgFailed(("VDCopy: moving by copy/delete not implemented\n"));
7801 }
7802
7803 /* pszFilename is allowed to be NULL, as this indicates copy to the existing image. */
7804 AssertMsgBreakStmt(pszFilename == NULL || (VALID_PTR(pszFilename) && *pszFilename),
7805 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
7806 rc = VERR_INVALID_PARAMETER);
7807
7808 uint64_t cbSizeFrom;
7809 cbSizeFrom = pImageFrom->Backend->pfnGetSize(pImageFrom->pBackendData);
7810 if (cbSizeFrom == 0)
7811 {
7812 rc = VERR_VD_VALUE_NOT_FOUND;
7813 break;
7814 }
7815
7816 VDGEOMETRY PCHSGeometryFrom = {0, 0, 0};
7817 VDGEOMETRY LCHSGeometryFrom = {0, 0, 0};
7818 pImageFrom->Backend->pfnGetPCHSGeometry(pImageFrom->pBackendData, &PCHSGeometryFrom);
7819 pImageFrom->Backend->pfnGetLCHSGeometry(pImageFrom->pBackendData, &LCHSGeometryFrom);
7820
7821 RTUUID ImageUuid, ImageModificationUuid;
7822 if (pDiskFrom != pDiskTo)
7823 {
7824 if (pDstUuid)
7825 ImageUuid = *pDstUuid;
7826 else
7827 RTUuidCreate(&ImageUuid);
7828 }
7829 else
7830 {
7831 rc = pImageFrom->Backend->pfnGetUuid(pImageFrom->pBackendData, &ImageUuid);
7832 if (RT_FAILURE(rc))
7833 RTUuidCreate(&ImageUuid);
7834 }
7835 rc = pImageFrom->Backend->pfnGetModificationUuid(pImageFrom->pBackendData, &ImageModificationUuid);
7836 if (RT_FAILURE(rc))
7837 RTUuidClear(&ImageModificationUuid);
7838
7839 char szComment[1024];
7840 rc = pImageFrom->Backend->pfnGetComment(pImageFrom->pBackendData, szComment, sizeof(szComment));
7841 if (RT_FAILURE(rc))
7842 szComment[0] = '\0';
7843 else
7844 szComment[sizeof(szComment) - 1] = '\0';
7845
7846 rc2 = vdThreadFinishRead(pDiskFrom);
7847 AssertRC(rc2);
7848 fLockReadFrom = false;
7849
7850 rc2 = vdThreadStartRead(pDiskTo);
7851 AssertRC(rc2);
7852 unsigned cImagesTo = pDiskTo->cImages;
7853 rc2 = vdThreadFinishRead(pDiskTo);
7854 AssertRC(rc2);
7855
7856 if (pszFilename)
7857 {
7858 if (cbSize == 0)
7859 cbSize = cbSizeFrom;
7860
7861 /* Create destination image with the properties of source image. */
7862 /** @todo replace the VDCreateDiff/VDCreateBase calls by direct
7863 * calls to the backend. Unifies the code and reduces the API
7864 * dependencies. Would also make the synchronization explicit. */
7865 if (cImagesTo > 0)
7866 {
7867 rc = VDCreateDiff(pDiskTo, pszBackend, pszFilename,
7868 uImageFlags, szComment, &ImageUuid,
7869 NULL /* pParentUuid */,
7870 uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7871 pDstVDIfsImage, NULL);
7872
7873 rc2 = vdThreadStartWrite(pDiskTo);
7874 AssertRC(rc2);
7875 fLockWriteTo = true;
7876 } else {
7877 /** @todo hack to force creation of a fixed image for
7878 * the RAW backend, which can't handle anything else. */
7879 if (!RTStrICmp(pszBackend, "RAW"))
7880 uImageFlags |= VD_IMAGE_FLAGS_FIXED;
7881
7882 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7883 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7884
7885 rc = VDCreateBase(pDiskTo, pszBackend, pszFilename, cbSize,
7886 uImageFlags, szComment,
7887 &PCHSGeometryFrom, &LCHSGeometryFrom,
7888 NULL, uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7889 pDstVDIfsImage, NULL);
7890
7891 rc2 = vdThreadStartWrite(pDiskTo);
7892 AssertRC(rc2);
7893 fLockWriteTo = true;
7894
7895 if (RT_SUCCESS(rc) && !RTUuidIsNull(&ImageUuid))
7896 pDiskTo->pLast->Backend->pfnSetUuid(pDiskTo->pLast->pBackendData, &ImageUuid);
7897 }
7898 if (RT_FAILURE(rc))
7899 break;
7900
7901 pImageTo = pDiskTo->pLast;
7902 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7903
7904 cbSize = RT_MIN(cbSize, cbSizeFrom);
7905 }
7906 else
7907 {
7908 pImageTo = pDiskTo->pLast;
7909 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7910
7911 uint64_t cbSizeTo;
7912 cbSizeTo = pImageTo->Backend->pfnGetSize(pImageTo->pBackendData);
7913 if (cbSizeTo == 0)
7914 {
7915 rc = VERR_VD_VALUE_NOT_FOUND;
7916 break;
7917 }
7918
7919 if (cbSize == 0)
7920 cbSize = RT_MIN(cbSizeFrom, cbSizeTo);
7921
7922 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7923 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7924
7925 /* Update the geometry in the destination image. */
7926 pImageTo->Backend->pfnSetPCHSGeometry(pImageTo->pBackendData, &PCHSGeometryFrom);
7927 pImageTo->Backend->pfnSetLCHSGeometry(pImageTo->pBackendData, &LCHSGeometryFrom);
7928 }
7929
7930 rc2 = vdThreadFinishWrite(pDiskTo);
7931 AssertRC(rc2);
7932 fLockWriteTo = false;
7933
7934 /* Whether we can take the optimized copy path (false) or not.
7935 * Don't optimize if the image existed or if it is a child image. */
7936 bool fSuppressRedundantIo = ( !(pszFilename == NULL || cImagesTo > 0)
7937 || (nImageToSame != VD_IMAGE_CONTENT_UNKNOWN));
7938 unsigned cImagesFromReadBack, cImagesToReadBack;
7939
7940 if (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7941 cImagesFromReadBack = 0;
7942 else
7943 {
7944 if (nImage == VD_LAST_IMAGE)
7945 cImagesFromReadBack = pDiskFrom->cImages - nImageFromSame - 1;
7946 else
7947 cImagesFromReadBack = nImage - nImageFromSame;
7948 }
7949
7950 if (nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7951 cImagesToReadBack = 0;
7952 else
7953 cImagesToReadBack = pDiskTo->cImages - nImageToSame - 1;
7954
7955 /* Copy the data. */
7956 rc = vdCopyHelper(pDiskFrom, pImageFrom, pDiskTo, cbSize,
7957 cImagesFromReadBack, cImagesToReadBack,
7958 fSuppressRedundantIo, pIfProgress, pDstIfProgress);
7959
7960 if (RT_SUCCESS(rc))
7961 {
7962 rc2 = vdThreadStartWrite(pDiskTo);
7963 AssertRC(rc2);
7964 fLockWriteTo = true;
7965
7966 /* Only set modification UUID if it is non-null, since the source
7967 * backend might not provide a valid modification UUID. */
7968 if (!RTUuidIsNull(&ImageModificationUuid))
7969 pImageTo->Backend->pfnSetModificationUuid(pImageTo->pBackendData, &ImageModificationUuid);
7970
7971 /* Set the requested open flags if they differ from the value
7972 * required for creating the image and copying the contents. */
7973 if ( pImageTo && pszFilename
7974 && uOpenFlags != (uOpenFlags & ~VD_OPEN_FLAGS_READONLY))
7975 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7976 uOpenFlags);
7977 }
7978 } while (0);
7979
7980 if (RT_FAILURE(rc) && pImageTo && pszFilename)
7981 {
7982 /* Take the write lock only if it is not taken. Not worth making the
7983 * above code even more complicated. */
7984 if (RT_UNLIKELY(!fLockWriteTo))
7985 {
7986 rc2 = vdThreadStartWrite(pDiskTo);
7987 AssertRC(rc2);
7988 fLockWriteTo = true;
7989 }
7990 /* Error detected, but new image created. Remove image from list. */
7991 vdRemoveImageFromList(pDiskTo, pImageTo);
7992
7993 /* Close and delete image. */
7994 rc2 = pImageTo->Backend->pfnClose(pImageTo->pBackendData, true);
7995 AssertRC(rc2);
7996 pImageTo->pBackendData = NULL;
7997
7998 /* Free remaining resources. */
7999 if (pImageTo->pszFilename)
8000 RTStrFree(pImageTo->pszFilename);
8001
8002 RTMemFree(pImageTo);
8003 }
8004
8005 if (RT_UNLIKELY(fLockWriteTo))
8006 {
8007 rc2 = vdThreadFinishWrite(pDiskTo);
8008 AssertRC(rc2);
8009 }
8010 if (RT_UNLIKELY(fLockWriteFrom))
8011 {
8012 rc2 = vdThreadFinishWrite(pDiskFrom);
8013 AssertRC(rc2);
8014 }
8015 else if (RT_UNLIKELY(fLockReadFrom))
8016 {
8017 rc2 = vdThreadFinishRead(pDiskFrom);
8018 AssertRC(rc2);
8019 }
8020
8021 if (RT_SUCCESS(rc))
8022 {
8023 if (pIfProgress && pIfProgress->pfnProgress)
8024 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
8025 if (pDstIfProgress && pDstIfProgress->pfnProgress)
8026 pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser, 100);
8027 }
8028
8029 LogFlowFunc(("returns %Rrc\n", rc));
8030 return rc;
8031}
8032
8033/**
8034 * Copies an image from one HDD container to another.
8035 * The copy is opened in the target HDD container.
8036 * It is possible to convert between different image formats, because the
8037 * backend for the destination may be different from the source.
8038 * If both the source and destination reference the same HDD container,
8039 * then the image is moved (by copying/deleting or renaming) to the new location.
8040 * The source container is unchanged if the move operation fails, otherwise
8041 * the image at the new location is opened in the same way as the old one was.
8042 *
8043 * @returns VBox status code.
8044 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8045 * @param pDiskFrom Pointer to source HDD container.
8046 * @param nImage Image number, counts from 0. 0 is always base image of container.
8047 * @param pDiskTo Pointer to destination HDD container.
8048 * @param pszBackend Name of the image file backend to use.
8049 * @param pszFilename New name of the image (may be NULL if pDiskFrom == pDiskTo).
8050 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
8051 * @param cbSize New image size (0 means leave unchanged).
8052 * @param uImageFlags Flags specifying special destination image features.
8053 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
8054 * This parameter is used if and only if a true copy is created.
8055 * In all rename/move cases the UUIDs are copied over.
8056 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
8057 * Only used if the destination image is created.
8058 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
8059 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
8060 * destination image.
8061 * @param pDstVDIfsOperation Pointer to the per-image VD interface list,
8062 * for the destination image.
8063 */
8064VBOXDDU_DECL(int) VDCopy(PVBOXHDD pDiskFrom, unsigned nImage, PVBOXHDD pDiskTo,
8065 const char *pszBackend, const char *pszFilename,
8066 bool fMoveByRename, uint64_t cbSize,
8067 unsigned uImageFlags, PCRTUUID pDstUuid,
8068 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
8069 PVDINTERFACE pDstVDIfsImage,
8070 PVDINTERFACE pDstVDIfsOperation)
8071{
8072 return VDCopyEx(pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename,
8073 cbSize, VD_IMAGE_CONTENT_UNKNOWN, VD_IMAGE_CONTENT_UNKNOWN,
8074 uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation,
8075 pDstVDIfsImage, pDstVDIfsOperation);
8076}
8077
8078/**
8079 * Optimizes the storage consumption of an image. Typically the unused blocks
8080 * have to be wiped with zeroes to achieve a substantial reduced storage use.
8081 * Another optimization done is reordering the image blocks, which can provide
8082 * a significant performance boost, as reads and writes tend to use less random
8083 * file offsets.
8084 *
8085 * @return VBox status code.
8086 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8087 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
8088 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
8089 * the code for this isn't implemented yet.
8090 * @param pDisk Pointer to HDD container.
8091 * @param nImage Image number, counts from 0. 0 is always base image of container.
8092 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
8093 */
8094VBOXDDU_DECL(int) VDCompact(PVBOXHDD pDisk, unsigned nImage,
8095 PVDINTERFACE pVDIfsOperation)
8096{
8097 int rc = VINF_SUCCESS;
8098 int rc2;
8099 bool fLockRead = false, fLockWrite = false;
8100 void *pvBuf = NULL;
8101 void *pvTmp = NULL;
8102
8103 LogFlowFunc(("pDisk=%#p nImage=%u pVDIfsOperation=%#p\n",
8104 pDisk, nImage, pVDIfsOperation));
8105
8106 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
8107
8108 do {
8109 /* Check arguments. */
8110 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
8111 rc = VERR_INVALID_PARAMETER);
8112 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
8113 ("u32Signature=%08x\n", pDisk->u32Signature));
8114
8115 rc2 = vdThreadStartRead(pDisk);
8116 AssertRC(rc2);
8117 fLockRead = true;
8118
8119 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8120 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8121
8122 /* If there is no compact callback for not file based backends then
8123 * the backend doesn't need compaction. No need to make much fuss about
8124 * this. For file based ones signal this as not yet supported. */
8125 if (!pImage->Backend->pfnCompact)
8126 {
8127 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
8128 rc = VERR_NOT_SUPPORTED;
8129 else
8130 rc = VINF_SUCCESS;
8131 break;
8132 }
8133
8134 /* Insert interface for reading parent state into per-operation list,
8135 * if there is a parent image. */
8136 VDINTERFACEPARENTSTATE VDIfParent;
8137 VDPARENTSTATEDESC ParentUser;
8138 if (pImage->pPrev)
8139 {
8140 VDIfParent.pfnParentRead = vdParentRead;
8141 ParentUser.pDisk = pDisk;
8142 ParentUser.pImage = pImage->pPrev;
8143 rc = VDInterfaceAdd(&VDIfParent.Core, "VDCompact_ParentState", VDINTERFACETYPE_PARENTSTATE,
8144 &ParentUser, sizeof(VDINTERFACEPARENTSTATE), &pVDIfsOperation);
8145 AssertRC(rc);
8146 }
8147
8148 rc2 = vdThreadFinishRead(pDisk);
8149 AssertRC(rc2);
8150 fLockRead = false;
8151
8152 rc2 = vdThreadStartWrite(pDisk);
8153 AssertRC(rc2);
8154 fLockWrite = true;
8155
8156 rc = pImage->Backend->pfnCompact(pImage->pBackendData,
8157 0, 99,
8158 pDisk->pVDIfsDisk,
8159 pImage->pVDIfsImage,
8160 pVDIfsOperation);
8161 } while (0);
8162
8163 if (RT_UNLIKELY(fLockWrite))
8164 {
8165 rc2 = vdThreadFinishWrite(pDisk);
8166 AssertRC(rc2);
8167 }
8168 else if (RT_UNLIKELY(fLockRead))
8169 {
8170 rc2 = vdThreadFinishRead(pDisk);
8171 AssertRC(rc2);
8172 }
8173
8174 if (pvBuf)
8175 RTMemTmpFree(pvBuf);
8176 if (pvTmp)
8177 RTMemTmpFree(pvTmp);
8178
8179 if (RT_SUCCESS(rc))
8180 {
8181 if (pIfProgress && pIfProgress->pfnProgress)
8182 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
8183 }
8184
8185 LogFlowFunc(("returns %Rrc\n", rc));
8186 return rc;
8187}
8188
8189/**
8190 * Resizes the given disk image to the given size.
8191 *
8192 * @return VBox status
8193 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
8194 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
8195 *
8196 * @param pDisk Pointer to the HDD container.
8197 * @param cbSize New size of the image.
8198 * @param pPCHSGeometry Pointer to the new physical disk geometry <= (16383,16,63). Not NULL.
8199 * @param pLCHSGeometry Pointer to the new logical disk geometry <= (x,255,63). Not NULL.
8200 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
8201 */
8202VBOXDDU_DECL(int) VDResize(PVBOXHDD pDisk, uint64_t cbSize,
8203 PCVDGEOMETRY pPCHSGeometry,
8204 PCVDGEOMETRY pLCHSGeometry,
8205 PVDINTERFACE pVDIfsOperation)
8206{
8207 /** @todo r=klaus resizing was designed to be part of VDCopy, so having a separate function is not desirable. */
8208 int rc = VINF_SUCCESS;
8209 int rc2;
8210 bool fLockRead = false, fLockWrite = false;
8211
8212 LogFlowFunc(("pDisk=%#p cbSize=%llu pVDIfsOperation=%#p\n",
8213 pDisk, cbSize, pVDIfsOperation));
8214
8215 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
8216
8217 do {
8218 /* Check arguments. */
8219 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
8220 rc = VERR_INVALID_PARAMETER);
8221 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE,
8222 ("u32Signature=%08x\n", pDisk->u32Signature));
8223
8224 rc2 = vdThreadStartRead(pDisk);
8225 AssertRC(rc2);
8226 fLockRead = true;
8227
8228 /* Must have at least one image in the chain, will resize last. */
8229 AssertMsgBreakStmt(pDisk->cImages >= 1, ("cImages=%u\n", pDisk->cImages),
8230 rc = VERR_NOT_SUPPORTED);
8231
8232 PVDIMAGE pImage = pDisk->pLast;
8233
8234 /* If there is no compact callback for not file based backends then
8235 * the backend doesn't need compaction. No need to make much fuss about
8236 * this. For file based ones signal this as not yet supported. */
8237 if (!pImage->Backend->pfnResize)
8238 {
8239 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
8240 rc = VERR_NOT_SUPPORTED;
8241 else
8242 rc = VINF_SUCCESS;
8243 break;
8244 }
8245
8246 rc2 = vdThreadFinishRead(pDisk);
8247 AssertRC(rc2);
8248 fLockRead = false;
8249
8250 rc2 = vdThreadStartWrite(pDisk);
8251 AssertRC(rc2);
8252 fLockWrite = true;
8253
8254 VDGEOMETRY PCHSGeometryOld;
8255 VDGEOMETRY LCHSGeometryOld;
8256 PCVDGEOMETRY pPCHSGeometryNew;
8257 PCVDGEOMETRY pLCHSGeometryNew;
8258
8259 if (pPCHSGeometry->cCylinders == 0)
8260 {
8261 /* Auto-detect marker, calculate new value ourself. */
8262 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData, &PCHSGeometryOld);
8263 if (RT_SUCCESS(rc) && (PCHSGeometryOld.cCylinders != 0))
8264 PCHSGeometryOld.cCylinders = RT_MIN(cbSize / 512 / PCHSGeometryOld.cHeads / PCHSGeometryOld.cSectors, 16383);
8265 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
8266 rc = VINF_SUCCESS;
8267
8268 pPCHSGeometryNew = &PCHSGeometryOld;
8269 }
8270 else
8271 pPCHSGeometryNew = pPCHSGeometry;
8272
8273 if (pLCHSGeometry->cCylinders == 0)
8274 {
8275 /* Auto-detect marker, calculate new value ourself. */
8276 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData, &LCHSGeometryOld);
8277 if (RT_SUCCESS(rc) && (LCHSGeometryOld.cCylinders != 0))
8278 LCHSGeometryOld.cCylinders = cbSize / 512 / LCHSGeometryOld.cHeads / LCHSGeometryOld.cSectors;
8279 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
8280 rc = VINF_SUCCESS;
8281
8282 pLCHSGeometryNew = &LCHSGeometryOld;
8283 }
8284 else
8285 pLCHSGeometryNew = pLCHSGeometry;
8286
8287 if (RT_SUCCESS(rc))
8288 rc = pImage->Backend->pfnResize(pImage->pBackendData,
8289 cbSize,
8290 pPCHSGeometryNew,
8291 pLCHSGeometryNew,
8292 0, 99,
8293 pDisk->pVDIfsDisk,
8294 pImage->pVDIfsImage,
8295 pVDIfsOperation);
8296 } while (0);
8297
8298 if (RT_UNLIKELY(fLockWrite))
8299 {
8300 rc2 = vdThreadFinishWrite(pDisk);
8301 AssertRC(rc2);
8302 }
8303 else if (RT_UNLIKELY(fLockRead))
8304 {
8305 rc2 = vdThreadFinishRead(pDisk);
8306 AssertRC(rc2);
8307 }
8308
8309 if (RT_SUCCESS(rc))
8310 {
8311 if (pIfProgress && pIfProgress->pfnProgress)
8312 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
8313
8314 pDisk->cbSize = cbSize;
8315 }
8316
8317 LogFlowFunc(("returns %Rrc\n", rc));
8318 return rc;
8319}
8320
8321/**
8322 * Closes the last opened image file in HDD container.
8323 * If previous image file was opened in read-only mode (the normal case) and
8324 * the last opened image is in read-write mode then the previous image will be
8325 * reopened in read/write mode.
8326 *
8327 * @returns VBox status code.
8328 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8329 * @param pDisk Pointer to HDD container.
8330 * @param fDelete If true, delete the image from the host disk.
8331 */
8332VBOXDDU_DECL(int) VDClose(PVBOXHDD pDisk, bool fDelete)
8333{
8334 int rc = VINF_SUCCESS;
8335 int rc2;
8336 bool fLockWrite = false;
8337
8338 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8339 do
8340 {
8341 /* sanity check */
8342 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8343 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8344
8345 /* Not worth splitting this up into a read lock phase and write
8346 * lock phase, as closing an image is a relatively fast operation
8347 * dominated by the part which needs the write lock. */
8348 rc2 = vdThreadStartWrite(pDisk);
8349 AssertRC(rc2);
8350 fLockWrite = true;
8351
8352 PVDIMAGE pImage = pDisk->pLast;
8353 if (!pImage)
8354 {
8355 rc = VERR_VD_NOT_OPENED;
8356 break;
8357 }
8358
8359 /* Destroy the current discard state first which might still have pending blocks. */
8360 rc = vdDiscardStateDestroy(pDisk);
8361 if (RT_FAILURE(rc))
8362 break;
8363
8364 unsigned uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8365 /* Remove image from list of opened images. */
8366 vdRemoveImageFromList(pDisk, pImage);
8367 /* Close (and optionally delete) image. */
8368 rc = pImage->Backend->pfnClose(pImage->pBackendData, fDelete);
8369 /* Free remaining resources related to the image. */
8370 RTStrFree(pImage->pszFilename);
8371 RTMemFree(pImage);
8372
8373 pImage = pDisk->pLast;
8374 if (!pImage)
8375 break;
8376
8377 /* If disk was previously in read/write mode, make sure it will stay
8378 * like this (if possible) after closing this image. Set the open flags
8379 * accordingly. */
8380 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
8381 {
8382 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8383 uOpenFlags &= ~ VD_OPEN_FLAGS_READONLY;
8384 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
8385 }
8386
8387 /* Cache disk information. */
8388 pDisk->cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
8389
8390 /* Cache PCHS geometry. */
8391 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8392 &pDisk->PCHSGeometry);
8393 if (RT_FAILURE(rc2))
8394 {
8395 pDisk->PCHSGeometry.cCylinders = 0;
8396 pDisk->PCHSGeometry.cHeads = 0;
8397 pDisk->PCHSGeometry.cSectors = 0;
8398 }
8399 else
8400 {
8401 /* Make sure the PCHS geometry is properly clipped. */
8402 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
8403 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
8404 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
8405 }
8406
8407 /* Cache LCHS geometry. */
8408 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8409 &pDisk->LCHSGeometry);
8410 if (RT_FAILURE(rc2))
8411 {
8412 pDisk->LCHSGeometry.cCylinders = 0;
8413 pDisk->LCHSGeometry.cHeads = 0;
8414 pDisk->LCHSGeometry.cSectors = 0;
8415 }
8416 else
8417 {
8418 /* Make sure the LCHS geometry is properly clipped. */
8419 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
8420 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
8421 }
8422 } while (0);
8423
8424 if (RT_UNLIKELY(fLockWrite))
8425 {
8426 rc2 = vdThreadFinishWrite(pDisk);
8427 AssertRC(rc2);
8428 }
8429
8430 LogFlowFunc(("returns %Rrc\n", rc));
8431 return rc;
8432}
8433
8434/**
8435 * Closes the currently opened cache image file in HDD container.
8436 *
8437 * @return VBox status code.
8438 * @return VERR_VD_NOT_OPENED if no cache is opened in HDD container.
8439 * @param pDisk Pointer to HDD container.
8440 * @param fDelete If true, delete the image from the host disk.
8441 */
8442VBOXDDU_DECL(int) VDCacheClose(PVBOXHDD pDisk, bool fDelete)
8443{
8444 int rc = VINF_SUCCESS;
8445 int rc2;
8446 bool fLockWrite = false;
8447 PVDCACHE pCache = NULL;
8448
8449 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8450
8451 do
8452 {
8453 /* sanity check */
8454 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8455 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8456
8457 rc2 = vdThreadStartWrite(pDisk);
8458 AssertRC(rc2);
8459 fLockWrite = true;
8460
8461 AssertPtrBreakStmt(pDisk->pCache, rc = VERR_VD_CACHE_NOT_FOUND);
8462
8463 pCache = pDisk->pCache;
8464 pDisk->pCache = NULL;
8465
8466 pCache->Backend->pfnClose(pCache->pBackendData, fDelete);
8467 if (pCache->pszFilename)
8468 RTStrFree(pCache->pszFilename);
8469 RTMemFree(pCache);
8470 } while (0);
8471
8472 if (RT_LIKELY(fLockWrite))
8473 {
8474 rc2 = vdThreadFinishWrite(pDisk);
8475 AssertRC(rc2);
8476 }
8477
8478 LogFlowFunc(("returns %Rrc\n", rc));
8479 return rc;
8480}
8481
8482/**
8483 * Removes the last added filter in the HDD container.
8484 *
8485 * @return VBox status code.
8486 * @retval VERR_VD_NOT_OPENED if no filter is present for the disk.
8487 * @param pDisk Pointer to HDD container.
8488 */
8489VBOXDDU_DECL(int) VDFilterRemove(PVBOXHDD pDisk)
8490{
8491 int rc = VINF_SUCCESS;
8492 int rc2;
8493 bool fLockWrite = false;
8494 PVDFILTER pFilter = NULL;
8495
8496 LogFlowFunc(("pDisk=%#p\n", pDisk));
8497
8498 do
8499 {
8500 /* sanity check */
8501 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8502 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8503
8504 rc2 = vdThreadStartWrite(pDisk);
8505 AssertRC(rc2);
8506 fLockWrite = true;
8507
8508 AssertPtrBreakStmt(pDisk->pFilterHead, rc = VERR_VD_NOT_OPENED);
8509
8510 pFilter = pDisk->pFilterTail;
8511 vdRemoveFilterFromList(pDisk, pFilter);
8512
8513 pFilter->pBackend->pfnDestroy(pFilter->pvBackendData);
8514 RTMemFree(pFilter);
8515 } while (0);
8516
8517 if (RT_LIKELY(fLockWrite))
8518 {
8519 rc2 = vdThreadFinishWrite(pDisk);
8520 AssertRC(rc2);
8521 }
8522
8523 LogFlowFunc(("returns %Rrc\n", rc));
8524 return rc;
8525}
8526
8527/**
8528 * Closes all opened image files in HDD container.
8529 *
8530 * @returns VBox status code.
8531 * @param pDisk Pointer to HDD container.
8532 */
8533VBOXDDU_DECL(int) VDCloseAll(PVBOXHDD pDisk)
8534{
8535 int rc = VINF_SUCCESS;
8536 int rc2;
8537 bool fLockWrite = false;
8538
8539 LogFlowFunc(("pDisk=%#p\n", pDisk));
8540 do
8541 {
8542 /* sanity check */
8543 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8544 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8545
8546 /* Lock the entire operation. */
8547 rc2 = vdThreadStartWrite(pDisk);
8548 AssertRC(rc2);
8549 fLockWrite = true;
8550
8551 PVDCACHE pCache = pDisk->pCache;
8552 if (pCache)
8553 {
8554 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
8555 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8556 rc = rc2;
8557
8558 if (pCache->pszFilename)
8559 RTStrFree(pCache->pszFilename);
8560 RTMemFree(pCache);
8561 }
8562
8563 PVDIMAGE pImage = pDisk->pLast;
8564 while (VALID_PTR(pImage))
8565 {
8566 PVDIMAGE pPrev = pImage->pPrev;
8567 /* Remove image from list of opened images. */
8568 vdRemoveImageFromList(pDisk, pImage);
8569 /* Close image. */
8570 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
8571 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8572 rc = rc2;
8573 /* Free remaining resources related to the image. */
8574 RTStrFree(pImage->pszFilename);
8575 RTMemFree(pImage);
8576 pImage = pPrev;
8577 }
8578 Assert(!VALID_PTR(pDisk->pLast));
8579 } while (0);
8580
8581 if (RT_UNLIKELY(fLockWrite))
8582 {
8583 rc2 = vdThreadFinishWrite(pDisk);
8584 AssertRC(rc2);
8585 }
8586
8587 LogFlowFunc(("returns %Rrc\n", rc));
8588 return rc;
8589}
8590
8591/**
8592 * Removes all filters of the given HDD container.
8593 *
8594 * @return VBox status code.
8595 * @param pDisk Pointer to HDD container.
8596 */
8597VBOXDDU_DECL(int) VDFilterRemoveAll(PVBOXHDD pDisk)
8598{
8599 int rc = VINF_SUCCESS;
8600 int rc2;
8601 bool fLockWrite = false;
8602
8603 LogFlowFunc(("pDisk=%#p\n", pDisk));
8604 do
8605 {
8606 /* sanity check */
8607 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8608 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8609
8610 /* Lock the entire operation. */
8611 rc2 = vdThreadStartWrite(pDisk);
8612 AssertRC(rc2);
8613 fLockWrite = true;
8614
8615 PVDFILTER pFilter = pDisk->pFilterTail;
8616 while (VALID_PTR(pFilter))
8617 {
8618 PVDFILTER pPrev = pFilter->pPrev;
8619 vdRemoveFilterFromList(pDisk, pFilter);
8620
8621 rc2 = pFilter->pBackend->pfnDestroy(pFilter->pvBackendData);
8622 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8623 rc = rc2;
8624 /* Free remaining resources related to the image. */
8625 RTMemFree(pFilter);
8626 pFilter = pPrev;
8627 }
8628 Assert(!VALID_PTR(pDisk->pFilterTail));
8629 } while (0);
8630
8631 if (RT_UNLIKELY(fLockWrite))
8632 {
8633 rc2 = vdThreadFinishWrite(pDisk);
8634 AssertRC(rc2);
8635 }
8636
8637 LogFlowFunc(("returns %Rrc\n", rc));
8638 return rc;
8639}
8640
8641/**
8642 * Read data from virtual HDD.
8643 *
8644 * @returns VBox status code.
8645 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8646 * @param pDisk Pointer to HDD container.
8647 * @param uOffset Offset of first reading byte from start of disk.
8648 * @param pvBuf Pointer to buffer for reading data.
8649 * @param cbRead Number of bytes to read.
8650 */
8651VBOXDDU_DECL(int) VDRead(PVBOXHDD pDisk, uint64_t uOffset, void *pvBuf,
8652 size_t cbRead)
8653{
8654 int rc = VINF_SUCCESS;
8655 int rc2;
8656 bool fLockRead = false;
8657
8658 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbRead=%zu\n",
8659 pDisk, uOffset, pvBuf, cbRead));
8660 do
8661 {
8662 /* sanity check */
8663 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8664 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8665
8666 /* Check arguments. */
8667 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8668 ("pvBuf=%#p\n", pvBuf),
8669 rc = VERR_INVALID_PARAMETER);
8670 AssertMsgBreakStmt(cbRead,
8671 ("cbRead=%zu\n", cbRead),
8672 rc = VERR_INVALID_PARAMETER);
8673
8674 rc2 = vdThreadStartRead(pDisk);
8675 AssertRC(rc2);
8676 fLockRead = true;
8677
8678 PVDIMAGE pImage = pDisk->pLast;
8679 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8680
8681 if (uOffset + cbRead > pDisk->cbSize)
8682 {
8683 /* Floppy images might be smaller than the standard expected by
8684 the floppy controller code. So, we won't fail here. */
8685 AssertMsgBreakStmt(pDisk->enmType == VDTYPE_FLOPPY,
8686 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
8687 uOffset, cbRead, pDisk->cbSize),
8688 rc = VERR_EOF);
8689 memset(pvBuf, 0xf6, cbRead); /* f6h = format.com filler byte */
8690 if (uOffset >= pDisk->cbSize)
8691 break;
8692 cbRead = pDisk->cbSize - uOffset;
8693 }
8694
8695 rc = vdReadHelper(pDisk, pImage, uOffset, pvBuf, cbRead,
8696 true /* fUpdateCache */);
8697 } while (0);
8698
8699 if (RT_UNLIKELY(fLockRead))
8700 {
8701 rc2 = vdThreadFinishRead(pDisk);
8702 AssertRC(rc2);
8703 }
8704
8705 LogFlowFunc(("returns %Rrc\n", rc));
8706 return rc;
8707}
8708
8709/**
8710 * Write data to virtual HDD.
8711 *
8712 * @returns VBox status code.
8713 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8714 * @param pDisk Pointer to HDD container.
8715 * @param uOffset Offset of the first byte being
8716 * written from start of disk.
8717 * @param pvBuf Pointer to buffer for writing data.
8718 * @param cbWrite Number of bytes to write.
8719 */
8720VBOXDDU_DECL(int) VDWrite(PVBOXHDD pDisk, uint64_t uOffset, const void *pvBuf,
8721 size_t cbWrite)
8722{
8723 int rc = VINF_SUCCESS;
8724 int rc2;
8725 bool fLockWrite = false;
8726
8727 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbWrite=%zu\n",
8728 pDisk, uOffset, pvBuf, cbWrite));
8729 do
8730 {
8731 /* sanity check */
8732 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8733 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8734
8735 /* Check arguments. */
8736 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8737 ("pvBuf=%#p\n", pvBuf),
8738 rc = VERR_INVALID_PARAMETER);
8739 AssertMsgBreakStmt(cbWrite,
8740 ("cbWrite=%zu\n", cbWrite),
8741 rc = VERR_INVALID_PARAMETER);
8742
8743 rc2 = vdThreadStartWrite(pDisk);
8744 AssertRC(rc2);
8745 fLockWrite = true;
8746
8747 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
8748 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
8749 uOffset, cbWrite, pDisk->cbSize),
8750 rc = VERR_INVALID_PARAMETER);
8751
8752 PVDIMAGE pImage = pDisk->pLast;
8753 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8754
8755 vdSetModifiedFlag(pDisk);
8756 rc = vdWriteHelper(pDisk, pImage, uOffset, pvBuf, cbWrite,
8757 VDIOCTX_FLAGS_READ_UPDATE_CACHE);
8758 if (RT_FAILURE(rc))
8759 break;
8760
8761 /* If there is a merge (in the direction towards a parent) running
8762 * concurrently then we have to also "relay" the write to this parent,
8763 * as the merge position might be already past the position where
8764 * this write is going. The "context" of the write can come from the
8765 * natural chain, since merging either already did or will take care
8766 * of the "other" content which is might be needed to fill the block
8767 * to a full allocation size. The cache doesn't need to be touched
8768 * as this write is covered by the previous one. */
8769 if (RT_UNLIKELY(pDisk->pImageRelay))
8770 rc = vdWriteHelper(pDisk, pDisk->pImageRelay, uOffset,
8771 pvBuf, cbWrite, VDIOCTX_FLAGS_DEFAULT);
8772 } while (0);
8773
8774 if (RT_UNLIKELY(fLockWrite))
8775 {
8776 rc2 = vdThreadFinishWrite(pDisk);
8777 AssertRC(rc2);
8778 }
8779
8780 LogFlowFunc(("returns %Rrc\n", rc));
8781 return rc;
8782}
8783
8784/**
8785 * Make sure the on disk representation of a virtual HDD is up to date.
8786 *
8787 * @returns VBox status code.
8788 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8789 * @param pDisk Pointer to HDD container.
8790 */
8791VBOXDDU_DECL(int) VDFlush(PVBOXHDD pDisk)
8792{
8793 int rc = VINF_SUCCESS;
8794 int rc2;
8795 bool fLockWrite = false;
8796
8797 LogFlowFunc(("pDisk=%#p\n", pDisk));
8798 do
8799 {
8800 /* sanity check */
8801 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8802 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8803
8804 rc2 = vdThreadStartWrite(pDisk);
8805 AssertRC(rc2);
8806 fLockWrite = true;
8807
8808 PVDIMAGE pImage = pDisk->pLast;
8809 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8810
8811 VDIOCTX IoCtx;
8812 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
8813
8814 rc = RTSemEventCreate(&hEventComplete);
8815 if (RT_FAILURE(rc))
8816 break;
8817
8818 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, pImage, NULL,
8819 NULL, vdFlushHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
8820
8821 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
8822 IoCtx.Type.Root.pvUser1 = pDisk;
8823 IoCtx.Type.Root.pvUser2 = hEventComplete;
8824 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
8825
8826 RTSemEventDestroy(hEventComplete);
8827 } while (0);
8828
8829 if (RT_UNLIKELY(fLockWrite))
8830 {
8831 rc2 = vdThreadFinishWrite(pDisk);
8832 AssertRC(rc2);
8833 }
8834
8835 LogFlowFunc(("returns %Rrc\n", rc));
8836 return rc;
8837}
8838
8839/**
8840 * Get number of opened images in HDD container.
8841 *
8842 * @returns Number of opened images for HDD container. 0 if no images have been opened.
8843 * @param pDisk Pointer to HDD container.
8844 */
8845VBOXDDU_DECL(unsigned) VDGetCount(PVBOXHDD pDisk)
8846{
8847 unsigned cImages;
8848 int rc2;
8849 bool fLockRead = false;
8850
8851 LogFlowFunc(("pDisk=%#p\n", pDisk));
8852 do
8853 {
8854 /* sanity check */
8855 AssertPtrBreakStmt(pDisk, cImages = 0);
8856 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8857
8858 rc2 = vdThreadStartRead(pDisk);
8859 AssertRC(rc2);
8860 fLockRead = true;
8861
8862 cImages = pDisk->cImages;
8863 } while (0);
8864
8865 if (RT_UNLIKELY(fLockRead))
8866 {
8867 rc2 = vdThreadFinishRead(pDisk);
8868 AssertRC(rc2);
8869 }
8870
8871 LogFlowFunc(("returns %u\n", cImages));
8872 return cImages;
8873}
8874
8875/**
8876 * Get read/write mode of HDD container.
8877 *
8878 * @returns Virtual disk ReadOnly status.
8879 * @returns true if no image is opened in HDD container.
8880 * @param pDisk Pointer to HDD container.
8881 */
8882VBOXDDU_DECL(bool) VDIsReadOnly(PVBOXHDD pDisk)
8883{
8884 bool fReadOnly;
8885 int rc2;
8886 bool fLockRead = false;
8887
8888 LogFlowFunc(("pDisk=%#p\n", pDisk));
8889 do
8890 {
8891 /* sanity check */
8892 AssertPtrBreakStmt(pDisk, fReadOnly = false);
8893 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8894
8895 rc2 = vdThreadStartRead(pDisk);
8896 AssertRC(rc2);
8897 fLockRead = true;
8898
8899 PVDIMAGE pImage = pDisk->pLast;
8900 AssertPtrBreakStmt(pImage, fReadOnly = true);
8901
8902 unsigned uOpenFlags;
8903 uOpenFlags = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
8904 fReadOnly = !!(uOpenFlags & VD_OPEN_FLAGS_READONLY);
8905 } while (0);
8906
8907 if (RT_UNLIKELY(fLockRead))
8908 {
8909 rc2 = vdThreadFinishRead(pDisk);
8910 AssertRC(rc2);
8911 }
8912
8913 LogFlowFunc(("returns %d\n", fReadOnly));
8914 return fReadOnly;
8915}
8916
8917/**
8918 * Get sector size of an image in HDD container.
8919 *
8920 * @return Virtual disk sector size in bytes.
8921 * @return 0 if image with specified number was not opened.
8922 * @param pDisk Pointer to HDD container.
8923 * @param nImage Image number, counts from 0. 0 is always base image of container.
8924 */
8925VBOXDDU_DECL(uint32_t) VDGetSectorSize(PVBOXHDD pDisk, unsigned nImage)
8926{
8927 uint64_t cbSector;
8928 int rc2;
8929 bool fLockRead = false;
8930
8931 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8932 do
8933 {
8934 /* sanity check */
8935 AssertPtrBreakStmt(pDisk, cbSector = 0);
8936 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8937
8938 rc2 = vdThreadStartRead(pDisk);
8939 AssertRC(rc2);
8940 fLockRead = true;
8941
8942 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8943 AssertPtrBreakStmt(pImage, cbSector = 0);
8944 cbSector = pImage->Backend->pfnGetSectorSize(pImage->pBackendData);
8945 } while (0);
8946
8947 if (RT_UNLIKELY(fLockRead))
8948 {
8949 rc2 = vdThreadFinishRead(pDisk);
8950 AssertRC(rc2);
8951 }
8952
8953 LogFlowFunc(("returns %u\n", cbSector));
8954 return cbSector;
8955}
8956
8957/**
8958 * Get total capacity of an image in HDD container.
8959 *
8960 * @returns Virtual disk size in bytes.
8961 * @returns 0 if no image with specified number was not opened.
8962 * @param pDisk Pointer to HDD container.
8963 * @param nImage Image number, counts from 0. 0 is always base image of container.
8964 */
8965VBOXDDU_DECL(uint64_t) VDGetSize(PVBOXHDD pDisk, unsigned nImage)
8966{
8967 uint64_t cbSize;
8968 int rc2;
8969 bool fLockRead = false;
8970
8971 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8972 do
8973 {
8974 /* sanity check */
8975 AssertPtrBreakStmt(pDisk, cbSize = 0);
8976 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8977
8978 rc2 = vdThreadStartRead(pDisk);
8979 AssertRC(rc2);
8980 fLockRead = true;
8981
8982 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8983 AssertPtrBreakStmt(pImage, cbSize = 0);
8984 cbSize = pImage->Backend->pfnGetSize(pImage->pBackendData);
8985 } while (0);
8986
8987 if (RT_UNLIKELY(fLockRead))
8988 {
8989 rc2 = vdThreadFinishRead(pDisk);
8990 AssertRC(rc2);
8991 }
8992
8993 LogFlowFunc(("returns %llu\n", cbSize));
8994 return cbSize;
8995}
8996
8997/**
8998 * Get total file size of an image in HDD container.
8999 *
9000 * @returns Virtual disk size in bytes.
9001 * @returns 0 if no image is opened in HDD container.
9002 * @param pDisk Pointer to HDD container.
9003 * @param nImage Image number, counts from 0. 0 is always base image of container.
9004 */
9005VBOXDDU_DECL(uint64_t) VDGetFileSize(PVBOXHDD pDisk, unsigned nImage)
9006{
9007 uint64_t cbSize;
9008 int rc2;
9009 bool fLockRead = false;
9010
9011 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
9012 do
9013 {
9014 /* sanity check */
9015 AssertPtrBreakStmt(pDisk, cbSize = 0);
9016 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9017
9018 rc2 = vdThreadStartRead(pDisk);
9019 AssertRC(rc2);
9020 fLockRead = true;
9021
9022 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9023 AssertPtrBreakStmt(pImage, cbSize = 0);
9024 cbSize = pImage->Backend->pfnGetFileSize(pImage->pBackendData);
9025 } while (0);
9026
9027 if (RT_UNLIKELY(fLockRead))
9028 {
9029 rc2 = vdThreadFinishRead(pDisk);
9030 AssertRC(rc2);
9031 }
9032
9033 LogFlowFunc(("returns %llu\n", cbSize));
9034 return cbSize;
9035}
9036
9037/**
9038 * Get virtual disk PCHS geometry stored in HDD container.
9039 *
9040 * @returns VBox status code.
9041 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9042 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9043 * @param pDisk Pointer to HDD container.
9044 * @param nImage Image number, counts from 0. 0 is always base image of container.
9045 * @param pPCHSGeometry Where to store PCHS geometry. Not NULL.
9046 */
9047VBOXDDU_DECL(int) VDGetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
9048 PVDGEOMETRY pPCHSGeometry)
9049{
9050 int rc = VINF_SUCCESS;
9051 int rc2;
9052 bool fLockRead = false;
9053
9054 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p\n",
9055 pDisk, nImage, pPCHSGeometry));
9056 do
9057 {
9058 /* sanity check */
9059 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9060 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9061
9062 /* Check arguments. */
9063 AssertMsgBreakStmt(VALID_PTR(pPCHSGeometry),
9064 ("pPCHSGeometry=%#p\n", pPCHSGeometry),
9065 rc = VERR_INVALID_PARAMETER);
9066
9067 rc2 = vdThreadStartRead(pDisk);
9068 AssertRC(rc2);
9069 fLockRead = true;
9070
9071 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9072 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9073
9074 if (pImage == pDisk->pLast)
9075 {
9076 /* Use cached information if possible. */
9077 if (pDisk->PCHSGeometry.cCylinders != 0)
9078 *pPCHSGeometry = pDisk->PCHSGeometry;
9079 else
9080 rc = VERR_VD_GEOMETRY_NOT_SET;
9081 }
9082 else
9083 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
9084 pPCHSGeometry);
9085 } while (0);
9086
9087 if (RT_UNLIKELY(fLockRead))
9088 {
9089 rc2 = vdThreadFinishRead(pDisk);
9090 AssertRC(rc2);
9091 }
9092
9093 LogFlowFunc(("%Rrc (PCHS=%u/%u/%u)\n", rc,
9094 pDisk->PCHSGeometry.cCylinders, pDisk->PCHSGeometry.cHeads,
9095 pDisk->PCHSGeometry.cSectors));
9096 return rc;
9097}
9098
9099/**
9100 * Store virtual disk PCHS geometry in HDD container.
9101 *
9102 * Note that in case of unrecoverable error all images in HDD container will be closed.
9103 *
9104 * @returns VBox status code.
9105 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9106 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9107 * @param pDisk Pointer to HDD container.
9108 * @param nImage Image number, counts from 0. 0 is always base image of container.
9109 * @param pPCHSGeometry Where to load PCHS geometry from. Not NULL.
9110 */
9111VBOXDDU_DECL(int) VDSetPCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
9112 PCVDGEOMETRY pPCHSGeometry)
9113{
9114 int rc = VINF_SUCCESS;
9115 int rc2;
9116 bool fLockWrite = false;
9117
9118 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p PCHS=%u/%u/%u\n",
9119 pDisk, nImage, pPCHSGeometry, pPCHSGeometry->cCylinders,
9120 pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
9121 do
9122 {
9123 /* sanity check */
9124 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9125 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9126
9127 /* Check arguments. */
9128 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
9129 && pPCHSGeometry->cHeads <= 16
9130 && pPCHSGeometry->cSectors <= 63,
9131 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
9132 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
9133 pPCHSGeometry->cSectors),
9134 rc = VERR_INVALID_PARAMETER);
9135
9136 rc2 = vdThreadStartWrite(pDisk);
9137 AssertRC(rc2);
9138 fLockWrite = true;
9139
9140 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9141 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9142
9143 if (pImage == pDisk->pLast)
9144 {
9145 if ( pPCHSGeometry->cCylinders != pDisk->PCHSGeometry.cCylinders
9146 || pPCHSGeometry->cHeads != pDisk->PCHSGeometry.cHeads
9147 || pPCHSGeometry->cSectors != pDisk->PCHSGeometry.cSectors)
9148 {
9149 /* Only update geometry if it is changed. Avoids similar checks
9150 * in every backend. Most of the time the new geometry is set
9151 * to the previous values, so no need to go through the hassle
9152 * of updating an image which could be opened in read-only mode
9153 * right now. */
9154 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
9155 pPCHSGeometry);
9156
9157 /* Cache new geometry values in any case. */
9158 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
9159 &pDisk->PCHSGeometry);
9160 if (RT_FAILURE(rc2))
9161 {
9162 pDisk->PCHSGeometry.cCylinders = 0;
9163 pDisk->PCHSGeometry.cHeads = 0;
9164 pDisk->PCHSGeometry.cSectors = 0;
9165 }
9166 else
9167 {
9168 /* Make sure the CHS geometry is properly clipped. */
9169 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 255);
9170 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
9171 }
9172 }
9173 }
9174 else
9175 {
9176 VDGEOMETRY PCHS;
9177 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
9178 &PCHS);
9179 if ( RT_FAILURE(rc)
9180 || pPCHSGeometry->cCylinders != PCHS.cCylinders
9181 || pPCHSGeometry->cHeads != PCHS.cHeads
9182 || pPCHSGeometry->cSectors != PCHS.cSectors)
9183 {
9184 /* Only update geometry if it is changed. Avoids similar checks
9185 * in every backend. Most of the time the new geometry is set
9186 * to the previous values, so no need to go through the hassle
9187 * of updating an image which could be opened in read-only mode
9188 * right now. */
9189 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
9190 pPCHSGeometry);
9191 }
9192 }
9193 } while (0);
9194
9195 if (RT_UNLIKELY(fLockWrite))
9196 {
9197 rc2 = vdThreadFinishWrite(pDisk);
9198 AssertRC(rc2);
9199 }
9200
9201 LogFlowFunc(("returns %Rrc\n", rc));
9202 return rc;
9203}
9204
9205/**
9206 * Get virtual disk LCHS geometry stored in HDD container.
9207 *
9208 * @returns VBox status code.
9209 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9210 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9211 * @param pDisk Pointer to HDD container.
9212 * @param nImage Image number, counts from 0. 0 is always base image of container.
9213 * @param pLCHSGeometry Where to store LCHS geometry. Not NULL.
9214 */
9215VBOXDDU_DECL(int) VDGetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
9216 PVDGEOMETRY pLCHSGeometry)
9217{
9218 int rc = VINF_SUCCESS;
9219 int rc2;
9220 bool fLockRead = false;
9221
9222 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p\n",
9223 pDisk, nImage, pLCHSGeometry));
9224 do
9225 {
9226 /* sanity check */
9227 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9228 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9229
9230 /* Check arguments. */
9231 AssertMsgBreakStmt(VALID_PTR(pLCHSGeometry),
9232 ("pLCHSGeometry=%#p\n", pLCHSGeometry),
9233 rc = VERR_INVALID_PARAMETER);
9234
9235 rc2 = vdThreadStartRead(pDisk);
9236 AssertRC(rc2);
9237 fLockRead = true;
9238
9239 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9240 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9241
9242 if (pImage == pDisk->pLast)
9243 {
9244 /* Use cached information if possible. */
9245 if (pDisk->LCHSGeometry.cCylinders != 0)
9246 *pLCHSGeometry = pDisk->LCHSGeometry;
9247 else
9248 rc = VERR_VD_GEOMETRY_NOT_SET;
9249 }
9250 else
9251 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9252 pLCHSGeometry);
9253 } while (0);
9254
9255 if (RT_UNLIKELY(fLockRead))
9256 {
9257 rc2 = vdThreadFinishRead(pDisk);
9258 AssertRC(rc2);
9259 }
9260
9261 LogFlowFunc((": %Rrc (LCHS=%u/%u/%u)\n", rc,
9262 pDisk->LCHSGeometry.cCylinders, pDisk->LCHSGeometry.cHeads,
9263 pDisk->LCHSGeometry.cSectors));
9264 return rc;
9265}
9266
9267/**
9268 * Store virtual disk LCHS geometry in HDD container.
9269 *
9270 * Note that in case of unrecoverable error all images in HDD container will be closed.
9271 *
9272 * @returns VBox status code.
9273 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9274 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9275 * @param pDisk Pointer to HDD container.
9276 * @param nImage Image number, counts from 0. 0 is always base image of container.
9277 * @param pLCHSGeometry Where to load LCHS geometry from. Not NULL.
9278 */
9279VBOXDDU_DECL(int) VDSetLCHSGeometry(PVBOXHDD pDisk, unsigned nImage,
9280 PCVDGEOMETRY pLCHSGeometry)
9281{
9282 int rc = VINF_SUCCESS;
9283 int rc2;
9284 bool fLockWrite = false;
9285
9286 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p LCHS=%u/%u/%u\n",
9287 pDisk, nImage, pLCHSGeometry, pLCHSGeometry->cCylinders,
9288 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
9289 do
9290 {
9291 /* sanity check */
9292 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9293 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9294
9295 /* Check arguments. */
9296 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
9297 && pLCHSGeometry->cHeads <= 255
9298 && pLCHSGeometry->cSectors <= 63,
9299 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
9300 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
9301 pLCHSGeometry->cSectors),
9302 rc = VERR_INVALID_PARAMETER);
9303
9304 rc2 = vdThreadStartWrite(pDisk);
9305 AssertRC(rc2);
9306 fLockWrite = true;
9307
9308 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9309 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9310
9311 if (pImage == pDisk->pLast)
9312 {
9313 if ( pLCHSGeometry->cCylinders != pDisk->LCHSGeometry.cCylinders
9314 || pLCHSGeometry->cHeads != pDisk->LCHSGeometry.cHeads
9315 || pLCHSGeometry->cSectors != pDisk->LCHSGeometry.cSectors)
9316 {
9317 /* Only update geometry if it is changed. Avoids similar checks
9318 * in every backend. Most of the time the new geometry is set
9319 * to the previous values, so no need to go through the hassle
9320 * of updating an image which could be opened in read-only mode
9321 * right now. */
9322 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9323 pLCHSGeometry);
9324
9325 /* Cache new geometry values in any case. */
9326 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9327 &pDisk->LCHSGeometry);
9328 if (RT_FAILURE(rc2))
9329 {
9330 pDisk->LCHSGeometry.cCylinders = 0;
9331 pDisk->LCHSGeometry.cHeads = 0;
9332 pDisk->LCHSGeometry.cSectors = 0;
9333 }
9334 else
9335 {
9336 /* Make sure the CHS geometry is properly clipped. */
9337 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
9338 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
9339 }
9340 }
9341 }
9342 else
9343 {
9344 VDGEOMETRY LCHS;
9345 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9346 &LCHS);
9347 if ( RT_FAILURE(rc)
9348 || pLCHSGeometry->cCylinders != LCHS.cCylinders
9349 || pLCHSGeometry->cHeads != LCHS.cHeads
9350 || pLCHSGeometry->cSectors != LCHS.cSectors)
9351 {
9352 /* Only update geometry if it is changed. Avoids similar checks
9353 * in every backend. Most of the time the new geometry is set
9354 * to the previous values, so no need to go through the hassle
9355 * of updating an image which could be opened in read-only mode
9356 * right now. */
9357 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9358 pLCHSGeometry);
9359 }
9360 }
9361 } while (0);
9362
9363 if (RT_UNLIKELY(fLockWrite))
9364 {
9365 rc2 = vdThreadFinishWrite(pDisk);
9366 AssertRC(rc2);
9367 }
9368
9369 LogFlowFunc(("returns %Rrc\n", rc));
9370 return rc;
9371}
9372
9373/**
9374 * Get version of image in HDD container.
9375 *
9376 * @returns VBox status code.
9377 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9378 * @param pDisk Pointer to HDD container.
9379 * @param nImage Image number, counts from 0. 0 is always base image of container.
9380 * @param puVersion Where to store the image version.
9381 */
9382VBOXDDU_DECL(int) VDGetVersion(PVBOXHDD pDisk, unsigned nImage,
9383 unsigned *puVersion)
9384{
9385 int rc = VINF_SUCCESS;
9386 int rc2;
9387 bool fLockRead = false;
9388
9389 LogFlowFunc(("pDisk=%#p nImage=%u puVersion=%#p\n",
9390 pDisk, nImage, puVersion));
9391 do
9392 {
9393 /* sanity check */
9394 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9395 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9396
9397 /* Check arguments. */
9398 AssertMsgBreakStmt(VALID_PTR(puVersion),
9399 ("puVersion=%#p\n", puVersion),
9400 rc = VERR_INVALID_PARAMETER);
9401
9402 rc2 = vdThreadStartRead(pDisk);
9403 AssertRC(rc2);
9404 fLockRead = true;
9405
9406 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9407 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9408
9409 *puVersion = pImage->Backend->pfnGetVersion(pImage->pBackendData);
9410 } while (0);
9411
9412 if (RT_UNLIKELY(fLockRead))
9413 {
9414 rc2 = vdThreadFinishRead(pDisk);
9415 AssertRC(rc2);
9416 }
9417
9418 LogFlowFunc(("returns %Rrc uVersion=%#x\n", rc, *puVersion));
9419 return rc;
9420}
9421
9422/**
9423 * List the capabilities of image backend in HDD container.
9424 *
9425 * @returns VBox status code.
9426 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9427 * @param pDisk Pointer to the HDD container.
9428 * @param nImage Image number, counts from 0. 0 is always base image of container.
9429 * @param pbackendInfo Where to store the backend information.
9430 */
9431VBOXDDU_DECL(int) VDBackendInfoSingle(PVBOXHDD pDisk, unsigned nImage,
9432 PVDBACKENDINFO pBackendInfo)
9433{
9434 int rc = VINF_SUCCESS;
9435 int rc2;
9436 bool fLockRead = false;
9437
9438 LogFlowFunc(("pDisk=%#p nImage=%u pBackendInfo=%#p\n",
9439 pDisk, nImage, pBackendInfo));
9440 do
9441 {
9442 /* sanity check */
9443 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9444 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9445
9446 /* Check arguments. */
9447 AssertMsgBreakStmt(VALID_PTR(pBackendInfo),
9448 ("pBackendInfo=%#p\n", pBackendInfo),
9449 rc = VERR_INVALID_PARAMETER);
9450
9451 rc2 = vdThreadStartRead(pDisk);
9452 AssertRC(rc2);
9453 fLockRead = true;
9454
9455 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9456 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9457
9458 pBackendInfo->pszBackend = pImage->Backend->pszBackendName;
9459 pBackendInfo->uBackendCaps = pImage->Backend->uBackendCaps;
9460 pBackendInfo->paFileExtensions = pImage->Backend->paFileExtensions;
9461 pBackendInfo->paConfigInfo = pImage->Backend->paConfigInfo;
9462 } while (0);
9463
9464 if (RT_UNLIKELY(fLockRead))
9465 {
9466 rc2 = vdThreadFinishRead(pDisk);
9467 AssertRC(rc2);
9468 }
9469
9470 LogFlowFunc(("returns %Rrc\n", rc));
9471 return rc;
9472}
9473
9474/**
9475 * Get flags of image in HDD container.
9476 *
9477 * @returns VBox status code.
9478 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9479 * @param pDisk Pointer to HDD container.
9480 * @param nImage Image number, counts from 0. 0 is always base image of container.
9481 * @param puImageFlags Where to store the image flags.
9482 */
9483VBOXDDU_DECL(int) VDGetImageFlags(PVBOXHDD pDisk, unsigned nImage,
9484 unsigned *puImageFlags)
9485{
9486 int rc = VINF_SUCCESS;
9487 int rc2;
9488 bool fLockRead = false;
9489
9490 LogFlowFunc(("pDisk=%#p nImage=%u puImageFlags=%#p\n",
9491 pDisk, nImage, puImageFlags));
9492 do
9493 {
9494 /* sanity check */
9495 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9496 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9497
9498 /* Check arguments. */
9499 AssertMsgBreakStmt(VALID_PTR(puImageFlags),
9500 ("puImageFlags=%#p\n", puImageFlags),
9501 rc = VERR_INVALID_PARAMETER);
9502
9503 rc2 = vdThreadStartRead(pDisk);
9504 AssertRC(rc2);
9505 fLockRead = true;
9506
9507 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9508 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9509
9510 *puImageFlags = pImage->uImageFlags;
9511 } while (0);
9512
9513 if (RT_UNLIKELY(fLockRead))
9514 {
9515 rc2 = vdThreadFinishRead(pDisk);
9516 AssertRC(rc2);
9517 }
9518
9519 LogFlowFunc(("returns %Rrc uImageFlags=%#x\n", rc, *puImageFlags));
9520 return rc;
9521}
9522
9523/**
9524 * Get open flags of image in HDD container.
9525 *
9526 * @returns VBox status code.
9527 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9528 * @param pDisk Pointer to HDD container.
9529 * @param nImage Image number, counts from 0. 0 is always base image of container.
9530 * @param puOpenFlags Where to store the image open flags.
9531 */
9532VBOXDDU_DECL(int) VDGetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
9533 unsigned *puOpenFlags)
9534{
9535 int rc = VINF_SUCCESS;
9536 int rc2;
9537 bool fLockRead = false;
9538
9539 LogFlowFunc(("pDisk=%#p nImage=%u puOpenFlags=%#p\n",
9540 pDisk, nImage, puOpenFlags));
9541 do
9542 {
9543 /* sanity check */
9544 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9545 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9546
9547 /* Check arguments. */
9548 AssertMsgBreakStmt(VALID_PTR(puOpenFlags),
9549 ("puOpenFlags=%#p\n", puOpenFlags),
9550 rc = VERR_INVALID_PARAMETER);
9551
9552 rc2 = vdThreadStartRead(pDisk);
9553 AssertRC(rc2);
9554 fLockRead = true;
9555
9556 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9557 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9558
9559 *puOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
9560 } while (0);
9561
9562 if (RT_UNLIKELY(fLockRead))
9563 {
9564 rc2 = vdThreadFinishRead(pDisk);
9565 AssertRC(rc2);
9566 }
9567
9568 LogFlowFunc(("returns %Rrc uOpenFlags=%#x\n", rc, *puOpenFlags));
9569 return rc;
9570}
9571
9572/**
9573 * Set open flags of image in HDD container.
9574 * This operation may cause file locking changes and/or files being reopened.
9575 * Note that in case of unrecoverable error all images in HDD container will be closed.
9576 *
9577 * @returns VBox status code.
9578 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9579 * @param pDisk Pointer to HDD container.
9580 * @param nImage Image number, counts from 0. 0 is always base image of container.
9581 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
9582 */
9583VBOXDDU_DECL(int) VDSetOpenFlags(PVBOXHDD pDisk, unsigned nImage,
9584 unsigned uOpenFlags)
9585{
9586 int rc;
9587 int rc2;
9588 bool fLockWrite = false;
9589
9590 LogFlowFunc(("pDisk=%#p uOpenFlags=%#u\n", pDisk, uOpenFlags));
9591 do
9592 {
9593 /* sanity check */
9594 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9595 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9596
9597 /* Check arguments. */
9598 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
9599 ("uOpenFlags=%#x\n", uOpenFlags),
9600 rc = VERR_INVALID_PARAMETER);
9601
9602 rc2 = vdThreadStartWrite(pDisk);
9603 AssertRC(rc2);
9604 fLockWrite = true;
9605
9606 /* Destroy any discard state because the image might be changed to readonly mode. */
9607 rc = vdDiscardStateDestroy(pDisk);
9608 if (RT_FAILURE(rc))
9609 break;
9610
9611 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9612 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9613
9614 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData,
9615 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS));
9616 if (RT_SUCCESS(rc))
9617 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
9618 } while (0);
9619
9620 if (RT_UNLIKELY(fLockWrite))
9621 {
9622 rc2 = vdThreadFinishWrite(pDisk);
9623 AssertRC(rc2);
9624 }
9625
9626 LogFlowFunc(("returns %Rrc\n", rc));
9627 return rc;
9628}
9629
9630/**
9631 * Get base filename of image in HDD container. Some image formats use
9632 * other filenames as well, so don't use this for anything but informational
9633 * purposes.
9634 *
9635 * @returns VBox status code.
9636 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9637 * @returns VERR_BUFFER_OVERFLOW if pszFilename buffer too small to hold filename.
9638 * @param pDisk Pointer to HDD container.
9639 * @param nImage Image number, counts from 0. 0 is always base image of container.
9640 * @param pszFilename Where to store the image file name.
9641 * @param cbFilename Size of buffer pszFilename points to.
9642 */
9643VBOXDDU_DECL(int) VDGetFilename(PVBOXHDD pDisk, unsigned nImage,
9644 char *pszFilename, unsigned cbFilename)
9645{
9646 int rc;
9647 int rc2;
9648 bool fLockRead = false;
9649
9650 LogFlowFunc(("pDisk=%#p nImage=%u pszFilename=%#p cbFilename=%u\n",
9651 pDisk, nImage, pszFilename, cbFilename));
9652 do
9653 {
9654 /* sanity check */
9655 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9656 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9657
9658 /* Check arguments. */
9659 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
9660 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
9661 rc = VERR_INVALID_PARAMETER);
9662 AssertMsgBreakStmt(cbFilename,
9663 ("cbFilename=%u\n", cbFilename),
9664 rc = VERR_INVALID_PARAMETER);
9665
9666 rc2 = vdThreadStartRead(pDisk);
9667 AssertRC(rc2);
9668 fLockRead = true;
9669
9670 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9671 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9672
9673 size_t cb = strlen(pImage->pszFilename);
9674 if (cb <= cbFilename)
9675 {
9676 strcpy(pszFilename, pImage->pszFilename);
9677 rc = VINF_SUCCESS;
9678 }
9679 else
9680 {
9681 strncpy(pszFilename, pImage->pszFilename, cbFilename - 1);
9682 pszFilename[cbFilename - 1] = '\0';
9683 rc = VERR_BUFFER_OVERFLOW;
9684 }
9685 } while (0);
9686
9687 if (RT_UNLIKELY(fLockRead))
9688 {
9689 rc2 = vdThreadFinishRead(pDisk);
9690 AssertRC(rc2);
9691 }
9692
9693 LogFlowFunc(("returns %Rrc, pszFilename=\"%s\"\n", rc, pszFilename));
9694 return rc;
9695}
9696
9697/**
9698 * Get the comment line of image in HDD container.
9699 *
9700 * @returns VBox status code.
9701 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9702 * @returns VERR_BUFFER_OVERFLOW if pszComment buffer too small to hold comment text.
9703 * @param pDisk Pointer to HDD container.
9704 * @param nImage Image number, counts from 0. 0 is always base image of container.
9705 * @param pszComment Where to store the comment string of image. NULL is ok.
9706 * @param cbComment The size of pszComment buffer. 0 is ok.
9707 */
9708VBOXDDU_DECL(int) VDGetComment(PVBOXHDD pDisk, unsigned nImage,
9709 char *pszComment, unsigned cbComment)
9710{
9711 int rc;
9712 int rc2;
9713 bool fLockRead = false;
9714
9715 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p cbComment=%u\n",
9716 pDisk, nImage, pszComment, cbComment));
9717 do
9718 {
9719 /* sanity check */
9720 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9721 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9722
9723 /* Check arguments. */
9724 AssertMsgBreakStmt(VALID_PTR(pszComment),
9725 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9726 rc = VERR_INVALID_PARAMETER);
9727 AssertMsgBreakStmt(cbComment,
9728 ("cbComment=%u\n", cbComment),
9729 rc = VERR_INVALID_PARAMETER);
9730
9731 rc2 = vdThreadStartRead(pDisk);
9732 AssertRC(rc2);
9733 fLockRead = true;
9734
9735 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9736 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9737
9738 rc = pImage->Backend->pfnGetComment(pImage->pBackendData, pszComment,
9739 cbComment);
9740 } while (0);
9741
9742 if (RT_UNLIKELY(fLockRead))
9743 {
9744 rc2 = vdThreadFinishRead(pDisk);
9745 AssertRC(rc2);
9746 }
9747
9748 LogFlowFunc(("returns %Rrc, pszComment=\"%s\"\n", rc, pszComment));
9749 return rc;
9750}
9751
9752/**
9753 * Changes the comment line of image in HDD container.
9754 *
9755 * @returns VBox status code.
9756 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9757 * @param pDisk Pointer to HDD container.
9758 * @param nImage Image number, counts from 0. 0 is always base image of container.
9759 * @param pszComment New comment string (UTF-8). NULL is allowed to reset the comment.
9760 */
9761VBOXDDU_DECL(int) VDSetComment(PVBOXHDD pDisk, unsigned nImage,
9762 const char *pszComment)
9763{
9764 int rc;
9765 int rc2;
9766 bool fLockWrite = false;
9767
9768 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p \"%s\"\n",
9769 pDisk, nImage, pszComment, pszComment));
9770 do
9771 {
9772 /* sanity check */
9773 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9774 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9775
9776 /* Check arguments. */
9777 AssertMsgBreakStmt(VALID_PTR(pszComment) || pszComment == NULL,
9778 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9779 rc = VERR_INVALID_PARAMETER);
9780
9781 rc2 = vdThreadStartWrite(pDisk);
9782 AssertRC(rc2);
9783 fLockWrite = true;
9784
9785 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9786 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9787
9788 rc = pImage->Backend->pfnSetComment(pImage->pBackendData, pszComment);
9789 } while (0);
9790
9791 if (RT_UNLIKELY(fLockWrite))
9792 {
9793 rc2 = vdThreadFinishWrite(pDisk);
9794 AssertRC(rc2);
9795 }
9796
9797 LogFlowFunc(("returns %Rrc\n", rc));
9798 return rc;
9799}
9800
9801
9802/**
9803 * Get UUID of image in HDD container.
9804 *
9805 * @returns VBox status code.
9806 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9807 * @param pDisk Pointer to HDD container.
9808 * @param nImage Image number, counts from 0. 0 is always base image of container.
9809 * @param pUuid Where to store the image creation UUID.
9810 */
9811VBOXDDU_DECL(int) VDGetUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9812{
9813 int rc;
9814 int rc2;
9815 bool fLockRead = false;
9816
9817 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9818 do
9819 {
9820 /* sanity check */
9821 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9822 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9823
9824 /* Check arguments. */
9825 AssertMsgBreakStmt(VALID_PTR(pUuid),
9826 ("pUuid=%#p\n", pUuid),
9827 rc = VERR_INVALID_PARAMETER);
9828
9829 rc2 = vdThreadStartRead(pDisk);
9830 AssertRC(rc2);
9831 fLockRead = true;
9832
9833 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9834 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9835
9836 rc = pImage->Backend->pfnGetUuid(pImage->pBackendData, pUuid);
9837 } while (0);
9838
9839 if (RT_UNLIKELY(fLockRead))
9840 {
9841 rc2 = vdThreadFinishRead(pDisk);
9842 AssertRC(rc2);
9843 }
9844
9845 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9846 return rc;
9847}
9848
9849/**
9850 * Set the image's UUID. Should not be used by normal applications.
9851 *
9852 * @returns VBox status code.
9853 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9854 * @param pDisk Pointer to HDD container.
9855 * @param nImage Image number, counts from 0. 0 is always base image of container.
9856 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
9857 */
9858VBOXDDU_DECL(int) VDSetUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9859{
9860 int rc;
9861 int rc2;
9862 bool fLockWrite = false;
9863
9864 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9865 pDisk, nImage, pUuid, pUuid));
9866 do
9867 {
9868 /* sanity check */
9869 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9870 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9871
9872 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9873 ("pUuid=%#p\n", pUuid),
9874 rc = VERR_INVALID_PARAMETER);
9875
9876 rc2 = vdThreadStartWrite(pDisk);
9877 AssertRC(rc2);
9878 fLockWrite = true;
9879
9880 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9881 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9882
9883 RTUUID Uuid;
9884 if (!pUuid)
9885 {
9886 RTUuidCreate(&Uuid);
9887 pUuid = &Uuid;
9888 }
9889 rc = pImage->Backend->pfnSetUuid(pImage->pBackendData, pUuid);
9890 } while (0);
9891
9892 if (RT_UNLIKELY(fLockWrite))
9893 {
9894 rc2 = vdThreadFinishWrite(pDisk);
9895 AssertRC(rc2);
9896 }
9897
9898 LogFlowFunc(("returns %Rrc\n", rc));
9899 return rc;
9900}
9901
9902/**
9903 * Get last modification UUID of image in HDD container.
9904 *
9905 * @returns VBox status code.
9906 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9907 * @param pDisk Pointer to HDD container.
9908 * @param nImage Image number, counts from 0. 0 is always base image of container.
9909 * @param pUuid Where to store the image modification UUID.
9910 */
9911VBOXDDU_DECL(int) VDGetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PRTUUID pUuid)
9912{
9913 int rc = VINF_SUCCESS;
9914 int rc2;
9915 bool fLockRead = false;
9916
9917 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9918 do
9919 {
9920 /* sanity check */
9921 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9922 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9923
9924 /* Check arguments. */
9925 AssertMsgBreakStmt(VALID_PTR(pUuid),
9926 ("pUuid=%#p\n", pUuid),
9927 rc = VERR_INVALID_PARAMETER);
9928
9929 rc2 = vdThreadStartRead(pDisk);
9930 AssertRC(rc2);
9931 fLockRead = true;
9932
9933 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9934 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9935
9936 rc = pImage->Backend->pfnGetModificationUuid(pImage->pBackendData,
9937 pUuid);
9938 } while (0);
9939
9940 if (RT_UNLIKELY(fLockRead))
9941 {
9942 rc2 = vdThreadFinishRead(pDisk);
9943 AssertRC(rc2);
9944 }
9945
9946 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9947 return rc;
9948}
9949
9950/**
9951 * Set the image's last modification UUID. Should not be used by normal applications.
9952 *
9953 * @returns VBox status code.
9954 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9955 * @param pDisk Pointer to HDD container.
9956 * @param nImage Image number, counts from 0. 0 is always base image of container.
9957 * @param pUuid New modification UUID of the image. If NULL, a new UUID is created.
9958 */
9959VBOXDDU_DECL(int) VDSetModificationUuid(PVBOXHDD pDisk, unsigned nImage, PCRTUUID pUuid)
9960{
9961 int rc;
9962 int rc2;
9963 bool fLockWrite = false;
9964
9965 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9966 pDisk, nImage, pUuid, pUuid));
9967 do
9968 {
9969 /* sanity check */
9970 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9971 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9972
9973 /* Check arguments. */
9974 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9975 ("pUuid=%#p\n", pUuid),
9976 rc = VERR_INVALID_PARAMETER);
9977
9978 rc2 = vdThreadStartWrite(pDisk);
9979 AssertRC(rc2);
9980 fLockWrite = true;
9981
9982 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9983 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9984
9985 RTUUID Uuid;
9986 if (!pUuid)
9987 {
9988 RTUuidCreate(&Uuid);
9989 pUuid = &Uuid;
9990 }
9991 rc = pImage->Backend->pfnSetModificationUuid(pImage->pBackendData,
9992 pUuid);
9993 } while (0);
9994
9995 if (RT_UNLIKELY(fLockWrite))
9996 {
9997 rc2 = vdThreadFinishWrite(pDisk);
9998 AssertRC(rc2);
9999 }
10000
10001 LogFlowFunc(("returns %Rrc\n", rc));
10002 return rc;
10003}
10004
10005/**
10006 * Get parent UUID of image in HDD container.
10007 *
10008 * @returns VBox status code.
10009 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
10010 * @param pDisk Pointer to HDD container.
10011 * @param nImage Image number, counts from 0. 0 is always base image of container.
10012 * @param pUuid Where to store the parent image UUID.
10013 */
10014VBOXDDU_DECL(int) VDGetParentUuid(PVBOXHDD pDisk, unsigned nImage,
10015 PRTUUID pUuid)
10016{
10017 int rc = VINF_SUCCESS;
10018 int rc2;
10019 bool fLockRead = false;
10020
10021 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
10022 do
10023 {
10024 /* sanity check */
10025 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10026 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10027
10028 /* Check arguments. */
10029 AssertMsgBreakStmt(VALID_PTR(pUuid),
10030 ("pUuid=%#p\n", pUuid),
10031 rc = VERR_INVALID_PARAMETER);
10032
10033 rc2 = vdThreadStartRead(pDisk);
10034 AssertRC(rc2);
10035 fLockRead = true;
10036
10037 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
10038 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
10039
10040 rc = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, pUuid);
10041 } while (0);
10042
10043 if (RT_UNLIKELY(fLockRead))
10044 {
10045 rc2 = vdThreadFinishRead(pDisk);
10046 AssertRC(rc2);
10047 }
10048
10049 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
10050 return rc;
10051}
10052
10053/**
10054 * Set the image's parent UUID. Should not be used by normal applications.
10055 *
10056 * @returns VBox status code.
10057 * @param pDisk Pointer to HDD container.
10058 * @param nImage Image number, counts from 0. 0 is always base image of container.
10059 * @param pUuid New parent UUID of the image. If NULL, a new UUID is created.
10060 */
10061VBOXDDU_DECL(int) VDSetParentUuid(PVBOXHDD pDisk, unsigned nImage,
10062 PCRTUUID pUuid)
10063{
10064 int rc;
10065 int rc2;
10066 bool fLockWrite = false;
10067
10068 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
10069 pDisk, nImage, pUuid, pUuid));
10070 do
10071 {
10072 /* sanity check */
10073 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10074 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10075
10076 /* Check arguments. */
10077 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
10078 ("pUuid=%#p\n", pUuid),
10079 rc = VERR_INVALID_PARAMETER);
10080
10081 rc2 = vdThreadStartWrite(pDisk);
10082 AssertRC(rc2);
10083 fLockWrite = true;
10084
10085 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
10086 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
10087
10088 RTUUID Uuid;
10089 if (!pUuid)
10090 {
10091 RTUuidCreate(&Uuid);
10092 pUuid = &Uuid;
10093 }
10094 rc = pImage->Backend->pfnSetParentUuid(pImage->pBackendData, pUuid);
10095 } while (0);
10096
10097 if (RT_UNLIKELY(fLockWrite))
10098 {
10099 rc2 = vdThreadFinishWrite(pDisk);
10100 AssertRC(rc2);
10101 }
10102
10103 LogFlowFunc(("returns %Rrc\n", rc));
10104 return rc;
10105}
10106
10107
10108/**
10109 * Debug helper - dumps all opened images in HDD container into the log file.
10110 *
10111 * @param pDisk Pointer to HDD container.
10112 */
10113VBOXDDU_DECL(void) VDDumpImages(PVBOXHDD pDisk)
10114{
10115 int rc2;
10116 bool fLockRead = false;
10117
10118 do
10119 {
10120 /* sanity check */
10121 AssertPtrBreak(pDisk);
10122 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10123
10124 if (!pDisk->pInterfaceError || !VALID_PTR(pDisk->pInterfaceError->pfnMessage))
10125 pDisk->pInterfaceError->pfnMessage = vdLogMessage;
10126
10127 rc2 = vdThreadStartRead(pDisk);
10128 AssertRC(rc2);
10129 fLockRead = true;
10130
10131 vdMessageWrapper(pDisk, "--- Dumping VD Disk, Images=%u\n", pDisk->cImages);
10132 for (PVDIMAGE pImage = pDisk->pBase; pImage; pImage = pImage->pNext)
10133 {
10134 vdMessageWrapper(pDisk, "Dumping VD image \"%s\" (Backend=%s)\n",
10135 pImage->pszFilename, pImage->Backend->pszBackendName);
10136 pImage->Backend->pfnDump(pImage->pBackendData);
10137 }
10138 } while (0);
10139
10140 if (RT_UNLIKELY(fLockRead))
10141 {
10142 rc2 = vdThreadFinishRead(pDisk);
10143 AssertRC(rc2);
10144 }
10145}
10146
10147
10148VBOXDDU_DECL(int) VDDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges)
10149{
10150 int rc;
10151 int rc2;
10152 bool fLockWrite = false;
10153
10154 LogFlowFunc(("pDisk=%#p paRanges=%#p cRanges=%u\n",
10155 pDisk, paRanges, cRanges));
10156 do
10157 {
10158 /* sanity check */
10159 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10160 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10161
10162 /* Check arguments. */
10163 AssertMsgBreakStmt(cRanges,
10164 ("cRanges=%u\n", cRanges),
10165 rc = VERR_INVALID_PARAMETER);
10166 AssertMsgBreakStmt(VALID_PTR(paRanges),
10167 ("paRanges=%#p\n", paRanges),
10168 rc = VERR_INVALID_PARAMETER);
10169
10170 rc2 = vdThreadStartWrite(pDisk);
10171 AssertRC(rc2);
10172 fLockWrite = true;
10173
10174 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10175
10176 AssertMsgBreakStmt(pDisk->pLast->uOpenFlags & VD_OPEN_FLAGS_DISCARD,
10177 ("Discarding not supported\n"),
10178 rc = VERR_NOT_SUPPORTED);
10179
10180 VDIOCTX IoCtx;
10181 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
10182
10183 rc = RTSemEventCreate(&hEventComplete);
10184 if (RT_FAILURE(rc))
10185 break;
10186
10187 vdIoCtxDiscardInit(&IoCtx, pDisk, paRanges, cRanges,
10188 vdIoCtxSyncComplete, pDisk, hEventComplete, NULL,
10189 vdDiscardHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
10190 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
10191
10192 RTSemEventDestroy(hEventComplete);
10193 } while (0);
10194
10195 if (RT_UNLIKELY(fLockWrite))
10196 {
10197 rc2 = vdThreadFinishWrite(pDisk);
10198 AssertRC(rc2);
10199 }
10200
10201 LogFlowFunc(("returns %Rrc\n", rc));
10202 return rc;
10203}
10204
10205
10206VBOXDDU_DECL(int) VDAsyncRead(PVBOXHDD pDisk, uint64_t uOffset, size_t cbRead,
10207 PCRTSGBUF pcSgBuf,
10208 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10209 void *pvUser1, void *pvUser2)
10210{
10211 int rc = VERR_VD_BLOCK_FREE;
10212 int rc2;
10213 bool fLockRead = false;
10214 PVDIOCTX pIoCtx = NULL;
10215
10216 LogFlowFunc(("pDisk=%#p uOffset=%llu pcSgBuf=%#p cbRead=%zu pvUser1=%#p pvUser2=%#p\n",
10217 pDisk, uOffset, pcSgBuf, cbRead, pvUser1, pvUser2));
10218
10219 do
10220 {
10221 /* sanity check */
10222 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10223 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10224
10225 /* Check arguments. */
10226 AssertMsgBreakStmt(cbRead,
10227 ("cbRead=%zu\n", cbRead),
10228 rc = VERR_INVALID_PARAMETER);
10229 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
10230 ("pcSgBuf=%#p\n", pcSgBuf),
10231 rc = VERR_INVALID_PARAMETER);
10232
10233 rc2 = vdThreadStartRead(pDisk);
10234 AssertRC(rc2);
10235 fLockRead = true;
10236
10237 AssertMsgBreakStmt(uOffset + cbRead <= pDisk->cbSize,
10238 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
10239 uOffset, cbRead, pDisk->cbSize),
10240 rc = VERR_INVALID_PARAMETER);
10241 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10242
10243 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_READ, uOffset,
10244 cbRead, pDisk->pLast, pcSgBuf,
10245 pfnComplete, pvUser1, pvUser2,
10246 NULL, vdReadHelperAsync,
10247 VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
10248 if (!pIoCtx)
10249 {
10250 rc = VERR_NO_MEMORY;
10251 break;
10252 }
10253
10254 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10255 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10256 {
10257 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10258 vdIoCtxFree(pDisk, pIoCtx);
10259 else
10260 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10261 }
10262 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10263 vdIoCtxFree(pDisk, pIoCtx);
10264
10265 } while (0);
10266
10267 if (RT_UNLIKELY(fLockRead) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10268 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10269 {
10270 rc2 = vdThreadFinishRead(pDisk);
10271 AssertRC(rc2);
10272 }
10273
10274 LogFlowFunc(("returns %Rrc\n", rc));
10275 return rc;
10276}
10277
10278
10279VBOXDDU_DECL(int) VDAsyncWrite(PVBOXHDD pDisk, uint64_t uOffset, size_t cbWrite,
10280 PCRTSGBUF pcSgBuf,
10281 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10282 void *pvUser1, void *pvUser2)
10283{
10284 int rc;
10285 int rc2;
10286 bool fLockWrite = false;
10287 PVDIOCTX pIoCtx = NULL;
10288
10289 LogFlowFunc(("pDisk=%#p uOffset=%llu cSgBuf=%#p cbWrite=%zu pvUser1=%#p pvUser2=%#p\n",
10290 pDisk, uOffset, pcSgBuf, cbWrite, pvUser1, pvUser2));
10291 do
10292 {
10293 /* sanity check */
10294 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10295 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10296
10297 /* Check arguments. */
10298 AssertMsgBreakStmt(cbWrite,
10299 ("cbWrite=%zu\n", cbWrite),
10300 rc = VERR_INVALID_PARAMETER);
10301 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
10302 ("pcSgBuf=%#p\n", pcSgBuf),
10303 rc = VERR_INVALID_PARAMETER);
10304
10305 rc2 = vdThreadStartWrite(pDisk);
10306 AssertRC(rc2);
10307 fLockWrite = true;
10308
10309 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
10310 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
10311 uOffset, cbWrite, pDisk->cbSize),
10312 rc = VERR_INVALID_PARAMETER);
10313 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10314
10315 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_WRITE, uOffset,
10316 cbWrite, pDisk->pLast, pcSgBuf,
10317 pfnComplete, pvUser1, pvUser2,
10318 NULL, vdWriteHelperAsync,
10319 VDIOCTX_FLAGS_DEFAULT);
10320 if (!pIoCtx)
10321 {
10322 rc = VERR_NO_MEMORY;
10323 break;
10324 }
10325
10326 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10327 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10328 {
10329 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10330 vdIoCtxFree(pDisk, pIoCtx);
10331 else
10332 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10333 }
10334 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10335 vdIoCtxFree(pDisk, pIoCtx);
10336 } while (0);
10337
10338 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10339 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10340 {
10341 rc2 = vdThreadFinishWrite(pDisk);
10342 AssertRC(rc2);
10343 }
10344
10345 LogFlowFunc(("returns %Rrc\n", rc));
10346 return rc;
10347}
10348
10349
10350VBOXDDU_DECL(int) VDAsyncFlush(PVBOXHDD pDisk, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10351 void *pvUser1, void *pvUser2)
10352{
10353 int rc;
10354 int rc2;
10355 bool fLockWrite = false;
10356 PVDIOCTX pIoCtx = NULL;
10357
10358 LogFlowFunc(("pDisk=%#p\n", pDisk));
10359
10360 do
10361 {
10362 /* sanity check */
10363 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10364 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10365
10366 rc2 = vdThreadStartWrite(pDisk);
10367 AssertRC(rc2);
10368 fLockWrite = true;
10369
10370 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10371
10372 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_FLUSH, 0,
10373 0, pDisk->pLast, NULL,
10374 pfnComplete, pvUser1, pvUser2,
10375 NULL, vdFlushHelperAsync,
10376 VDIOCTX_FLAGS_DEFAULT);
10377 if (!pIoCtx)
10378 {
10379 rc = VERR_NO_MEMORY;
10380 break;
10381 }
10382
10383 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10384 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10385 {
10386 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10387 vdIoCtxFree(pDisk, pIoCtx);
10388 else
10389 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10390 }
10391 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10392 vdIoCtxFree(pDisk, pIoCtx);
10393 } while (0);
10394
10395 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10396 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10397 {
10398 rc2 = vdThreadFinishWrite(pDisk);
10399 AssertRC(rc2);
10400 }
10401
10402 LogFlowFunc(("returns %Rrc\n", rc));
10403 return rc;
10404}
10405
10406VBOXDDU_DECL(int) VDAsyncDiscardRanges(PVBOXHDD pDisk, PCRTRANGE paRanges, unsigned cRanges,
10407 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10408 void *pvUser1, void *pvUser2)
10409{
10410 int rc;
10411 int rc2;
10412 bool fLockWrite = false;
10413 PVDIOCTX pIoCtx = NULL;
10414
10415 LogFlowFunc(("pDisk=%#p\n", pDisk));
10416
10417 do
10418 {
10419 /* sanity check */
10420 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10421 AssertMsg(pDisk->u32Signature == VBOXHDDDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10422
10423 rc2 = vdThreadStartWrite(pDisk);
10424 AssertRC(rc2);
10425 fLockWrite = true;
10426
10427 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10428
10429 pIoCtx = vdIoCtxDiscardAlloc(pDisk, paRanges, cRanges,
10430 pfnComplete, pvUser1, pvUser2, NULL,
10431 vdDiscardHelperAsync,
10432 VDIOCTX_FLAGS_DEFAULT);
10433 if (!pIoCtx)
10434 {
10435 rc = VERR_NO_MEMORY;
10436 break;
10437 }
10438
10439 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10440 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10441 {
10442 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10443 vdIoCtxFree(pDisk, pIoCtx);
10444 else
10445 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10446 }
10447 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10448 vdIoCtxFree(pDisk, pIoCtx);
10449 } while (0);
10450
10451 if (RT_UNLIKELY(fLockWrite) && ( rc == VINF_VD_ASYNC_IO_FINISHED
10452 || rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10453 {
10454 rc2 = vdThreadFinishWrite(pDisk);
10455 AssertRC(rc2);
10456 }
10457
10458 LogFlowFunc(("returns %Rrc\n", rc));
10459 return rc;
10460}
10461
10462VBOXDDU_DECL(int) VDRepair(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
10463 const char *pszFilename, const char *pszBackend,
10464 uint32_t fFlags)
10465{
10466 int rc = VERR_NOT_SUPPORTED;
10467 PCVBOXHDDBACKEND pBackend = NULL;
10468 VDINTERFACEIOINT VDIfIoInt;
10469 VDINTERFACEIO VDIfIoFallback;
10470 PVDINTERFACEIO pInterfaceIo;
10471
10472 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
10473 /* Check arguments. */
10474 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
10475 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
10476 VERR_INVALID_PARAMETER);
10477 AssertMsgReturn(VALID_PTR(pszBackend),
10478 ("pszBackend=%#p\n", pszBackend),
10479 VERR_INVALID_PARAMETER);
10480 AssertMsgReturn((fFlags & ~VD_REPAIR_FLAGS_MASK) == 0,
10481 ("fFlags=%#x\n", fFlags),
10482 VERR_INVALID_PARAMETER);
10483
10484 pInterfaceIo = VDIfIoGet(pVDIfsImage);
10485 if (!pInterfaceIo)
10486 {
10487 /*
10488 * Caller doesn't provide an I/O interface, create our own using the
10489 * native file API.
10490 */
10491 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
10492 pInterfaceIo = &VDIfIoFallback;
10493 }
10494
10495 /* Set up the internal I/O interface. */
10496 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
10497 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
10498 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
10499 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
10500 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
10501 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
10502 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
10503 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
10504 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
10505 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
10506 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
10507 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
10508 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
10509 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
10510 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
10511 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
10512 AssertRC(rc);
10513
10514 rc = vdFindBackend(pszBackend, &pBackend);
10515 if (RT_SUCCESS(rc))
10516 {
10517 if (pBackend->pfnRepair)
10518 rc = pBackend->pfnRepair(pszFilename, pVDIfsDisk, pVDIfsImage, fFlags);
10519 else
10520 rc = VERR_VD_IMAGE_REPAIR_NOT_SUPPORTED;
10521 }
10522
10523 LogFlowFunc(("returns %Rrc\n", rc));
10524 return rc;
10525}
10526
Note: See TracBrowser for help on using the repository browser.

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette