VirtualBox

source: vbox/trunk/src/VBox/Storage/VD.cpp@ 68181

Last change on this file since 68181 was 67464, checked in by vboxsync, 8 years ago

VD.cpp: VDGetFormat: Here be dragons. Killed the one named VERR_EOF, but can imagine a there are a lot more lurking around...

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 375.4 KB
Line 
1/* $Id: VD.cpp 67464 2017-06-19 10:08:36Z vboxsync $ */
2/** @file
3 * VD - Virtual disk container implementation.
4 */
5
6/*
7 * Copyright (C) 2006-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header Files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_VD
23#include <VBox/vd.h>
24#include <VBox/err.h>
25#include <VBox/sup.h>
26#include <VBox/log.h>
27
28#include <iprt/alloc.h>
29#include <iprt/assert.h>
30#include <iprt/uuid.h>
31#include <iprt/file.h>
32#include <iprt/string.h>
33#include <iprt/asm.h>
34#include <iprt/param.h>
35#include <iprt/path.h>
36#include <iprt/sg.h>
37#include <iprt/semaphore.h>
38
39#include "VDInternal.h"
40
41/** Buffer size used for merging images. */
42#define VD_MERGE_BUFFER_SIZE (16 * _1M)
43
44/** Maximum number of segments in one I/O task. */
45#define VD_IO_TASK_SEGMENTS_MAX 64
46
47/** Threshold after not recently used blocks are removed from the list. */
48#define VD_DISCARD_REMOVE_THRESHOLD (10 * _1M) /** @todo experiment */
49
50/**
51 * VD async I/O interface storage descriptor.
52 */
53typedef struct VDIIOFALLBACKSTORAGE
54{
55 /** File handle. */
56 RTFILE File;
57 /** Completion callback. */
58 PFNVDCOMPLETED pfnCompleted;
59 /** Thread for async access. */
60 RTTHREAD ThreadAsync;
61} VDIIOFALLBACKSTORAGE, *PVDIIOFALLBACKSTORAGE;
62
63/**
64 * uModified bit flags.
65 */
66#define VD_IMAGE_MODIFIED_FLAG RT_BIT(0)
67#define VD_IMAGE_MODIFIED_FIRST RT_BIT(1)
68#define VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE RT_BIT(2)
69
70
71# define VD_IS_LOCKED(a_pDisk) \
72 do \
73 { \
74 NOREF(a_pDisk); \
75 AssertMsg((a_pDisk)->fLocked, \
76 ("Lock not held\n"));\
77 } while(0)
78
79/**
80 * VBox parent read descriptor, used internally for compaction.
81 */
82typedef struct VDPARENTSTATEDESC
83{
84 /** Pointer to disk descriptor. */
85 PVDISK pDisk;
86 /** Pointer to image descriptor. */
87 PVDIMAGE pImage;
88} VDPARENTSTATEDESC, *PVDPARENTSTATEDESC;
89
90/**
91 * Transfer direction.
92 */
93typedef enum VDIOCTXTXDIR
94{
95 /** Read */
96 VDIOCTXTXDIR_READ = 0,
97 /** Write */
98 VDIOCTXTXDIR_WRITE,
99 /** Flush */
100 VDIOCTXTXDIR_FLUSH,
101 /** Discard */
102 VDIOCTXTXDIR_DISCARD,
103 /** 32bit hack */
104 VDIOCTXTXDIR_32BIT_HACK = 0x7fffffff
105} VDIOCTXTXDIR, *PVDIOCTXTXDIR;
106
107/** Transfer function */
108typedef DECLCALLBACK(int) FNVDIOCTXTRANSFER (PVDIOCTX pIoCtx);
109/** Pointer to a transfer function. */
110typedef FNVDIOCTXTRANSFER *PFNVDIOCTXTRANSFER;
111
112/**
113 * I/O context
114 */
115typedef struct VDIOCTX
116{
117 /** Pointer to the next I/O context. */
118 struct VDIOCTX * volatile pIoCtxNext;
119 /** Disk this is request is for. */
120 PVDISK pDisk;
121 /** Return code. */
122 int rcReq;
123 /** Various flags for the I/O context. */
124 uint32_t fFlags;
125 /** Number of data transfers currently pending. */
126 volatile uint32_t cDataTransfersPending;
127 /** How many meta data transfers are pending. */
128 volatile uint32_t cMetaTransfersPending;
129 /** Flag whether the request finished */
130 volatile bool fComplete;
131 /** Temporary allocated memory which is freed
132 * when the context completes. */
133 void *pvAllocation;
134 /** Transfer function. */
135 PFNVDIOCTXTRANSFER pfnIoCtxTransfer;
136 /** Next transfer part after the current one completed. */
137 PFNVDIOCTXTRANSFER pfnIoCtxTransferNext;
138 /** Transfer direction */
139 VDIOCTXTXDIR enmTxDir;
140 /** Request type dependent data. */
141 union
142 {
143 /** I/O request (read/write). */
144 struct
145 {
146 /** Number of bytes left until this context completes. */
147 volatile uint32_t cbTransferLeft;
148 /** Current offset */
149 volatile uint64_t uOffset;
150 /** Number of bytes to transfer */
151 volatile size_t cbTransfer;
152 /** Current image in the chain. */
153 PVDIMAGE pImageCur;
154 /** Start image to read from. pImageCur is reset to this
155 * value after it reached the first image in the chain. */
156 PVDIMAGE pImageStart;
157 /** S/G buffer */
158 RTSGBUF SgBuf;
159 /** Number of bytes to clear in the buffer before the current read. */
160 size_t cbBufClear;
161 /** Number of images to read. */
162 unsigned cImagesRead;
163 /** Override for the parent image to start reading from. */
164 PVDIMAGE pImageParentOverride;
165 /** Original offset of the transfer - required for filtering read requests. */
166 uint64_t uOffsetXferOrig;
167 /** Original size of the transfer - required for fitlering read requests. */
168 size_t cbXferOrig;
169 } Io;
170 /** Discard requests. */
171 struct
172 {
173 /** Pointer to the range descriptor array. */
174 PCRTRANGE paRanges;
175 /** Number of ranges in the array. */
176 unsigned cRanges;
177 /** Range descriptor index which is processed. */
178 unsigned idxRange;
179 /** Start offset to discard currently. */
180 uint64_t offCur;
181 /** How many bytes left to discard in the current range. */
182 size_t cbDiscardLeft;
183 /** How many bytes to discard in the current block (<= cbDiscardLeft). */
184 size_t cbThisDiscard;
185 /** Discard block handled currently. */
186 PVDDISCARDBLOCK pBlock;
187 } Discard;
188 } Req;
189 /** Parent I/O context if any. Sets the type of the context (root/child) */
190 PVDIOCTX pIoCtxParent;
191 /** Type dependent data (root/child) */
192 union
193 {
194 /** Root data */
195 struct
196 {
197 /** Completion callback */
198 PFNVDASYNCTRANSFERCOMPLETE pfnComplete;
199 /** User argument 1 passed on completion. */
200 void *pvUser1;
201 /** User argument 2 passed on completion. */
202 void *pvUser2;
203 } Root;
204 /** Child data */
205 struct
206 {
207 /** Saved start offset */
208 uint64_t uOffsetSaved;
209 /** Saved transfer size */
210 size_t cbTransferLeftSaved;
211 /** Number of bytes transferred from the parent if this context completes. */
212 size_t cbTransferParent;
213 /** Number of bytes to pre read */
214 size_t cbPreRead;
215 /** Number of bytes to post read. */
216 size_t cbPostRead;
217 /** Number of bytes to write left in the parent. */
218 size_t cbWriteParent;
219 /** Write type dependent data. */
220 union
221 {
222 /** Optimized */
223 struct
224 {
225 /** Bytes to fill to satisfy the block size. Not part of the virtual disk. */
226 size_t cbFill;
227 /** Bytes to copy instead of reading from the parent */
228 size_t cbWriteCopy;
229 /** Bytes to read from the image. */
230 size_t cbReadImage;
231 } Optimized;
232 } Write;
233 } Child;
234 } Type;
235} VDIOCTX;
236
237/** Default flags for an I/O context, i.e. unblocked and async. */
238#define VDIOCTX_FLAGS_DEFAULT (0)
239/** Flag whether the context is blocked. */
240#define VDIOCTX_FLAGS_BLOCKED RT_BIT_32(0)
241/** Flag whether the I/O context is using synchronous I/O. */
242#define VDIOCTX_FLAGS_SYNC RT_BIT_32(1)
243/** Flag whether the read should update the cache. */
244#define VDIOCTX_FLAGS_READ_UPDATE_CACHE RT_BIT_32(2)
245/** Flag whether free blocks should be zeroed.
246 * If false and no image has data for sepcified
247 * range VERR_VD_BLOCK_FREE is returned for the I/O context.
248 * Note that unallocated blocks are still zeroed
249 * if at least one image has valid data for a part
250 * of the range.
251 */
252#define VDIOCTX_FLAGS_ZERO_FREE_BLOCKS RT_BIT_32(3)
253/** Don't free the I/O context when complete because
254 * it was alloacted elsewhere (stack, ...). */
255#define VDIOCTX_FLAGS_DONT_FREE RT_BIT_32(4)
256/** Don't set the modified flag for this I/O context when writing. */
257#define VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG RT_BIT_32(5)
258/** The write filter was applied already and shouldn't be applied a second time.
259 * Used at the beginning of vdWriteHelperAsync() because it might be called
260 * multiple times.
261 */
262#define VDIOCTX_FLAGS_WRITE_FILTER_APPLIED RT_BIT_32(6)
263
264/** NIL I/O context pointer value. */
265#define NIL_VDIOCTX ((PVDIOCTX)0)
266
267/**
268 * List node for deferred I/O contexts.
269 */
270typedef struct VDIOCTXDEFERRED
271{
272 /** Node in the list of deferred requests.
273 * A request can be deferred if the image is growing
274 * and the request accesses the same range or if
275 * the backend needs to read or write metadata from the disk
276 * before it can continue. */
277 RTLISTNODE NodeDeferred;
278 /** I/O context this entry points to. */
279 PVDIOCTX pIoCtx;
280} VDIOCTXDEFERRED, *PVDIOCTXDEFERRED;
281
282/**
283 * I/O task.
284 */
285typedef struct VDIOTASK
286{
287 /** Next I/O task waiting in the list. */
288 struct VDIOTASK * volatile pNext;
289 /** Storage this task belongs to. */
290 PVDIOSTORAGE pIoStorage;
291 /** Optional completion callback. */
292 PFNVDXFERCOMPLETED pfnComplete;
293 /** Opaque user data. */
294 void *pvUser;
295 /** Completion status code for the task. */
296 int rcReq;
297 /** Flag whether this is a meta data transfer. */
298 bool fMeta;
299 /** Type dependent data. */
300 union
301 {
302 /** User data transfer. */
303 struct
304 {
305 /** Number of bytes this task transferred. */
306 uint32_t cbTransfer;
307 /** Pointer to the I/O context the task belongs. */
308 PVDIOCTX pIoCtx;
309 } User;
310 /** Meta data transfer. */
311 struct
312 {
313 /** Meta transfer this task is for. */
314 PVDMETAXFER pMetaXfer;
315 } Meta;
316 } Type;
317} VDIOTASK;
318
319/**
320 * Storage handle.
321 */
322typedef struct VDIOSTORAGE
323{
324 /** Image I/O state this storage handle belongs to. */
325 PVDIO pVDIo;
326 /** AVL tree for pending async metadata transfers. */
327 PAVLRFOFFTREE pTreeMetaXfers;
328 /** Storage handle */
329 void *pStorage;
330} VDIOSTORAGE;
331
332/**
333 * Metadata transfer.
334 *
335 * @note This entry can't be freed if either the list is not empty or
336 * the reference counter is not 0.
337 * The assumption is that the backends don't need to read huge amounts of
338 * metadata to complete a transfer so the additional memory overhead should
339 * be relatively small.
340 */
341typedef struct VDMETAXFER
342{
343 /** AVL core for fast search (the file offset is the key) */
344 AVLRFOFFNODECORE Core;
345 /** I/O storage for this transfer. */
346 PVDIOSTORAGE pIoStorage;
347 /** Flags. */
348 uint32_t fFlags;
349 /** List of I/O contexts waiting for this metadata transfer to complete. */
350 RTLISTNODE ListIoCtxWaiting;
351 /** Number of references to this entry. */
352 unsigned cRefs;
353 /** Size of the data stored with this entry. */
354 size_t cbMeta;
355 /** Shadow buffer which is used in case a write is still active and other
356 * writes update the shadow buffer. */
357 uint8_t *pbDataShw;
358 /** List of I/O contexts updating the shadow buffer while there is a write
359 * in progress. */
360 RTLISTNODE ListIoCtxShwWrites;
361 /** Data stored - variable size. */
362 uint8_t abData[1];
363} VDMETAXFER;
364
365/**
366 * The transfer direction for the metadata.
367 */
368#define VDMETAXFER_TXDIR_MASK 0x3
369#define VDMETAXFER_TXDIR_NONE 0x0
370#define VDMETAXFER_TXDIR_WRITE 0x1
371#define VDMETAXFER_TXDIR_READ 0x2
372#define VDMETAXFER_TXDIR_FLUSH 0x3
373#define VDMETAXFER_TXDIR_GET(flags) ((flags) & VDMETAXFER_TXDIR_MASK)
374#define VDMETAXFER_TXDIR_SET(flags, dir) ((flags) = (flags & ~VDMETAXFER_TXDIR_MASK) | (dir))
375
376/** Forward declaration of the async discard helper. */
377static DECLCALLBACK(int) vdDiscardHelperAsync(PVDIOCTX pIoCtx);
378static DECLCALLBACK(int) vdWriteHelperAsync(PVDIOCTX pIoCtx);
379static void vdDiskProcessBlockedIoCtx(PVDISK pDisk);
380static int vdDiskUnlock(PVDISK pDisk, PVDIOCTX pIoCtxRc);
381static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq);
382
383/**
384 * internal: issue error message.
385 */
386static int vdError(PVDISK pDisk, int rc, RT_SRC_POS_DECL,
387 const char *pszFormat, ...)
388{
389 va_list va;
390 va_start(va, pszFormat);
391 if (pDisk->pInterfaceError)
392 pDisk->pInterfaceError->pfnError(pDisk->pInterfaceError->Core.pvUser, rc, RT_SRC_POS_ARGS, pszFormat, va);
393 va_end(va);
394 return rc;
395}
396
397/**
398 * internal: thread synchronization, start read.
399 */
400DECLINLINE(int) vdThreadStartRead(PVDISK pDisk)
401{
402 int rc = VINF_SUCCESS;
403 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
404 rc = pDisk->pInterfaceThreadSync->pfnStartRead(pDisk->pInterfaceThreadSync->Core.pvUser);
405 return rc;
406}
407
408/**
409 * internal: thread synchronization, finish read.
410 */
411DECLINLINE(int) vdThreadFinishRead(PVDISK pDisk)
412{
413 int rc = VINF_SUCCESS;
414 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
415 rc = pDisk->pInterfaceThreadSync->pfnFinishRead(pDisk->pInterfaceThreadSync->Core.pvUser);
416 return rc;
417}
418
419/**
420 * internal: thread synchronization, start write.
421 */
422DECLINLINE(int) vdThreadStartWrite(PVDISK pDisk)
423{
424 int rc = VINF_SUCCESS;
425 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
426 rc = pDisk->pInterfaceThreadSync->pfnStartWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
427 return rc;
428}
429
430/**
431 * internal: thread synchronization, finish write.
432 */
433DECLINLINE(int) vdThreadFinishWrite(PVDISK pDisk)
434{
435 int rc = VINF_SUCCESS;
436 if (RT_UNLIKELY(pDisk->pInterfaceThreadSync))
437 rc = pDisk->pInterfaceThreadSync->pfnFinishWrite(pDisk->pInterfaceThreadSync->Core.pvUser);
438 return rc;
439}
440
441/**
442 * internal: add image structure to the end of images list.
443 */
444static void vdAddImageToList(PVDISK pDisk, PVDIMAGE pImage)
445{
446 pImage->pPrev = NULL;
447 pImage->pNext = NULL;
448
449 if (pDisk->pBase)
450 {
451 Assert(pDisk->cImages > 0);
452 pImage->pPrev = pDisk->pLast;
453 pDisk->pLast->pNext = pImage;
454 pDisk->pLast = pImage;
455 }
456 else
457 {
458 Assert(pDisk->cImages == 0);
459 pDisk->pBase = pImage;
460 pDisk->pLast = pImage;
461 }
462
463 pDisk->cImages++;
464}
465
466/**
467 * internal: remove image structure from the images list.
468 */
469static void vdRemoveImageFromList(PVDISK pDisk, PVDIMAGE pImage)
470{
471 Assert(pDisk->cImages > 0);
472
473 if (pImage->pPrev)
474 pImage->pPrev->pNext = pImage->pNext;
475 else
476 pDisk->pBase = pImage->pNext;
477
478 if (pImage->pNext)
479 pImage->pNext->pPrev = pImage->pPrev;
480 else
481 pDisk->pLast = pImage->pPrev;
482
483 pImage->pPrev = NULL;
484 pImage->pNext = NULL;
485
486 pDisk->cImages--;
487}
488
489/**
490 * Release a referene to the filter decrementing the counter and destroying the filter
491 * when the counter reaches zero.
492 *
493 * @returns The new reference count.
494 * @param pFilter The filter to release.
495 */
496static uint32_t vdFilterRelease(PVDFILTER pFilter)
497{
498 uint32_t cRefs = ASMAtomicDecU32(&pFilter->cRefs);
499 if (!cRefs)
500 {
501 pFilter->pBackend->pfnDestroy(pFilter->pvBackendData);
502 RTMemFree(pFilter);
503 }
504
505 return cRefs;
506}
507
508/**
509 * Increments the reference counter of the given filter.
510 *
511 * @return The new reference count.
512 * @param pFilter The filter.
513 */
514static uint32_t vdFilterRetain(PVDFILTER pFilter)
515{
516 return ASMAtomicIncU32(&pFilter->cRefs);
517}
518
519/**
520 * internal: find image by index into the images list.
521 */
522static PVDIMAGE vdGetImageByNumber(PVDISK pDisk, unsigned nImage)
523{
524 PVDIMAGE pImage = pDisk->pBase;
525 if (nImage == VD_LAST_IMAGE)
526 return pDisk->pLast;
527 while (pImage && nImage)
528 {
529 pImage = pImage->pNext;
530 nImage--;
531 }
532 return pImage;
533}
534
535/**
536 * Creates a new region list from the given one converting to match the flags if necessary.
537 *
538 * @returns VBox status code.
539 * @param pRegionList The region list to convert from.
540 * @param fFlags The flags for the new region list.
541 * @param ppRegionList Where to store the new region list on success.
542 */
543static int vdRegionListConv(PCVDREGIONLIST pRegionList, uint32_t fFlags, PPVDREGIONLIST ppRegionList)
544{
545 int rc = VINF_SUCCESS;
546 PVDREGIONLIST pRegionListNew = (PVDREGIONLIST)RTMemDup(pRegionList, RT_UOFFSETOF(VDREGIONLIST, aRegions[pRegionList->cRegions]));
547 if (RT_LIKELY(pRegionListNew))
548 {
549 /* Do we have to convert anything? */
550 if (pRegionList->fFlags != fFlags)
551 {
552 uint64_t offRegionNext = 0;
553
554 pRegionListNew->fFlags = fFlags;
555 for (unsigned i = 0; i < pRegionListNew->cRegions; i++)
556 {
557 PVDREGIONDESC pRegion = &pRegionListNew->aRegions[i];
558
559 if ( (fFlags & VD_REGION_LIST_F_LOC_SIZE_BLOCKS)
560 && !(pRegionList->fFlags & VD_REGION_LIST_F_LOC_SIZE_BLOCKS))
561 {
562 Assert(!(pRegion->cRegionBlocksOrBytes % pRegion->cbBlock));
563
564 /* Convert from bytes to logical blocks. */
565 pRegion->offRegion = offRegionNext;
566 pRegion->cRegionBlocksOrBytes = pRegion->cRegionBlocksOrBytes / pRegion->cbBlock;
567 offRegionNext += pRegion->cRegionBlocksOrBytes;
568 }
569 else
570 {
571 /* Convert from logical blocks to bytes. */
572 pRegion->offRegion = offRegionNext;
573 pRegion->cRegionBlocksOrBytes = pRegion->cRegionBlocksOrBytes * pRegion->cbBlock;
574 offRegionNext += pRegion->cRegionBlocksOrBytes;
575 }
576 }
577 }
578
579 *ppRegionList = pRegionListNew;
580 }
581 else
582 rc = VERR_NO_MEMORY;
583
584 return rc;
585}
586
587/**
588 * Returns the virtual size of the image in bytes.
589 *
590 * @returns Size of the given image in bytes.
591 * @param pImage The image to get the size from.
592 */
593static uint64_t vdImageGetSize(PVDIMAGE pImage)
594{
595 uint64_t cbImage = 0;
596 PCVDREGIONLIST pRegionList = NULL;
597 int rc = pImage->Backend->pfnQueryRegions(pImage->pBackendData, &pRegionList);
598 if (RT_SUCCESS(rc))
599 {
600 if (pRegionList->fFlags & VD_REGION_LIST_F_LOC_SIZE_BLOCKS)
601 {
602 PVDREGIONLIST pRegionListConv = NULL;
603 rc = vdRegionListConv(pRegionList, 0, &pRegionListConv);
604 if (RT_SUCCESS(rc))
605 {
606 for (uint32_t i = 0; i < pRegionListConv->cRegions; i++)
607 cbImage += pRegionListConv->aRegions[i].cRegionBlocksOrBytes;
608
609 VDRegionListFree(pRegionListConv);
610 }
611 }
612 else
613 for (uint32_t i = 0; i < pRegionList->cRegions; i++)
614 cbImage += pRegionList->aRegions[i].cRegionBlocksOrBytes;
615
616 AssertPtr(pImage->Backend->pfnRegionListRelease);
617 pImage->Backend->pfnRegionListRelease(pImage->pBackendData, pRegionList);
618 }
619
620 return cbImage;
621}
622
623/**
624 * Applies the filter chain to the given write request.
625 *
626 * @returns VBox status code.
627 * @param pDisk The HDD container.
628 * @param uOffset The start offset of the write.
629 * @param cbWrite Number of bytes to write.
630 * @param pIoCtx The I/O context associated with the request.
631 */
632static int vdFilterChainApplyWrite(PVDISK pDisk, uint64_t uOffset, size_t cbWrite,
633 PVDIOCTX pIoCtx)
634{
635 int rc = VINF_SUCCESS;
636
637 VD_IS_LOCKED(pDisk);
638
639 PVDFILTER pFilter;
640 RTListForEach(&pDisk->ListFilterChainWrite, pFilter, VDFILTER, ListNodeChainWrite)
641 {
642 rc = pFilter->pBackend->pfnFilterWrite(pFilter->pvBackendData, uOffset, cbWrite, pIoCtx);
643 if (RT_FAILURE(rc))
644 break;
645 /* Reset S/G buffer for the next filter. */
646 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
647 }
648
649 return rc;
650}
651
652/**
653 * Applies the filter chain to the given read request.
654 *
655 * @returns VBox status code.
656 * @param pDisk The HDD container.
657 * @param uOffset The start offset of the read.
658 * @param cbRead Number of bytes read.
659 * @param pIoCtx The I/O context associated with the request.
660 */
661static int vdFilterChainApplyRead(PVDISK pDisk, uint64_t uOffset, size_t cbRead,
662 PVDIOCTX pIoCtx)
663{
664 int rc = VINF_SUCCESS;
665
666 VD_IS_LOCKED(pDisk);
667
668 /* Reset buffer before starting. */
669 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
670
671 PVDFILTER pFilter;
672 RTListForEach(&pDisk->ListFilterChainRead, pFilter, VDFILTER, ListNodeChainRead)
673 {
674 rc = pFilter->pBackend->pfnFilterRead(pFilter->pvBackendData, uOffset, cbRead, pIoCtx);
675 if (RT_FAILURE(rc))
676 break;
677 /* Reset S/G buffer for the next filter. */
678 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
679 }
680
681 return rc;
682}
683
684DECLINLINE(void) vdIoCtxRootComplete(PVDISK pDisk, PVDIOCTX pIoCtx)
685{
686 if ( RT_SUCCESS(pIoCtx->rcReq)
687 && pIoCtx->enmTxDir == VDIOCTXTXDIR_READ)
688 pIoCtx->rcReq = vdFilterChainApplyRead(pDisk, pIoCtx->Req.Io.uOffsetXferOrig,
689 pIoCtx->Req.Io.cbXferOrig, pIoCtx);
690
691 pIoCtx->Type.Root.pfnComplete(pIoCtx->Type.Root.pvUser1,
692 pIoCtx->Type.Root.pvUser2,
693 pIoCtx->rcReq);
694}
695
696/**
697 * Initialize the structure members of a given I/O context.
698 */
699DECLINLINE(void) vdIoCtxInit(PVDIOCTX pIoCtx, PVDISK pDisk, VDIOCTXTXDIR enmTxDir,
700 uint64_t uOffset, size_t cbTransfer, PVDIMAGE pImageStart,
701 PCRTSGBUF pcSgBuf, void *pvAllocation,
702 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
703{
704 pIoCtx->pDisk = pDisk;
705 pIoCtx->enmTxDir = enmTxDir;
706 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTransfer; Assert((uint32_t)cbTransfer == cbTransfer);
707 pIoCtx->Req.Io.uOffset = uOffset;
708 pIoCtx->Req.Io.cbTransfer = cbTransfer;
709 pIoCtx->Req.Io.pImageStart = pImageStart;
710 pIoCtx->Req.Io.pImageCur = pImageStart;
711 pIoCtx->Req.Io.cbBufClear = 0;
712 pIoCtx->Req.Io.pImageParentOverride = NULL;
713 pIoCtx->Req.Io.uOffsetXferOrig = uOffset;
714 pIoCtx->Req.Io.cbXferOrig = cbTransfer;
715 pIoCtx->cDataTransfersPending = 0;
716 pIoCtx->cMetaTransfersPending = 0;
717 pIoCtx->fComplete = false;
718 pIoCtx->fFlags = fFlags;
719 pIoCtx->pvAllocation = pvAllocation;
720 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
721 pIoCtx->pfnIoCtxTransferNext = NULL;
722 pIoCtx->rcReq = VINF_SUCCESS;
723 pIoCtx->pIoCtxParent = NULL;
724
725 /* There is no S/G list for a flush request. */
726 if ( enmTxDir != VDIOCTXTXDIR_FLUSH
727 && enmTxDir != VDIOCTXTXDIR_DISCARD)
728 RTSgBufClone(&pIoCtx->Req.Io.SgBuf, pcSgBuf);
729 else
730 memset(&pIoCtx->Req.Io.SgBuf, 0, sizeof(RTSGBUF));
731}
732
733/**
734 * Internal: Tries to read the desired range from the given cache.
735 *
736 * @returns VBox status code.
737 * @retval VERR_VD_BLOCK_FREE if the block is not in the cache.
738 * pcbRead will be set to the number of bytes not in the cache.
739 * Everything thereafter might be in the cache.
740 * @param pCache The cache to read from.
741 * @param uOffset Offset of the virtual disk to read.
742 * @param cbRead How much to read.
743 * @param pIoCtx The I/O context to read into.
744 * @param pcbRead Where to store the number of bytes actually read.
745 * On success this indicates the number of bytes read from the cache.
746 * If VERR_VD_BLOCK_FREE is returned this gives the number of bytes
747 * which are not in the cache.
748 * In both cases everything beyond this value
749 * might or might not be in the cache.
750 */
751static int vdCacheReadHelper(PVDCACHE pCache, uint64_t uOffset,
752 size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbRead)
753{
754 int rc = VINF_SUCCESS;
755
756 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbRead=%zu pcbRead=%#p\n",
757 pCache, uOffset, pIoCtx, cbRead, pcbRead));
758
759 AssertPtr(pCache);
760 AssertPtr(pcbRead);
761
762 rc = pCache->Backend->pfnRead(pCache->pBackendData, uOffset, cbRead,
763 pIoCtx, pcbRead);
764
765 LogFlowFunc(("returns rc=%Rrc pcbRead=%zu\n", rc, *pcbRead));
766 return rc;
767}
768
769/**
770 * Internal: Writes data for the given block into the cache.
771 *
772 * @returns VBox status code.
773 * @param pCache The cache to write to.
774 * @param uOffset Offset of the virtual disk to write to the cache.
775 * @param cbWrite How much to write.
776 * @param pIoCtx The I/O context to write from.
777 * @param pcbWritten How much data could be written, optional.
778 */
779static int vdCacheWriteHelper(PVDCACHE pCache, uint64_t uOffset, size_t cbWrite,
780 PVDIOCTX pIoCtx, size_t *pcbWritten)
781{
782 int rc = VINF_SUCCESS;
783
784 LogFlowFunc(("pCache=%#p uOffset=%llu pIoCtx=%p cbWrite=%zu pcbWritten=%#p\n",
785 pCache, uOffset, pIoCtx, cbWrite, pcbWritten));
786
787 AssertPtr(pCache);
788 AssertPtr(pIoCtx);
789 Assert(cbWrite > 0);
790
791 if (pcbWritten)
792 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
793 pIoCtx, pcbWritten);
794 else
795 {
796 size_t cbWritten = 0;
797
798 do
799 {
800 rc = pCache->Backend->pfnWrite(pCache->pBackendData, uOffset, cbWrite,
801 pIoCtx, &cbWritten);
802 uOffset += cbWritten;
803 cbWrite -= cbWritten;
804 } while ( cbWrite
805 && ( RT_SUCCESS(rc)
806 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
807 }
808
809 LogFlowFunc(("returns rc=%Rrc pcbWritten=%zu\n",
810 rc, pcbWritten ? *pcbWritten : cbWrite));
811 return rc;
812}
813
814/**
815 * Creates a new empty discard state.
816 *
817 * @returns Pointer to the new discard state or NULL if out of memory.
818 */
819static PVDDISCARDSTATE vdDiscardStateCreate(void)
820{
821 PVDDISCARDSTATE pDiscard = (PVDDISCARDSTATE)RTMemAllocZ(sizeof(VDDISCARDSTATE));
822
823 if (pDiscard)
824 {
825 RTListInit(&pDiscard->ListLru);
826 pDiscard->pTreeBlocks = (PAVLRU64TREE)RTMemAllocZ(sizeof(AVLRU64TREE));
827 if (!pDiscard->pTreeBlocks)
828 {
829 RTMemFree(pDiscard);
830 pDiscard = NULL;
831 }
832 }
833
834 return pDiscard;
835}
836
837/**
838 * Removes the least recently used blocks from the waiting list until
839 * the new value is reached.
840 *
841 * @returns VBox status code.
842 * @param pDisk VD disk container.
843 * @param pDiscard The discard state.
844 * @param cbDiscardingNew How many bytes should be waiting on success.
845 * The number of bytes waiting can be less.
846 */
847static int vdDiscardRemoveBlocks(PVDISK pDisk, PVDDISCARDSTATE pDiscard, size_t cbDiscardingNew)
848{
849 int rc = VINF_SUCCESS;
850
851 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
852 pDisk, pDiscard, cbDiscardingNew));
853
854 while (pDiscard->cbDiscarding > cbDiscardingNew)
855 {
856 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
857
858 Assert(!RTListIsEmpty(&pDiscard->ListLru));
859
860 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
861 uint64_t offStart = pBlock->Core.Key;
862 uint32_t idxStart = 0;
863 size_t cbLeft = pBlock->cbDiscard;
864 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
865 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
866
867 while (cbLeft > 0)
868 {
869 int32_t idxEnd;
870 size_t cbThis = cbLeft;
871
872 if (fAllocated)
873 {
874 /* Check for the first unallocated bit. */
875 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
876 if (idxEnd != -1)
877 {
878 cbThis = (idxEnd - idxStart) * 512;
879 fAllocated = false;
880 }
881 }
882 else
883 {
884 /* Mark as unused and check for the first set bit. */
885 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
886 if (idxEnd != -1)
887 cbThis = (idxEnd - idxStart) * 512;
888
889
890 VDIOCTX IoCtx;
891 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_DISCARD, 0, 0, NULL,
892 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
893 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData,
894 &IoCtx, offStart, cbThis, NULL,
895 NULL, &cbThis, NULL,
896 VD_DISCARD_MARK_UNUSED);
897 if (RT_FAILURE(rc))
898 break;
899
900 fAllocated = true;
901 }
902
903 idxStart = idxEnd;
904 offStart += cbThis;
905 cbLeft -= cbThis;
906 }
907
908 if (RT_FAILURE(rc))
909 break;
910
911 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
912 Assert(pBlockRemove == pBlock); NOREF(pBlockRemove);
913 RTListNodeRemove(&pBlock->NodeLru);
914
915 pDiscard->cbDiscarding -= pBlock->cbDiscard;
916 RTMemFree(pBlock->pbmAllocated);
917 RTMemFree(pBlock);
918 }
919
920 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
921
922 LogFlowFunc(("returns rc=%Rrc\n", rc));
923 return rc;
924}
925
926/**
927 * Destroys the current discard state, writing any waiting blocks to the image.
928 *
929 * @returns VBox status code.
930 * @param pDisk VD disk container.
931 */
932static int vdDiscardStateDestroy(PVDISK pDisk)
933{
934 int rc = VINF_SUCCESS;
935
936 if (pDisk->pDiscard)
937 {
938 rc = vdDiscardRemoveBlocks(pDisk, pDisk->pDiscard, 0 /* Remove all blocks. */);
939 AssertRC(rc);
940 RTMemFree(pDisk->pDiscard->pTreeBlocks);
941 RTMemFree(pDisk->pDiscard);
942 pDisk->pDiscard = NULL;
943 }
944
945 return rc;
946}
947
948/**
949 * Marks the given range as allocated in the image.
950 * Required if there are discards in progress and a write to a block which can get discarded
951 * is written to.
952 *
953 * @returns VBox status code.
954 * @param pDisk VD container data.
955 * @param uOffset First byte to mark as allocated.
956 * @param cbRange Number of bytes to mark as allocated.
957 */
958static int vdDiscardSetRangeAllocated(PVDISK pDisk, uint64_t uOffset, size_t cbRange)
959{
960 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
961 int rc = VINF_SUCCESS;
962
963 if (pDiscard)
964 {
965 do
966 {
967 size_t cbThisRange = cbRange;
968 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64RangeGet(pDiscard->pTreeBlocks, uOffset);
969
970 if (pBlock)
971 {
972 int32_t idxStart, idxEnd;
973
974 Assert(!(cbThisRange % 512));
975 Assert(!((uOffset - pBlock->Core.Key) % 512));
976
977 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.KeyLast - uOffset + 1);
978
979 idxStart = (uOffset - pBlock->Core.Key) / 512;
980 idxEnd = idxStart + (int32_t)(cbThisRange / 512);
981 ASMBitSetRange(pBlock->pbmAllocated, idxStart, idxEnd);
982 }
983 else
984 {
985 pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, uOffset, true);
986 if (pBlock)
987 cbThisRange = RT_MIN(cbThisRange, pBlock->Core.Key - uOffset);
988 }
989
990 Assert(cbRange >= cbThisRange);
991
992 uOffset += cbThisRange;
993 cbRange -= cbThisRange;
994 } while (cbRange != 0);
995 }
996
997 return rc;
998}
999
1000DECLINLINE(PVDIOCTX) vdIoCtxAlloc(PVDISK pDisk, VDIOCTXTXDIR enmTxDir,
1001 uint64_t uOffset, size_t cbTransfer,
1002 PVDIMAGE pImageStart,PCRTSGBUF pcSgBuf,
1003 void *pvAllocation, PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1004 uint32_t fFlags)
1005{
1006 PVDIOCTX pIoCtx = NULL;
1007
1008 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1009 if (RT_LIKELY(pIoCtx))
1010 {
1011 vdIoCtxInit(pIoCtx, pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1012 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1013 }
1014
1015 return pIoCtx;
1016}
1017
1018DECLINLINE(PVDIOCTX) vdIoCtxRootAlloc(PVDISK pDisk, VDIOCTXTXDIR enmTxDir,
1019 uint64_t uOffset, size_t cbTransfer,
1020 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1021 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1022 void *pvUser1, void *pvUser2,
1023 void *pvAllocation,
1024 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1025 uint32_t fFlags)
1026{
1027 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1028 pcSgBuf, pvAllocation, pfnIoCtxTransfer, fFlags);
1029
1030 if (RT_LIKELY(pIoCtx))
1031 {
1032 pIoCtx->pIoCtxParent = NULL;
1033 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1034 pIoCtx->Type.Root.pvUser1 = pvUser1;
1035 pIoCtx->Type.Root.pvUser2 = pvUser2;
1036 }
1037
1038 LogFlow(("Allocated root I/O context %#p\n", pIoCtx));
1039 return pIoCtx;
1040}
1041
1042DECLINLINE(void) vdIoCtxDiscardInit(PVDIOCTX pIoCtx, PVDISK pDisk, PCRTRANGE paRanges,
1043 unsigned cRanges, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1044 void *pvUser1, void *pvUser2, void *pvAllocation,
1045 PFNVDIOCTXTRANSFER pfnIoCtxTransfer, uint32_t fFlags)
1046{
1047 pIoCtx->pIoCtxNext = NULL;
1048 pIoCtx->pDisk = pDisk;
1049 pIoCtx->enmTxDir = VDIOCTXTXDIR_DISCARD;
1050 pIoCtx->cDataTransfersPending = 0;
1051 pIoCtx->cMetaTransfersPending = 0;
1052 pIoCtx->fComplete = false;
1053 pIoCtx->fFlags = fFlags;
1054 pIoCtx->pvAllocation = pvAllocation;
1055 pIoCtx->pfnIoCtxTransfer = pfnIoCtxTransfer;
1056 pIoCtx->pfnIoCtxTransferNext = NULL;
1057 pIoCtx->rcReq = VINF_SUCCESS;
1058 pIoCtx->Req.Discard.paRanges = paRanges;
1059 pIoCtx->Req.Discard.cRanges = cRanges;
1060 pIoCtx->Req.Discard.idxRange = 0;
1061 pIoCtx->Req.Discard.cbDiscardLeft = 0;
1062 pIoCtx->Req.Discard.offCur = 0;
1063 pIoCtx->Req.Discard.cbThisDiscard = 0;
1064
1065 pIoCtx->pIoCtxParent = NULL;
1066 pIoCtx->Type.Root.pfnComplete = pfnComplete;
1067 pIoCtx->Type.Root.pvUser1 = pvUser1;
1068 pIoCtx->Type.Root.pvUser2 = pvUser2;
1069}
1070
1071DECLINLINE(PVDIOCTX) vdIoCtxDiscardAlloc(PVDISK pDisk, PCRTRANGE paRanges,
1072 unsigned cRanges,
1073 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
1074 void *pvUser1, void *pvUser2,
1075 void *pvAllocation,
1076 PFNVDIOCTXTRANSFER pfnIoCtxTransfer,
1077 uint32_t fFlags)
1078{
1079 PVDIOCTX pIoCtx = NULL;
1080
1081 pIoCtx = (PVDIOCTX)RTMemCacheAlloc(pDisk->hMemCacheIoCtx);
1082 if (RT_LIKELY(pIoCtx))
1083 {
1084 vdIoCtxDiscardInit(pIoCtx, pDisk, paRanges, cRanges, pfnComplete, pvUser1,
1085 pvUser2, pvAllocation, pfnIoCtxTransfer, fFlags);
1086 }
1087
1088 LogFlow(("Allocated discard I/O context %#p\n", pIoCtx));
1089 return pIoCtx;
1090}
1091
1092DECLINLINE(PVDIOCTX) vdIoCtxChildAlloc(PVDISK pDisk, VDIOCTXTXDIR enmTxDir,
1093 uint64_t uOffset, size_t cbTransfer,
1094 PVDIMAGE pImageStart, PCRTSGBUF pcSgBuf,
1095 PVDIOCTX pIoCtxParent, size_t cbTransferParent,
1096 size_t cbWriteParent, void *pvAllocation,
1097 PFNVDIOCTXTRANSFER pfnIoCtxTransfer)
1098{
1099 PVDIOCTX pIoCtx = vdIoCtxAlloc(pDisk, enmTxDir, uOffset, cbTransfer, pImageStart,
1100 pcSgBuf, pvAllocation, pfnIoCtxTransfer, pIoCtxParent->fFlags & ~VDIOCTX_FLAGS_DONT_FREE);
1101
1102 AssertPtr(pIoCtxParent);
1103 Assert(!pIoCtxParent->pIoCtxParent);
1104
1105 if (RT_LIKELY(pIoCtx))
1106 {
1107 pIoCtx->pIoCtxParent = pIoCtxParent;
1108 pIoCtx->Type.Child.uOffsetSaved = uOffset;
1109 pIoCtx->Type.Child.cbTransferLeftSaved = cbTransfer;
1110 pIoCtx->Type.Child.cbTransferParent = cbTransferParent;
1111 pIoCtx->Type.Child.cbWriteParent = cbWriteParent;
1112 }
1113
1114 LogFlow(("Allocated child I/O context %#p\n", pIoCtx));
1115 return pIoCtx;
1116}
1117
1118DECLINLINE(PVDIOTASK) vdIoTaskUserAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDIOCTX pIoCtx, uint32_t cbTransfer)
1119{
1120 PVDIOTASK pIoTask = NULL;
1121
1122 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1123 if (pIoTask)
1124 {
1125 pIoTask->pIoStorage = pIoStorage;
1126 pIoTask->pfnComplete = pfnComplete;
1127 pIoTask->pvUser = pvUser;
1128 pIoTask->fMeta = false;
1129 pIoTask->Type.User.cbTransfer = cbTransfer;
1130 pIoTask->Type.User.pIoCtx = pIoCtx;
1131 }
1132
1133 return pIoTask;
1134}
1135
1136DECLINLINE(PVDIOTASK) vdIoTaskMetaAlloc(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser, PVDMETAXFER pMetaXfer)
1137{
1138 PVDIOTASK pIoTask = NULL;
1139
1140 pIoTask = (PVDIOTASK)RTMemCacheAlloc(pIoStorage->pVDIo->pDisk->hMemCacheIoTask);
1141 if (pIoTask)
1142 {
1143 pIoTask->pIoStorage = pIoStorage;
1144 pIoTask->pfnComplete = pfnComplete;
1145 pIoTask->pvUser = pvUser;
1146 pIoTask->fMeta = true;
1147 pIoTask->Type.Meta.pMetaXfer = pMetaXfer;
1148 }
1149
1150 return pIoTask;
1151}
1152
1153DECLINLINE(void) vdIoCtxFree(PVDISK pDisk, PVDIOCTX pIoCtx)
1154{
1155 Log(("Freeing I/O context %#p\n", pIoCtx));
1156
1157 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_FREE))
1158 {
1159 if (pIoCtx->pvAllocation)
1160 RTMemFree(pIoCtx->pvAllocation);
1161#ifdef DEBUG
1162 memset(&pIoCtx->pDisk, 0xff, sizeof(void *));
1163#endif
1164 RTMemCacheFree(pDisk->hMemCacheIoCtx, pIoCtx);
1165 }
1166}
1167
1168DECLINLINE(void) vdIoTaskFree(PVDISK pDisk, PVDIOTASK pIoTask)
1169{
1170#ifdef DEBUG
1171 memset(pIoTask, 0xff, sizeof(VDIOTASK));
1172#endif
1173 RTMemCacheFree(pDisk->hMemCacheIoTask, pIoTask);
1174}
1175
1176DECLINLINE(void) vdIoCtxChildReset(PVDIOCTX pIoCtx)
1177{
1178 AssertPtr(pIoCtx->pIoCtxParent);
1179
1180 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
1181 pIoCtx->Req.Io.uOffset = pIoCtx->Type.Child.uOffsetSaved;
1182 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved;
1183 Assert((uint32_t)pIoCtx->Type.Child.cbTransferLeftSaved == pIoCtx->Type.Child.cbTransferLeftSaved);
1184}
1185
1186DECLINLINE(PVDMETAXFER) vdMetaXferAlloc(PVDIOSTORAGE pIoStorage, uint64_t uOffset, size_t cb)
1187{
1188 PVDMETAXFER pMetaXfer = (PVDMETAXFER)RTMemAlloc(RT_OFFSETOF(VDMETAXFER, abData[cb]));
1189
1190 if (RT_LIKELY(pMetaXfer))
1191 {
1192 pMetaXfer->Core.Key = uOffset;
1193 pMetaXfer->Core.KeyLast = uOffset + cb - 1;
1194 pMetaXfer->fFlags = VDMETAXFER_TXDIR_NONE;
1195 pMetaXfer->cbMeta = cb;
1196 pMetaXfer->pIoStorage = pIoStorage;
1197 pMetaXfer->cRefs = 0;
1198 pMetaXfer->pbDataShw = NULL;
1199 RTListInit(&pMetaXfer->ListIoCtxWaiting);
1200 RTListInit(&pMetaXfer->ListIoCtxShwWrites);
1201 }
1202 return pMetaXfer;
1203}
1204
1205DECLINLINE(void) vdIoCtxAddToWaitingList(volatile PVDIOCTX *ppList, PVDIOCTX pIoCtx)
1206{
1207 /* Put it on the waiting list. */
1208 PVDIOCTX pNext = ASMAtomicUoReadPtrT(ppList, PVDIOCTX);
1209 PVDIOCTX pHeadOld;
1210 pIoCtx->pIoCtxNext = pNext;
1211 while (!ASMAtomicCmpXchgExPtr(ppList, pIoCtx, pNext, &pHeadOld))
1212 {
1213 pNext = pHeadOld;
1214 Assert(pNext != pIoCtx);
1215 pIoCtx->pIoCtxNext = pNext;
1216 ASMNopPause();
1217 }
1218}
1219
1220DECLINLINE(void) vdIoCtxDefer(PVDISK pDisk, PVDIOCTX pIoCtx)
1221{
1222 LogFlowFunc(("Deferring I/O context pIoCtx=%#p\n", pIoCtx));
1223
1224 Assert(!pIoCtx->pIoCtxParent && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED));
1225 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1226 vdIoCtxAddToWaitingList(&pDisk->pIoCtxBlockedHead, pIoCtx);
1227}
1228
1229static size_t vdIoCtxCopy(PVDIOCTX pIoCtxDst, PVDIOCTX pIoCtxSrc, size_t cbData)
1230{
1231 return RTSgBufCopy(&pIoCtxDst->Req.Io.SgBuf, &pIoCtxSrc->Req.Io.SgBuf, cbData);
1232}
1233
1234#if 0 /* unused */
1235static int vdIoCtxCmp(PVDIOCTX pIoCtx1, PVDIOCTX pIoCtx2, size_t cbData)
1236{
1237 return RTSgBufCmp(&pIoCtx1->Req.Io.SgBuf, &pIoCtx2->Req.Io.SgBuf, cbData);
1238}
1239#endif
1240
1241static size_t vdIoCtxCopyTo(PVDIOCTX pIoCtx, const uint8_t *pbData, size_t cbData)
1242{
1243 return RTSgBufCopyFromBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1244}
1245
1246static size_t vdIoCtxCopyFrom(PVDIOCTX pIoCtx, uint8_t *pbData, size_t cbData)
1247{
1248 return RTSgBufCopyToBuf(&pIoCtx->Req.Io.SgBuf, pbData, cbData);
1249}
1250
1251static size_t vdIoCtxSet(PVDIOCTX pIoCtx, uint8_t ch, size_t cbData)
1252{
1253 return RTSgBufSet(&pIoCtx->Req.Io.SgBuf, ch, cbData);
1254}
1255
1256/**
1257 * Returns whether the given I/O context has completed.
1258 *
1259 * @returns Flag whether the I/O context is complete.
1260 * @param pIoCtx The I/O context to check.
1261 */
1262DECLINLINE(bool) vdIoCtxIsComplete(PVDIOCTX pIoCtx)
1263{
1264 if ( !pIoCtx->cMetaTransfersPending
1265 && !pIoCtx->cDataTransfersPending
1266 && !pIoCtx->pfnIoCtxTransfer)
1267 return true;
1268
1269 /*
1270 * We complete the I/O context in case of an error
1271 * if there is no I/O task pending.
1272 */
1273 if ( RT_FAILURE(pIoCtx->rcReq)
1274 && !pIoCtx->cMetaTransfersPending
1275 && !pIoCtx->cDataTransfersPending)
1276 return true;
1277
1278 return false;
1279}
1280
1281/**
1282 * Returns whether the given I/O context is blocked due to a metadata transfer
1283 * or because the backend blocked it.
1284 *
1285 * @returns Flag whether the I/O context is blocked.
1286 * @param pIoCtx The I/O context to check.
1287 */
1288DECLINLINE(bool) vdIoCtxIsBlocked(PVDIOCTX pIoCtx)
1289{
1290 /* Don't change anything if there is a metadata transfer pending or we are blocked. */
1291 if ( pIoCtx->cMetaTransfersPending
1292 || (pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1293 return true;
1294
1295 return false;
1296}
1297
1298/**
1299 * Process the I/O context, core method which assumes that the I/O context
1300 * acquired the lock.
1301 *
1302 * @returns VBox status code.
1303 * @param pIoCtx I/O context to process.
1304 */
1305static int vdIoCtxProcessLocked(PVDIOCTX pIoCtx)
1306{
1307 int rc = VINF_SUCCESS;
1308
1309 VD_IS_LOCKED(pIoCtx->pDisk);
1310
1311 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
1312
1313 if (!vdIoCtxIsComplete(pIoCtx))
1314 {
1315 if (!vdIoCtxIsBlocked(pIoCtx))
1316 {
1317 if (pIoCtx->pfnIoCtxTransfer)
1318 {
1319 /* Call the transfer function advancing to the next while there is no error. */
1320 while ( pIoCtx->pfnIoCtxTransfer
1321 && !pIoCtx->cMetaTransfersPending
1322 && RT_SUCCESS(rc))
1323 {
1324 LogFlowFunc(("calling transfer function %#p\n", pIoCtx->pfnIoCtxTransfer));
1325 rc = pIoCtx->pfnIoCtxTransfer(pIoCtx);
1326
1327 /* Advance to the next part of the transfer if the current one succeeded. */
1328 if (RT_SUCCESS(rc))
1329 {
1330 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
1331 pIoCtx->pfnIoCtxTransferNext = NULL;
1332 }
1333 }
1334 }
1335
1336 if ( RT_SUCCESS(rc)
1337 && !pIoCtx->cMetaTransfersPending
1338 && !pIoCtx->cDataTransfersPending
1339 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
1340 rc = VINF_VD_ASYNC_IO_FINISHED;
1341 else if ( RT_SUCCESS(rc)
1342 || rc == VERR_VD_NOT_ENOUGH_METADATA
1343 || rc == VERR_VD_IOCTX_HALT)
1344 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1345 else if ( RT_FAILURE(rc)
1346 && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
1347 {
1348 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rc, VINF_SUCCESS);
1349
1350 /*
1351 * The I/O context completed if we have an error and there is no data
1352 * or meta data transfer pending.
1353 */
1354 if ( !pIoCtx->cMetaTransfersPending
1355 && !pIoCtx->cDataTransfersPending)
1356 rc = VINF_VD_ASYNC_IO_FINISHED;
1357 else
1358 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1359 }
1360 }
1361 else
1362 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1363 }
1364 else
1365 rc = VINF_VD_ASYNC_IO_FINISHED;
1366
1367 LogFlowFunc(("pIoCtx=%#p rc=%Rrc cDataTransfersPending=%u cMetaTransfersPending=%u fComplete=%RTbool\n",
1368 pIoCtx, rc, pIoCtx->cDataTransfersPending, pIoCtx->cMetaTransfersPending,
1369 pIoCtx->fComplete));
1370
1371 return rc;
1372}
1373
1374/**
1375 * Processes the list of waiting I/O contexts.
1376 *
1377 * @returns VBox status code, only valid if pIoCtxRc is not NULL, treat as void
1378 * function otherwise.
1379 * @param pDisk The disk structure.
1380 * @param pIoCtxRc An I/O context handle which waits on the list. When processed
1381 * The status code is returned. NULL if there is no I/O context
1382 * to return the status code for.
1383 */
1384static int vdDiskProcessWaitingIoCtx(PVDISK pDisk, PVDIOCTX pIoCtxRc)
1385{
1386 int rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1387
1388 LogFlowFunc(("pDisk=%#p pIoCtxRc=%#p\n", pDisk, pIoCtxRc));
1389
1390 VD_IS_LOCKED(pDisk);
1391
1392 /* Get the waiting list and process it in FIFO order. */
1393 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHead, NULL, PVDIOCTX);
1394
1395 /* Reverse it. */
1396 PVDIOCTX pCur = pIoCtxHead;
1397 pIoCtxHead = NULL;
1398 while (pCur)
1399 {
1400 PVDIOCTX pInsert = pCur;
1401 pCur = pCur->pIoCtxNext;
1402 pInsert->pIoCtxNext = pIoCtxHead;
1403 pIoCtxHead = pInsert;
1404 }
1405
1406 /* Process now. */
1407 pCur = pIoCtxHead;
1408 while (pCur)
1409 {
1410 int rcTmp;
1411 PVDIOCTX pTmp = pCur;
1412
1413 pCur = pCur->pIoCtxNext;
1414 pTmp->pIoCtxNext = NULL;
1415
1416 /*
1417 * Need to clear the sync flag here if there is a new I/O context
1418 * with it set and the context is not given in pIoCtxRc.
1419 * This happens most likely on a different thread and that one shouldn't
1420 * process the context synchronously.
1421 *
1422 * The thread who issued the context will wait on the event semaphore
1423 * anyway which is signalled when the completion handler is called.
1424 */
1425 if ( pTmp->fFlags & VDIOCTX_FLAGS_SYNC
1426 && pTmp != pIoCtxRc)
1427 pTmp->fFlags &= ~VDIOCTX_FLAGS_SYNC;
1428
1429 rcTmp = vdIoCtxProcessLocked(pTmp);
1430 if (pTmp == pIoCtxRc)
1431 {
1432 if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1433 && RT_SUCCESS(pTmp->rcReq)
1434 && pTmp->enmTxDir == VDIOCTXTXDIR_READ)
1435 {
1436 int rc2 = vdFilterChainApplyRead(pDisk, pTmp->Req.Io.uOffsetXferOrig,
1437 pTmp->Req.Io.cbXferOrig, pTmp);
1438 if (RT_FAILURE(rc2))
1439 rcTmp = rc2;
1440 }
1441
1442 /* The given I/O context was processed, pass the return code to the caller. */
1443 if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1444 && (pTmp->fFlags & VDIOCTX_FLAGS_SYNC))
1445 rc = pTmp->rcReq;
1446 else
1447 rc = rcTmp;
1448 }
1449 else if ( rcTmp == VINF_VD_ASYNC_IO_FINISHED
1450 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1451 {
1452 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1453 vdThreadFinishWrite(pDisk);
1454
1455 bool fFreeCtx = RT_BOOL(!(pTmp->fFlags & VDIOCTX_FLAGS_DONT_FREE));
1456 vdIoCtxRootComplete(pDisk, pTmp);
1457
1458 if (fFreeCtx)
1459 vdIoCtxFree(pDisk, pTmp);
1460 }
1461 }
1462
1463 LogFlowFunc(("returns rc=%Rrc\n", rc));
1464 return rc;
1465}
1466
1467/**
1468 * Processes the list of blocked I/O contexts.
1469 *
1470 * @returns nothing.
1471 * @param pDisk The disk structure.
1472 */
1473static void vdDiskProcessBlockedIoCtx(PVDISK pDisk)
1474{
1475 LogFlowFunc(("pDisk=%#p\n", pDisk));
1476
1477 VD_IS_LOCKED(pDisk);
1478
1479 /* Get the waiting list and process it in FIFO order. */
1480 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxBlockedHead, NULL, PVDIOCTX);
1481
1482 /* Reverse it. */
1483 PVDIOCTX pCur = pIoCtxHead;
1484 pIoCtxHead = NULL;
1485 while (pCur)
1486 {
1487 PVDIOCTX pInsert = pCur;
1488 pCur = pCur->pIoCtxNext;
1489 pInsert->pIoCtxNext = pIoCtxHead;
1490 pIoCtxHead = pInsert;
1491 }
1492
1493 /* Process now. */
1494 pCur = pIoCtxHead;
1495 while (pCur)
1496 {
1497 int rc;
1498 PVDIOCTX pTmp = pCur;
1499
1500 pCur = pCur->pIoCtxNext;
1501 pTmp->pIoCtxNext = NULL;
1502
1503 Assert(!pTmp->pIoCtxParent);
1504 Assert(pTmp->fFlags & VDIOCTX_FLAGS_BLOCKED);
1505 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
1506
1507 rc = vdIoCtxProcessLocked(pTmp);
1508 if ( rc == VINF_VD_ASYNC_IO_FINISHED
1509 && ASMAtomicCmpXchgBool(&pTmp->fComplete, true, false))
1510 {
1511 LogFlowFunc(("Waiting I/O context completed pTmp=%#p\n", pTmp));
1512 vdThreadFinishWrite(pDisk);
1513
1514 bool fFreeCtx = RT_BOOL(!(pTmp->fFlags & VDIOCTX_FLAGS_DONT_FREE));
1515 vdIoCtxRootComplete(pDisk, pTmp);
1516 if (fFreeCtx)
1517 vdIoCtxFree(pDisk, pTmp);
1518 }
1519 }
1520
1521 LogFlowFunc(("returns\n"));
1522}
1523
1524/**
1525 * Processes the I/O context trying to lock the criticial section.
1526 * The context is deferred if the critical section is busy.
1527 *
1528 * @returns VBox status code.
1529 * @param pIoCtx The I/O context to process.
1530 */
1531static int vdIoCtxProcessTryLockDefer(PVDIOCTX pIoCtx)
1532{
1533 int rc = VINF_SUCCESS;
1534 PVDISK pDisk = pIoCtx->pDisk;
1535
1536 Log(("Defer pIoCtx=%#p\n", pIoCtx));
1537
1538 /* Put it on the waiting list first. */
1539 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHead, pIoCtx);
1540
1541 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
1542 {
1543 /* Leave it again, the context will be processed just before leaving the lock. */
1544 LogFlowFunc(("Successfully acquired the lock\n"));
1545 rc = vdDiskUnlock(pDisk, pIoCtx);
1546 }
1547 else
1548 {
1549 LogFlowFunc(("Lock is held\n"));
1550 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1551 }
1552
1553 return rc;
1554}
1555
1556/**
1557 * Process the I/O context in a synchronous manner, waiting
1558 * for it to complete.
1559 *
1560 * @returns VBox status code of the completed request.
1561 * @param pIoCtx The sync I/O context.
1562 * @param hEventComplete Event sempahore to wait on for completion.
1563 */
1564static int vdIoCtxProcessSync(PVDIOCTX pIoCtx, RTSEMEVENT hEventComplete)
1565{
1566 int rc = VINF_SUCCESS;
1567 PVDISK pDisk = pIoCtx->pDisk;
1568
1569 LogFlowFunc(("pIoCtx=%p\n", pIoCtx));
1570
1571 AssertMsg(pIoCtx->fFlags & (VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE),
1572 ("I/O context is not marked as synchronous\n"));
1573
1574 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
1575 if (rc == VINF_VD_ASYNC_IO_FINISHED)
1576 rc = VINF_SUCCESS;
1577
1578 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1579 {
1580 rc = RTSemEventWait(hEventComplete, RT_INDEFINITE_WAIT);
1581 AssertRC(rc);
1582 }
1583
1584 rc = pIoCtx->rcReq;
1585 vdIoCtxFree(pDisk, pIoCtx);
1586
1587 return rc;
1588}
1589
1590DECLINLINE(bool) vdIoCtxIsDiskLockOwner(PVDISK pDisk, PVDIOCTX pIoCtx)
1591{
1592 return pDisk->pIoCtxLockOwner == pIoCtx;
1593}
1594
1595static int vdIoCtxLockDisk(PVDISK pDisk, PVDIOCTX pIoCtx)
1596{
1597 int rc = VINF_SUCCESS;
1598
1599 VD_IS_LOCKED(pDisk);
1600
1601 LogFlowFunc(("pDisk=%#p pIoCtx=%#p\n", pDisk, pIoCtx));
1602
1603 if (!ASMAtomicCmpXchgPtr(&pDisk->pIoCtxLockOwner, pIoCtx, NIL_VDIOCTX))
1604 {
1605 Assert(pDisk->pIoCtxLockOwner != pIoCtx); /* No nesting allowed. */
1606 vdIoCtxDefer(pDisk, pIoCtx);
1607 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
1608 }
1609
1610 LogFlowFunc(("returns -> %Rrc\n", rc));
1611 return rc;
1612}
1613
1614static void vdIoCtxUnlockDisk(PVDISK pDisk, PVDIOCTX pIoCtx, bool fProcessBlockedReqs)
1615{
1616 RT_NOREF1(pIoCtx);
1617 LogFlowFunc(("pDisk=%#p pIoCtx=%#p fProcessBlockedReqs=%RTbool\n",
1618 pDisk, pIoCtx, fProcessBlockedReqs));
1619
1620 VD_IS_LOCKED(pDisk);
1621
1622 LogFlow(("Unlocking disk lock owner is %#p\n", pDisk->pIoCtxLockOwner));
1623 Assert(pDisk->pIoCtxLockOwner == pIoCtx);
1624 ASMAtomicXchgPtrT(&pDisk->pIoCtxLockOwner, NIL_VDIOCTX, PVDIOCTX);
1625
1626 if (fProcessBlockedReqs)
1627 {
1628 /* Process any blocked writes if the current request didn't caused another growing. */
1629 vdDiskProcessBlockedIoCtx(pDisk);
1630 }
1631
1632 LogFlowFunc(("returns\n"));
1633}
1634
1635/**
1636 * Internal: Reads a given amount of data from the image chain of the disk.
1637 **/
1638static int vdDiskReadHelper(PVDISK pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1639 uint64_t uOffset, size_t cbRead, PVDIOCTX pIoCtx, size_t *pcbThisRead)
1640{
1641 RT_NOREF1(pDisk);
1642 int rc = VINF_SUCCESS;
1643 size_t cbThisRead = cbRead;
1644
1645 AssertPtr(pcbThisRead);
1646
1647 *pcbThisRead = 0;
1648
1649 /*
1650 * Try to read from the given image.
1651 * If the block is not allocated read from override chain if present.
1652 */
1653 rc = pImage->Backend->pfnRead(pImage->pBackendData,
1654 uOffset, cbThisRead, pIoCtx,
1655 &cbThisRead);
1656
1657 if (rc == VERR_VD_BLOCK_FREE)
1658 {
1659 for (PVDIMAGE pCurrImage = pImageParentOverride ? pImageParentOverride : pImage->pPrev;
1660 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
1661 pCurrImage = pCurrImage->pPrev)
1662 {
1663 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1664 uOffset, cbThisRead, pIoCtx,
1665 &cbThisRead);
1666 }
1667 }
1668
1669 if (RT_SUCCESS(rc) || rc == VERR_VD_BLOCK_FREE)
1670 *pcbThisRead = cbThisRead;
1671
1672 return rc;
1673}
1674
1675/**
1676 * internal: read the specified amount of data in whatever blocks the backend
1677 * will give us - async version.
1678 */
1679static DECLCALLBACK(int) vdReadHelperAsync(PVDIOCTX pIoCtx)
1680{
1681 int rc;
1682 PVDISK pDisk = pIoCtx->pDisk;
1683 size_t cbToRead = pIoCtx->Req.Io.cbTransfer;
1684 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
1685 PVDIMAGE pCurrImage = pIoCtx->Req.Io.pImageCur;
1686 PVDIMAGE pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
1687 unsigned cImagesRead = pIoCtx->Req.Io.cImagesRead;
1688 size_t cbThisRead;
1689
1690 /*
1691 * Check whether there is a full block write in progress which was not allocated.
1692 * Defer I/O if the range interferes but only if it does not belong to the
1693 * write doing the allocation.
1694 */
1695 if ( pDisk->pIoCtxLockOwner != NIL_VDIOCTX
1696 && uOffset >= pDisk->uOffsetStartLocked
1697 && uOffset < pDisk->uOffsetEndLocked
1698 && ( !pIoCtx->pIoCtxParent
1699 || pIoCtx->pIoCtxParent != pDisk->pIoCtxLockOwner))
1700 {
1701 Log(("Interferring read while allocating a new block => deferring read\n"));
1702 vdIoCtxDefer(pDisk, pIoCtx);
1703 return VERR_VD_ASYNC_IO_IN_PROGRESS;
1704 }
1705
1706 /* Loop until all reads started or we have a backend which needs to read metadata. */
1707 do
1708 {
1709 /* Search for image with allocated block. Do not attempt to read more
1710 * than the previous reads marked as valid. Otherwise this would return
1711 * stale data when different block sizes are used for the images. */
1712 cbThisRead = cbToRead;
1713
1714 if ( pDisk->pCache
1715 && !pImageParentOverride)
1716 {
1717 rc = vdCacheReadHelper(pDisk->pCache, uOffset, cbThisRead,
1718 pIoCtx, &cbThisRead);
1719 if (rc == VERR_VD_BLOCK_FREE)
1720 {
1721 rc = vdDiskReadHelper(pDisk, pCurrImage, NULL, uOffset, cbThisRead,
1722 pIoCtx, &cbThisRead);
1723
1724 /* If the read was successful, write the data back into the cache. */
1725 if ( RT_SUCCESS(rc)
1726 && pIoCtx->fFlags & VDIOCTX_FLAGS_READ_UPDATE_CACHE)
1727 {
1728 rc = vdCacheWriteHelper(pDisk->pCache, uOffset, cbThisRead,
1729 pIoCtx, NULL);
1730 }
1731 }
1732 }
1733 else
1734 {
1735 /*
1736 * Try to read from the given image.
1737 * If the block is not allocated read from override chain if present.
1738 */
1739 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1740 uOffset, cbThisRead, pIoCtx,
1741 &cbThisRead);
1742
1743 if ( rc == VERR_VD_BLOCK_FREE
1744 && cImagesRead != 1)
1745 {
1746 unsigned cImagesToProcess = cImagesRead;
1747
1748 pCurrImage = pImageParentOverride ? pImageParentOverride : pCurrImage->pPrev;
1749 pIoCtx->Req.Io.pImageParentOverride = NULL;
1750
1751 while (pCurrImage && rc == VERR_VD_BLOCK_FREE)
1752 {
1753 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
1754 uOffset, cbThisRead,
1755 pIoCtx, &cbThisRead);
1756 if (cImagesToProcess == 1)
1757 break;
1758 else if (cImagesToProcess > 0)
1759 cImagesToProcess--;
1760
1761 if (rc == VERR_VD_BLOCK_FREE)
1762 pCurrImage = pCurrImage->pPrev;
1763 }
1764 }
1765 }
1766
1767 /* The task state will be updated on success already, don't do it here!. */
1768 if (rc == VERR_VD_BLOCK_FREE)
1769 {
1770 /* No image in the chain contains the data for the block. */
1771 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisRead); Assert(cbThisRead == (uint32_t)cbThisRead);
1772
1773 /* Fill the free space with 0 if we are told to do so
1774 * or a previous read returned valid data. */
1775 if (pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS)
1776 vdIoCtxSet(pIoCtx, '\0', cbThisRead);
1777 else
1778 pIoCtx->Req.Io.cbBufClear += cbThisRead;
1779
1780 if (pIoCtx->Req.Io.pImageCur->uOpenFlags & VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS)
1781 rc = VINF_VD_NEW_ZEROED_BLOCK;
1782 else
1783 rc = VINF_SUCCESS;
1784 }
1785 else if (rc == VERR_VD_IOCTX_HALT)
1786 {
1787 uOffset += cbThisRead;
1788 cbToRead -= cbThisRead;
1789 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
1790 }
1791 else if ( RT_SUCCESS(rc)
1792 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
1793 {
1794 /* First not free block, fill the space before with 0. */
1795 if ( pIoCtx->Req.Io.cbBufClear
1796 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
1797 {
1798 RTSGBUF SgBuf;
1799 RTSgBufClone(&SgBuf, &pIoCtx->Req.Io.SgBuf);
1800 RTSgBufReset(&SgBuf);
1801 RTSgBufSet(&SgBuf, 0, pIoCtx->Req.Io.cbBufClear);
1802 pIoCtx->Req.Io.cbBufClear = 0;
1803 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
1804 }
1805 rc = VINF_SUCCESS;
1806 }
1807
1808 if (RT_FAILURE(rc))
1809 break;
1810
1811 cbToRead -= cbThisRead;
1812 uOffset += cbThisRead;
1813 pCurrImage = pIoCtx->Req.Io.pImageStart; /* Start with the highest image in the chain. */
1814 } while (cbToRead != 0 && RT_SUCCESS(rc));
1815
1816 if ( rc == VERR_VD_NOT_ENOUGH_METADATA
1817 || rc == VERR_VD_IOCTX_HALT)
1818 {
1819 /* Save the current state. */
1820 pIoCtx->Req.Io.uOffset = uOffset;
1821 pIoCtx->Req.Io.cbTransfer = cbToRead;
1822 pIoCtx->Req.Io.pImageCur = pCurrImage ? pCurrImage : pIoCtx->Req.Io.pImageStart;
1823 }
1824
1825 return (!(pIoCtx->fFlags & VDIOCTX_FLAGS_ZERO_FREE_BLOCKS))
1826 ? VERR_VD_BLOCK_FREE
1827 : rc;
1828}
1829
1830/**
1831 * internal: parent image read wrapper for compacting.
1832 */
1833static DECLCALLBACK(int) vdParentRead(void *pvUser, uint64_t uOffset, void *pvBuf,
1834 size_t cbRead)
1835{
1836 PVDPARENTSTATEDESC pParentState = (PVDPARENTSTATEDESC)pvUser;
1837
1838 /** @todo
1839 * Only used for compaction so far which is not possible to mix with async I/O.
1840 * Needs to be changed if we want to support online compaction of images.
1841 */
1842 bool fLocked = ASMAtomicXchgBool(&pParentState->pDisk->fLocked, true);
1843 AssertMsgReturn(!fLocked,
1844 ("Calling synchronous parent read while another thread holds the disk lock\n"),
1845 VERR_VD_INVALID_STATE);
1846
1847 /* Fake an I/O context. */
1848 RTSGSEG Segment;
1849 RTSGBUF SgBuf;
1850 VDIOCTX IoCtx;
1851
1852 Segment.pvSeg = pvBuf;
1853 Segment.cbSeg = cbRead;
1854 RTSgBufInit(&SgBuf, &Segment, 1);
1855 vdIoCtxInit(&IoCtx, pParentState->pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pParentState->pImage,
1856 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
1857 int rc = vdReadHelperAsync(&IoCtx);
1858 ASMAtomicXchgBool(&pParentState->pDisk->fLocked, false);
1859 return rc;
1860}
1861
1862/**
1863 * Extended version of vdReadHelper(), implementing certain optimizations
1864 * for image cloning.
1865 *
1866 * @returns VBox status code.
1867 * @param pDisk The disk to read from.
1868 * @param pImage The image to start reading from.
1869 * @param pImageParentOverride The parent image to read from
1870 * if the starting image returns a free block.
1871 * If NULL is passed the real parent of the image
1872 * in the chain is used.
1873 * @param uOffset Offset in the disk to start reading from.
1874 * @param pvBuf Where to store the read data.
1875 * @param cbRead How much to read.
1876 * @param fZeroFreeBlocks Flag whether free blocks should be zeroed.
1877 * If false and no image has data for sepcified
1878 * range VERR_VD_BLOCK_FREE is returned.
1879 * Note that unallocated blocks are still zeroed
1880 * if at least one image has valid data for a part
1881 * of the range.
1882 * @param fUpdateCache Flag whether to update the attached cache if
1883 * available.
1884 * @param cImagesRead Number of images in the chain to read until
1885 * the read is cut off. A value of 0 disables the cut off.
1886 */
1887static int vdReadHelperEx(PVDISK pDisk, PVDIMAGE pImage, PVDIMAGE pImageParentOverride,
1888 uint64_t uOffset, void *pvBuf, size_t cbRead,
1889 bool fZeroFreeBlocks, bool fUpdateCache, unsigned cImagesRead)
1890{
1891 int rc = VINF_SUCCESS;
1892 uint32_t fFlags = VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
1893 RTSGSEG Segment;
1894 RTSGBUF SgBuf;
1895 VDIOCTX IoCtx;
1896 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
1897
1898 rc = RTSemEventCreate(&hEventComplete);
1899 if (RT_FAILURE(rc))
1900 return rc;
1901
1902 if (fZeroFreeBlocks)
1903 fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
1904 if (fUpdateCache)
1905 fFlags |= VDIOCTX_FLAGS_READ_UPDATE_CACHE;
1906
1907 Segment.pvSeg = pvBuf;
1908 Segment.cbSeg = cbRead;
1909 RTSgBufInit(&SgBuf, &Segment, 1);
1910 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, uOffset, cbRead, pImage, &SgBuf,
1911 NULL, vdReadHelperAsync, fFlags);
1912
1913 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
1914 IoCtx.Req.Io.cImagesRead = cImagesRead;
1915 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
1916 IoCtx.Type.Root.pvUser1 = pDisk;
1917 IoCtx.Type.Root.pvUser2 = hEventComplete;
1918 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
1919 RTSemEventDestroy(hEventComplete);
1920 return rc;
1921}
1922
1923/**
1924 * internal: read the specified amount of data in whatever blocks the backend
1925 * will give us.
1926 */
1927static int vdReadHelper(PVDISK pDisk, PVDIMAGE pImage, uint64_t uOffset,
1928 void *pvBuf, size_t cbRead, bool fUpdateCache)
1929{
1930 return vdReadHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbRead,
1931 true /* fZeroFreeBlocks */, fUpdateCache, 0);
1932}
1933
1934/**
1935 * internal: mark the disk as not modified.
1936 */
1937static void vdResetModifiedFlag(PVDISK pDisk)
1938{
1939 if (pDisk->uModified & VD_IMAGE_MODIFIED_FLAG)
1940 {
1941 /* generate new last-modified uuid */
1942 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
1943 {
1944 RTUUID Uuid;
1945
1946 RTUuidCreate(&Uuid);
1947 pDisk->pLast->Backend->pfnSetModificationUuid(pDisk->pLast->pBackendData,
1948 &Uuid);
1949
1950 if (pDisk->pCache)
1951 pDisk->pCache->Backend->pfnSetModificationUuid(pDisk->pCache->pBackendData,
1952 &Uuid);
1953 }
1954
1955 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FLAG;
1956 }
1957}
1958
1959/**
1960 * internal: mark the disk as modified.
1961 */
1962static void vdSetModifiedFlag(PVDISK pDisk)
1963{
1964 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
1965 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
1966 {
1967 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
1968
1969 /* First modify, so create a UUID and ensure it's written to disk. */
1970 vdResetModifiedFlag(pDisk);
1971
1972 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
1973 {
1974 VDIOCTX IoCtx;
1975 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, NULL,
1976 NULL, NULL, NULL, VDIOCTX_FLAGS_SYNC);
1977 pDisk->pLast->Backend->pfnFlush(pDisk->pLast->pBackendData, &IoCtx);
1978 }
1979 }
1980}
1981
1982/**
1983 * internal: write buffer to the image, taking care of block boundaries and
1984 * write optimizations.
1985 */
1986static int vdWriteHelperEx(PVDISK pDisk, PVDIMAGE pImage,
1987 PVDIMAGE pImageParentOverride, uint64_t uOffset,
1988 const void *pvBuf, size_t cbWrite,
1989 uint32_t fFlags, unsigned cImagesRead)
1990{
1991 int rc = VINF_SUCCESS;
1992 RTSGSEG Segment;
1993 RTSGBUF SgBuf;
1994 VDIOCTX IoCtx;
1995 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
1996
1997 rc = RTSemEventCreate(&hEventComplete);
1998 if (RT_FAILURE(rc))
1999 return rc;
2000
2001 fFlags |= VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE;
2002
2003 Segment.pvSeg = (void *)pvBuf;
2004 Segment.cbSeg = cbWrite;
2005 RTSgBufInit(&SgBuf, &Segment, 1);
2006 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_WRITE, uOffset, cbWrite, pImage, &SgBuf,
2007 NULL, vdWriteHelperAsync, fFlags);
2008
2009 IoCtx.Req.Io.pImageParentOverride = pImageParentOverride;
2010 IoCtx.Req.Io.cImagesRead = cImagesRead;
2011 IoCtx.pIoCtxParent = NULL;
2012 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
2013 IoCtx.Type.Root.pvUser1 = pDisk;
2014 IoCtx.Type.Root.pvUser2 = hEventComplete;
2015 if (RT_SUCCESS(rc))
2016 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
2017
2018 RTSemEventDestroy(hEventComplete);
2019 return rc;
2020}
2021
2022/**
2023 * internal: write buffer to the image, taking care of block boundaries and
2024 * write optimizations.
2025 */
2026static int vdWriteHelper(PVDISK pDisk, PVDIMAGE pImage, uint64_t uOffset,
2027 const void *pvBuf, size_t cbWrite, uint32_t fFlags)
2028{
2029 return vdWriteHelperEx(pDisk, pImage, NULL, uOffset, pvBuf, cbWrite,
2030 fFlags, 0);
2031}
2032
2033/**
2034 * Internal: Copies the content of one disk to another one applying optimizations
2035 * to speed up the copy process if possible.
2036 */
2037static int vdCopyHelper(PVDISK pDiskFrom, PVDIMAGE pImageFrom, PVDISK pDiskTo,
2038 uint64_t cbSize, unsigned cImagesFromRead, unsigned cImagesToRead,
2039 bool fSuppressRedundantIo, PVDINTERFACEPROGRESS pIfProgress,
2040 PVDINTERFACEPROGRESS pDstIfProgress)
2041{
2042 int rc = VINF_SUCCESS;
2043 int rc2;
2044 uint64_t uOffset = 0;
2045 uint64_t cbRemaining = cbSize;
2046 void *pvBuf = NULL;
2047 bool fLockReadFrom = false;
2048 bool fLockWriteTo = false;
2049 bool fBlockwiseCopy = false;
2050 unsigned uProgressOld = 0;
2051
2052 LogFlowFunc(("pDiskFrom=%#p pImageFrom=%#p pDiskTo=%#p cbSize=%llu cImagesFromRead=%u cImagesToRead=%u fSuppressRedundantIo=%RTbool pIfProgress=%#p pDstIfProgress=%#p\n",
2053 pDiskFrom, pImageFrom, pDiskTo, cbSize, cImagesFromRead, cImagesToRead, fSuppressRedundantIo, pDstIfProgress, pDstIfProgress));
2054
2055 if ( (fSuppressRedundantIo || (cImagesFromRead > 0))
2056 && RTListIsEmpty(&pDiskFrom->ListFilterChainRead))
2057 fBlockwiseCopy = true;
2058
2059 /* Allocate tmp buffer. */
2060 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
2061 if (!pvBuf)
2062 return rc;
2063
2064 do
2065 {
2066 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
2067
2068 /* Note that we don't attempt to synchronize cross-disk accesses.
2069 * It wouldn't be very difficult to do, just the lock order would
2070 * need to be defined somehow to prevent deadlocks. Postpone such
2071 * magic as there is no use case for this. */
2072
2073 rc2 = vdThreadStartRead(pDiskFrom);
2074 AssertRC(rc2);
2075 fLockReadFrom = true;
2076
2077 if (fBlockwiseCopy)
2078 {
2079 RTSGSEG SegmentBuf;
2080 RTSGBUF SgBuf;
2081 VDIOCTX IoCtx;
2082
2083 SegmentBuf.pvSeg = pvBuf;
2084 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
2085 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
2086 vdIoCtxInit(&IoCtx, pDiskFrom, VDIOCTXTXDIR_READ, 0, 0, NULL,
2087 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
2088
2089 /* Read the source data. */
2090 rc = pImageFrom->Backend->pfnRead(pImageFrom->pBackendData,
2091 uOffset, cbThisRead, &IoCtx,
2092 &cbThisRead);
2093
2094 if ( rc == VERR_VD_BLOCK_FREE
2095 && cImagesFromRead != 1)
2096 {
2097 unsigned cImagesToProcess = cImagesFromRead;
2098
2099 for (PVDIMAGE pCurrImage = pImageFrom->pPrev;
2100 pCurrImage != NULL && rc == VERR_VD_BLOCK_FREE;
2101 pCurrImage = pCurrImage->pPrev)
2102 {
2103 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
2104 uOffset, cbThisRead,
2105 &IoCtx, &cbThisRead);
2106 if (cImagesToProcess == 1)
2107 break;
2108 else if (cImagesToProcess > 0)
2109 cImagesToProcess--;
2110 }
2111 }
2112 }
2113 else
2114 rc = vdReadHelper(pDiskFrom, pImageFrom, uOffset, pvBuf, cbThisRead,
2115 false /* fUpdateCache */);
2116
2117 if (RT_FAILURE(rc) && rc != VERR_VD_BLOCK_FREE)
2118 break;
2119
2120 rc2 = vdThreadFinishRead(pDiskFrom);
2121 AssertRC(rc2);
2122 fLockReadFrom = false;
2123
2124 if (rc != VERR_VD_BLOCK_FREE)
2125 {
2126 rc2 = vdThreadStartWrite(pDiskTo);
2127 AssertRC(rc2);
2128 fLockWriteTo = true;
2129
2130 /* Only do collapsed I/O if we are copying the data blockwise. */
2131 rc = vdWriteHelperEx(pDiskTo, pDiskTo->pLast, NULL, uOffset, pvBuf,
2132 cbThisRead, VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG /* fFlags */,
2133 fBlockwiseCopy ? cImagesToRead : 0);
2134 if (RT_FAILURE(rc))
2135 break;
2136
2137 rc2 = vdThreadFinishWrite(pDiskTo);
2138 AssertRC(rc2);
2139 fLockWriteTo = false;
2140 }
2141 else /* Don't propagate the error to the outside */
2142 rc = VINF_SUCCESS;
2143
2144 uOffset += cbThisRead;
2145 cbRemaining -= cbThisRead;
2146
2147 unsigned uProgressNew = uOffset * 99 / cbSize;
2148 if (uProgressNew != uProgressOld)
2149 {
2150 uProgressOld = uProgressNew;
2151
2152 if (pIfProgress && pIfProgress->pfnProgress)
2153 {
2154 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
2155 uProgressOld);
2156 if (RT_FAILURE(rc))
2157 break;
2158 }
2159 if (pDstIfProgress && pDstIfProgress->pfnProgress)
2160 {
2161 rc = pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser,
2162 uProgressOld);
2163 if (RT_FAILURE(rc))
2164 break;
2165 }
2166 }
2167 } while (uOffset < cbSize);
2168
2169 RTMemFree(pvBuf);
2170
2171 if (fLockReadFrom)
2172 {
2173 rc2 = vdThreadFinishRead(pDiskFrom);
2174 AssertRC(rc2);
2175 }
2176
2177 if (fLockWriteTo)
2178 {
2179 rc2 = vdThreadFinishWrite(pDiskTo);
2180 AssertRC(rc2);
2181 }
2182
2183 LogFlowFunc(("returns rc=%Rrc\n", rc));
2184 return rc;
2185}
2186
2187/**
2188 * Flush helper async version.
2189 */
2190static DECLCALLBACK(int) vdSetModifiedHelperAsync(PVDIOCTX pIoCtx)
2191{
2192 int rc = VINF_SUCCESS;
2193 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2194
2195 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2196 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2197 rc = VINF_SUCCESS;
2198
2199 return rc;
2200}
2201
2202/**
2203 * internal: mark the disk as modified - async version.
2204 */
2205static int vdSetModifiedFlagAsync(PVDISK pDisk, PVDIOCTX pIoCtx)
2206{
2207 int rc = VINF_SUCCESS;
2208
2209 VD_IS_LOCKED(pDisk);
2210
2211 pDisk->uModified |= VD_IMAGE_MODIFIED_FLAG;
2212 if (pDisk->uModified & VD_IMAGE_MODIFIED_FIRST)
2213 {
2214 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2215 if (RT_SUCCESS(rc))
2216 {
2217 pDisk->uModified &= ~VD_IMAGE_MODIFIED_FIRST;
2218
2219 /* First modify, so create a UUID and ensure it's written to disk. */
2220 vdResetModifiedFlag(pDisk);
2221
2222 if (!(pDisk->uModified & VD_IMAGE_MODIFIED_DISABLE_UUID_UPDATE))
2223 {
2224 PVDIOCTX pIoCtxFlush = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_FLUSH,
2225 0, 0, pDisk->pLast,
2226 NULL, pIoCtx, 0, 0, NULL,
2227 vdSetModifiedHelperAsync);
2228
2229 if (pIoCtxFlush)
2230 {
2231 rc = vdIoCtxProcessLocked(pIoCtxFlush);
2232 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2233 {
2234 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs */);
2235 vdIoCtxFree(pDisk, pIoCtxFlush);
2236 }
2237 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2238 {
2239 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2240 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2241 }
2242 else /* Another error */
2243 vdIoCtxFree(pDisk, pIoCtxFlush);
2244 }
2245 else
2246 rc = VERR_NO_MEMORY;
2247 }
2248 }
2249 }
2250
2251 return rc;
2252}
2253
2254static DECLCALLBACK(int) vdWriteHelperCommitAsync(PVDIOCTX pIoCtx)
2255{
2256 int rc = VINF_SUCCESS;
2257 PVDIMAGE pImage = pIoCtx->Req.Io.pImageStart;
2258 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2259 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2260 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2261
2262 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2263 rc = pImage->Backend->pfnWrite(pImage->pBackendData,
2264 pIoCtx->Req.Io.uOffset - cbPreRead,
2265 cbPreRead + cbThisWrite + cbPostRead,
2266 pIoCtx, NULL, &cbPreRead, &cbPostRead, 0);
2267 Assert(rc != VERR_VD_BLOCK_FREE);
2268 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPreRead == 0);
2269 Assert(rc == VERR_VD_NOT_ENOUGH_METADATA || cbPostRead == 0);
2270 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2271 rc = VINF_SUCCESS;
2272 else if (rc == VERR_VD_IOCTX_HALT)
2273 {
2274 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2275 rc = VINF_SUCCESS;
2276 }
2277
2278 LogFlowFunc(("returns rc=%Rrc\n", rc));
2279 return rc;
2280}
2281
2282static DECLCALLBACK(int) vdWriteHelperOptimizedCmpAndWriteAsync(PVDIOCTX pIoCtx)
2283{
2284 int rc = VINF_SUCCESS;
2285 size_t cbThisWrite = 0;
2286 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2287 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2288 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2289 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2290 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2291 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2292
2293 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2294
2295 AssertPtr(pIoCtxParent);
2296 Assert(!pIoCtxParent->pIoCtxParent);
2297 Assert(!pIoCtx->Req.Io.cbTransferLeft && !pIoCtx->cMetaTransfersPending);
2298
2299 vdIoCtxChildReset(pIoCtx);
2300 cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2301 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2302
2303 /* Check if the write would modify anything in this block. */
2304 if (!RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &pIoCtxParent->Req.Io.SgBuf, cbThisWrite))
2305 {
2306 RTSGBUF SgBufSrcTmp;
2307
2308 RTSgBufClone(&SgBufSrcTmp, &pIoCtxParent->Req.Io.SgBuf);
2309 RTSgBufAdvance(&SgBufSrcTmp, cbThisWrite);
2310 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbThisWrite);
2311
2312 if (!cbWriteCopy || !RTSgBufCmp(&pIoCtx->Req.Io.SgBuf, &SgBufSrcTmp, cbWriteCopy))
2313 {
2314 /* Block is completely unchanged, so no need to write anything. */
2315 LogFlowFunc(("Block didn't changed\n"));
2316 ASMAtomicWriteU32(&pIoCtx->Req.Io.cbTransferLeft, 0);
2317 RTSgBufAdvance(&pIoCtxParent->Req.Io.SgBuf, cbThisWrite);
2318 return VINF_VD_ASYNC_IO_FINISHED;
2319 }
2320 }
2321
2322 /* Copy the data to the right place in the buffer. */
2323 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2324 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbPreRead);
2325 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2326
2327 /* Handle the data that goes after the write to fill the block. */
2328 if (cbPostRead)
2329 {
2330 /* Now assemble the remaining data. */
2331 if (cbWriteCopy)
2332 {
2333 /*
2334 * The S/G buffer of the parent needs to be cloned because
2335 * it is not allowed to modify the state.
2336 */
2337 RTSGBUF SgBufParentTmp;
2338
2339 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2340 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2341 }
2342
2343 /* Zero out the remainder of this block. Will never be visible, as this
2344 * is beyond the limit of the image. */
2345 if (cbFill)
2346 {
2347 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbReadImage);
2348 vdIoCtxSet(pIoCtx, '\0', cbFill);
2349 }
2350 }
2351
2352 /* Write the full block to the virtual disk. */
2353 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2354 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2355
2356 return rc;
2357}
2358
2359static DECLCALLBACK(int) vdWriteHelperOptimizedPreReadAsync(PVDIOCTX pIoCtx)
2360{
2361 int rc = VINF_SUCCESS;
2362
2363 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2364
2365 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2366
2367 if ( pIoCtx->Req.Io.cbTransferLeft
2368 && !pIoCtx->cDataTransfersPending)
2369 rc = vdReadHelperAsync(pIoCtx);
2370
2371 if ( ( RT_SUCCESS(rc)
2372 || (rc == VERR_VD_ASYNC_IO_IN_PROGRESS))
2373 && ( pIoCtx->Req.Io.cbTransferLeft
2374 || pIoCtx->cMetaTransfersPending))
2375 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2376 else
2377 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedCmpAndWriteAsync;
2378
2379 return rc;
2380}
2381
2382/**
2383 * internal: write a complete block (only used for diff images), taking the
2384 * remaining data from parent images. This implementation optimizes out writes
2385 * that do not change the data relative to the state as of the parent images.
2386 * All backends which support differential/growing images support this - async version.
2387 */
2388static DECLCALLBACK(int) vdWriteHelperOptimizedAsync(PVDIOCTX pIoCtx)
2389{
2390 PVDISK pDisk = pIoCtx->pDisk;
2391 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2392 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2393 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2394 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2395 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2396 size_t cbFill = 0;
2397 size_t cbWriteCopy = 0;
2398 size_t cbReadImage = 0;
2399
2400 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2401
2402 AssertPtr(pIoCtx->pIoCtxParent);
2403 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2404
2405 if (cbPostRead)
2406 {
2407 /* Figure out how much we cannot read from the image, because
2408 * the last block to write might exceed the nominal size of the
2409 * image for technical reasons. */
2410 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2411 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2412
2413 /* If we have data to be written, use that instead of reading
2414 * data from the image. */
2415 if (cbWrite > cbThisWrite)
2416 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2417
2418 /* The rest must be read from the image. */
2419 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2420 }
2421
2422 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2423 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2424 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2425
2426 /* Read the entire data of the block so that we can compare whether it will
2427 * be modified by the write or not. */
2428 size_t cbTmp = cbPreRead + cbThisWrite + cbPostRead - cbFill; Assert(cbTmp == (uint32_t)cbTmp);
2429 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbTmp;
2430 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2431 pIoCtx->Req.Io.uOffset -= cbPreRead;
2432
2433 /* Next step */
2434 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperOptimizedPreReadAsync;
2435 return VINF_SUCCESS;
2436}
2437
2438static DECLCALLBACK(int) vdWriteHelperStandardReadImageAsync(PVDIOCTX pIoCtx)
2439{
2440 int rc = VINF_SUCCESS;
2441
2442 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2443
2444 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2445
2446 if ( pIoCtx->Req.Io.cbTransferLeft
2447 && !pIoCtx->cDataTransfersPending)
2448 rc = vdReadHelperAsync(pIoCtx);
2449
2450 if ( RT_SUCCESS(rc)
2451 && ( pIoCtx->Req.Io.cbTransferLeft
2452 || pIoCtx->cMetaTransfersPending))
2453 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2454 else
2455 {
2456 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2457
2458 /* Zero out the remainder of this block. Will never be visible, as this
2459 * is beyond the limit of the image. */
2460 if (cbFill)
2461 vdIoCtxSet(pIoCtx, '\0', cbFill);
2462
2463 /* Write the full block to the virtual disk. */
2464 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2465
2466 vdIoCtxChildReset(pIoCtx);
2467 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2468 }
2469
2470 return rc;
2471}
2472
2473static DECLCALLBACK(int) vdWriteHelperStandardAssemble(PVDIOCTX pIoCtx)
2474{
2475 int rc = VINF_SUCCESS;
2476 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2477 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2478 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
2479
2480 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2481
2482 vdIoCtxCopy(pIoCtx, pIoCtxParent, cbThisWrite);
2483 if (cbPostRead)
2484 {
2485 size_t cbFill = pIoCtx->Type.Child.Write.Optimized.cbFill;
2486 size_t cbWriteCopy = pIoCtx->Type.Child.Write.Optimized.cbWriteCopy;
2487 size_t cbReadImage = pIoCtx->Type.Child.Write.Optimized.cbReadImage;
2488
2489 /* Now assemble the remaining data. */
2490 if (cbWriteCopy)
2491 {
2492 /*
2493 * The S/G buffer of the parent needs to be cloned because
2494 * it is not allowed to modify the state.
2495 */
2496 RTSGBUF SgBufParentTmp;
2497
2498 RTSgBufClone(&SgBufParentTmp, &pIoCtxParent->Req.Io.SgBuf);
2499 RTSgBufCopy(&pIoCtx->Req.Io.SgBuf, &SgBufParentTmp, cbWriteCopy);
2500 }
2501
2502 if (cbReadImage)
2503 {
2504 /* Read remaining data. */
2505 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardReadImageAsync;
2506
2507 /* Read the data that goes before the write to fill the block. */
2508 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbReadImage; Assert(cbReadImage == (uint32_t)cbReadImage);
2509 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2510 pIoCtx->Req.Io.uOffset += cbWriteCopy;
2511 }
2512 else
2513 {
2514 /* Zero out the remainder of this block. Will never be visible, as this
2515 * is beyond the limit of the image. */
2516 if (cbFill)
2517 vdIoCtxSet(pIoCtx, '\0', cbFill);
2518
2519 /* Write the full block to the virtual disk. */
2520 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2521 vdIoCtxChildReset(pIoCtx);
2522 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2523 }
2524 }
2525 else
2526 {
2527 /* Write the full block to the virtual disk. */
2528 RTSgBufReset(&pIoCtx->Req.Io.SgBuf);
2529 vdIoCtxChildReset(pIoCtx);
2530 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperCommitAsync;
2531 }
2532
2533 return rc;
2534}
2535
2536static DECLCALLBACK(int) vdWriteHelperStandardPreReadAsync(PVDIOCTX pIoCtx)
2537{
2538 int rc = VINF_SUCCESS;
2539
2540 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2541
2542 pIoCtx->fFlags |= VDIOCTX_FLAGS_ZERO_FREE_BLOCKS;
2543
2544 if ( pIoCtx->Req.Io.cbTransferLeft
2545 && !pIoCtx->cDataTransfersPending)
2546 rc = vdReadHelperAsync(pIoCtx);
2547
2548 if ( RT_SUCCESS(rc)
2549 && ( pIoCtx->Req.Io.cbTransferLeft
2550 || pIoCtx->cMetaTransfersPending))
2551 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2552 else
2553 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2554
2555 return rc;
2556}
2557
2558static DECLCALLBACK(int) vdWriteHelperStandardAsync(PVDIOCTX pIoCtx)
2559{
2560 PVDISK pDisk = pIoCtx->pDisk;
2561 uint64_t uOffset = pIoCtx->Type.Child.uOffsetSaved;
2562 size_t cbThisWrite = pIoCtx->Type.Child.cbTransferParent;
2563 size_t cbPreRead = pIoCtx->Type.Child.cbPreRead;
2564 size_t cbPostRead = pIoCtx->Type.Child.cbPostRead;
2565 size_t cbWrite = pIoCtx->Type.Child.cbWriteParent;
2566 size_t cbFill = 0;
2567 size_t cbWriteCopy = 0;
2568 size_t cbReadImage = 0;
2569
2570 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2571
2572 AssertPtr(pIoCtx->pIoCtxParent);
2573 Assert(!pIoCtx->pIoCtxParent->pIoCtxParent);
2574
2575 /* Calculate the amount of data to read that goes after the write to fill the block. */
2576 if (cbPostRead)
2577 {
2578 /* If we have data to be written, use that instead of reading
2579 * data from the image. */
2580 if (cbWrite > cbThisWrite)
2581 cbWriteCopy = RT_MIN(cbWrite - cbThisWrite, cbPostRead);
2582 else
2583 cbWriteCopy = 0;
2584
2585 /* Figure out how much we cannot read from the image, because
2586 * the last block to write might exceed the nominal size of the
2587 * image for technical reasons. */
2588 if (uOffset + cbThisWrite + cbPostRead > pDisk->cbSize)
2589 cbFill = uOffset + cbThisWrite + cbPostRead - pDisk->cbSize;
2590
2591 /* The rest must be read from the image. */
2592 cbReadImage = cbPostRead - cbWriteCopy - cbFill;
2593 }
2594
2595 pIoCtx->Type.Child.Write.Optimized.cbFill = cbFill;
2596 pIoCtx->Type.Child.Write.Optimized.cbWriteCopy = cbWriteCopy;
2597 pIoCtx->Type.Child.Write.Optimized.cbReadImage = cbReadImage;
2598
2599 /* Next step */
2600 if (cbPreRead)
2601 {
2602 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardPreReadAsync;
2603
2604 /* Read the data that goes before the write to fill the block. */
2605 pIoCtx->Req.Io.cbTransferLeft = (uint32_t)cbPreRead; Assert(cbPreRead == (uint32_t)cbPreRead);
2606 pIoCtx->Req.Io.cbTransfer = pIoCtx->Req.Io.cbTransferLeft;
2607 pIoCtx->Req.Io.uOffset -= cbPreRead;
2608 }
2609 else
2610 pIoCtx->pfnIoCtxTransferNext = vdWriteHelperStandardAssemble;
2611
2612 return VINF_SUCCESS;
2613}
2614
2615/**
2616 * internal: write buffer to the image, taking care of block boundaries and
2617 * write optimizations - async version.
2618 */
2619static DECLCALLBACK(int) vdWriteHelperAsync(PVDIOCTX pIoCtx)
2620{
2621 int rc;
2622 size_t cbWrite = pIoCtx->Req.Io.cbTransfer;
2623 uint64_t uOffset = pIoCtx->Req.Io.uOffset;
2624 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2625 PVDISK pDisk = pIoCtx->pDisk;
2626 unsigned fWrite;
2627 size_t cbThisWrite;
2628 size_t cbPreRead, cbPostRead;
2629
2630 /* Apply write filter chain here if it was not done already. */
2631 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_WRITE_FILTER_APPLIED))
2632 {
2633 rc = vdFilterChainApplyWrite(pDisk, uOffset, cbWrite, pIoCtx);
2634 if (RT_FAILURE(rc))
2635 return rc;
2636 pIoCtx->fFlags |= VDIOCTX_FLAGS_WRITE_FILTER_APPLIED;
2637 }
2638
2639 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_SET_MODIFIED_FLAG))
2640 {
2641 rc = vdSetModifiedFlagAsync(pDisk, pIoCtx);
2642 if (RT_FAILURE(rc)) /* Includes I/O in progress. */
2643 return rc;
2644 }
2645
2646 rc = vdDiscardSetRangeAllocated(pDisk, uOffset, cbWrite);
2647 if (RT_FAILURE(rc))
2648 return rc;
2649
2650 /* Loop until all written. */
2651 do
2652 {
2653 /* Try to write the possibly partial block to the last opened image.
2654 * This works when the block is already allocated in this image or
2655 * if it is a full-block write (and allocation isn't suppressed below).
2656 * For image formats which don't support zero blocks, it's beneficial
2657 * to avoid unnecessarily allocating unchanged blocks. This prevents
2658 * unwanted expanding of images. VMDK is an example. */
2659 cbThisWrite = cbWrite;
2660
2661 /*
2662 * Check whether there is a full block write in progress which was not allocated.
2663 * Defer I/O if the range interferes.
2664 */
2665 if ( pDisk->pIoCtxLockOwner != NIL_VDIOCTX
2666 && uOffset >= pDisk->uOffsetStartLocked
2667 && uOffset < pDisk->uOffsetEndLocked)
2668 {
2669 Log(("Interferring write while allocating a new block => deferring write\n"));
2670 vdIoCtxDefer(pDisk, pIoCtx);
2671 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2672 break;
2673 }
2674
2675 fWrite = (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2676 ? 0 : VD_WRITE_NO_ALLOC;
2677 rc = pImage->Backend->pfnWrite(pImage->pBackendData, uOffset, cbThisWrite,
2678 pIoCtx, &cbThisWrite, &cbPreRead, &cbPostRead,
2679 fWrite);
2680 if (rc == VERR_VD_BLOCK_FREE)
2681 {
2682 /* Lock the disk .*/
2683 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2684 if (RT_SUCCESS(rc))
2685 {
2686 /*
2687 * Allocate segment and buffer in one go.
2688 * A bit hackish but avoids the need to allocate memory twice.
2689 */
2690 PRTSGBUF pTmp = (PRTSGBUF)RTMemAlloc(cbPreRead + cbThisWrite + cbPostRead + sizeof(RTSGSEG) + sizeof(RTSGBUF));
2691 AssertBreakStmt(pTmp, rc = VERR_NO_MEMORY);
2692 PRTSGSEG pSeg = (PRTSGSEG)(pTmp + 1);
2693
2694 pSeg->pvSeg = pSeg + 1;
2695 pSeg->cbSeg = cbPreRead + cbThisWrite + cbPostRead;
2696 RTSgBufInit(pTmp, pSeg, 1);
2697
2698 PVDIOCTX pIoCtxWrite = vdIoCtxChildAlloc(pDisk, VDIOCTXTXDIR_WRITE,
2699 uOffset, pSeg->cbSeg, pImage,
2700 pTmp,
2701 pIoCtx, cbThisWrite,
2702 cbWrite,
2703 pTmp,
2704 (pImage->uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME)
2705 ? vdWriteHelperStandardAsync
2706 : vdWriteHelperOptimizedAsync);
2707 if (!VALID_PTR(pIoCtxWrite))
2708 {
2709 RTMemTmpFree(pTmp);
2710 rc = VERR_NO_MEMORY;
2711 break;
2712 }
2713
2714 LogFlowFunc(("Disk is growing because of pIoCtx=%#p pIoCtxWrite=%#p\n",
2715 pIoCtx, pIoCtxWrite));
2716
2717 /* Save the current range for the growing operation to check for intersecting requests later. */
2718 pDisk->uOffsetStartLocked = uOffset - cbPreRead;
2719 pDisk->uOffsetEndLocked = uOffset + cbThisWrite + cbPostRead;
2720
2721 pIoCtxWrite->Type.Child.cbPreRead = cbPreRead;
2722 pIoCtxWrite->Type.Child.cbPostRead = cbPostRead;
2723 pIoCtxWrite->Req.Io.pImageParentOverride = pIoCtx->Req.Io.pImageParentOverride;
2724
2725 /* Process the write request */
2726 rc = vdIoCtxProcessLocked(pIoCtxWrite);
2727
2728 if (RT_FAILURE(rc) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
2729 {
2730 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs*/ );
2731 vdIoCtxFree(pDisk, pIoCtxWrite);
2732 break;
2733 }
2734 else if ( rc == VINF_VD_ASYNC_IO_FINISHED
2735 && ASMAtomicCmpXchgBool(&pIoCtxWrite->fComplete, true, false))
2736 {
2737 LogFlow(("Child write request completed\n"));
2738 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbThisWrite);
2739 Assert(cbThisWrite == (uint32_t)cbThisWrite);
2740 rc = pIoCtxWrite->rcReq;
2741 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbThisWrite);
2742 vdIoCtxUnlockDisk(pDisk, pIoCtx, false /* fProcessDeferredReqs*/ );
2743 vdIoCtxFree(pDisk, pIoCtxWrite);
2744 }
2745 else
2746 {
2747 LogFlow(("Child write pending\n"));
2748 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
2749 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2750 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2751 cbWrite -= cbThisWrite;
2752 uOffset += cbThisWrite;
2753 break;
2754 }
2755 }
2756 else
2757 {
2758 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2759 break;
2760 }
2761 }
2762
2763 if (rc == VERR_VD_IOCTX_HALT)
2764 {
2765 cbWrite -= cbThisWrite;
2766 uOffset += cbThisWrite;
2767 pIoCtx->fFlags |= VDIOCTX_FLAGS_BLOCKED;
2768 break;
2769 }
2770 else if (rc == VERR_VD_NOT_ENOUGH_METADATA)
2771 break;
2772
2773 cbWrite -= cbThisWrite;
2774 uOffset += cbThisWrite;
2775 } while (cbWrite != 0 && (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS));
2776
2777 if ( rc == VERR_VD_ASYNC_IO_IN_PROGRESS
2778 || rc == VERR_VD_NOT_ENOUGH_METADATA
2779 || rc == VERR_VD_IOCTX_HALT)
2780 {
2781 /*
2782 * Tell the caller that we don't need to go back here because all
2783 * writes are initiated.
2784 */
2785 if ( !cbWrite
2786 && rc != VERR_VD_IOCTX_HALT)
2787 rc = VINF_SUCCESS;
2788
2789 pIoCtx->Req.Io.uOffset = uOffset;
2790 pIoCtx->Req.Io.cbTransfer = cbWrite;
2791 }
2792
2793 return rc;
2794}
2795
2796/**
2797 * Flush helper async version.
2798 */
2799static DECLCALLBACK(int) vdFlushHelperAsync(PVDIOCTX pIoCtx)
2800{
2801 int rc = VINF_SUCCESS;
2802 PVDISK pDisk = pIoCtx->pDisk;
2803 PVDIMAGE pImage = pIoCtx->Req.Io.pImageCur;
2804
2805 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
2806 if (RT_SUCCESS(rc))
2807 {
2808 /* Mark the whole disk as locked. */
2809 pDisk->uOffsetStartLocked = 0;
2810 pDisk->uOffsetEndLocked = UINT64_C(0xffffffffffffffff);
2811
2812 vdResetModifiedFlag(pDisk);
2813 rc = pImage->Backend->pfnFlush(pImage->pBackendData, pIoCtx);
2814 if ( ( RT_SUCCESS(rc)
2815 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS
2816 || rc == VERR_VD_IOCTX_HALT)
2817 && pDisk->pCache)
2818 {
2819 rc = pDisk->pCache->Backend->pfnFlush(pDisk->pCache->pBackendData, pIoCtx);
2820 if ( RT_SUCCESS(rc)
2821 || ( rc != VERR_VD_ASYNC_IO_IN_PROGRESS
2822 && rc != VERR_VD_IOCTX_HALT))
2823 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
2824 else if (rc != VERR_VD_IOCTX_HALT)
2825 rc = VINF_SUCCESS;
2826 }
2827 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2828 rc = VINF_SUCCESS;
2829 else if (rc != VERR_VD_IOCTX_HALT)/* Some other error. */
2830 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessBlockedReqs */);
2831 }
2832
2833 return rc;
2834}
2835
2836/**
2837 * Async discard helper - discards a whole block which is recorded in the block
2838 * tree.
2839 *
2840 * @returns VBox status code.
2841 * @param pIoCtx The I/O context to operate on.
2842 */
2843static DECLCALLBACK(int) vdDiscardWholeBlockAsync(PVDIOCTX pIoCtx)
2844{
2845 int rc = VINF_SUCCESS;
2846 PVDISK pDisk = pIoCtx->pDisk;
2847 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2848 PVDDISCARDBLOCK pBlock = pIoCtx->Req.Discard.pBlock;
2849 size_t cbPreAllocated, cbPostAllocated, cbActuallyDiscarded;
2850
2851 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2852
2853 AssertPtr(pBlock);
2854
2855 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2856 pBlock->Core.Key, pBlock->cbDiscard,
2857 &cbPreAllocated, &cbPostAllocated,
2858 &cbActuallyDiscarded, NULL, 0);
2859 Assert(rc != VERR_VD_DISCARD_ALIGNMENT_NOT_MET);
2860 Assert(!cbPreAllocated);
2861 Assert(!cbPostAllocated);
2862 Assert(cbActuallyDiscarded == pBlock->cbDiscard || RT_FAILURE(rc));
2863
2864 /* Remove the block on success. */
2865 if ( RT_SUCCESS(rc)
2866 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2867 {
2868 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
2869 Assert(pBlockRemove == pBlock); RT_NOREF1(pBlockRemove);
2870
2871 pDiscard->cbDiscarding -= pBlock->cbDiscard;
2872 RTListNodeRemove(&pBlock->NodeLru);
2873 RTMemFree(pBlock->pbmAllocated);
2874 RTMemFree(pBlock);
2875 pIoCtx->Req.Discard.pBlock = NULL;/* Safety precaution. */
2876 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
2877 rc = VINF_SUCCESS;
2878 }
2879
2880 LogFlowFunc(("returns rc=%Rrc\n", rc));
2881 return rc;
2882}
2883
2884/**
2885 * Removes the least recently used blocks from the waiting list until
2886 * the new value is reached - version for async I/O.
2887 *
2888 * @returns VBox status code.
2889 * @param pDisk VD disk container.
2890 * @param pIoCtx The I/O context associated with this discard operation.
2891 * @param cbDiscardingNew How many bytes should be waiting on success.
2892 * The number of bytes waiting can be less.
2893 */
2894static int vdDiscardRemoveBlocksAsync(PVDISK pDisk, PVDIOCTX pIoCtx, size_t cbDiscardingNew)
2895{
2896 int rc = VINF_SUCCESS;
2897 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2898
2899 LogFlowFunc(("pDisk=%#p pDiscard=%#p cbDiscardingNew=%zu\n",
2900 pDisk, pDiscard, cbDiscardingNew));
2901
2902 while (pDiscard->cbDiscarding > cbDiscardingNew)
2903 {
2904 PVDDISCARDBLOCK pBlock = RTListGetLast(&pDiscard->ListLru, VDDISCARDBLOCK, NodeLru);
2905
2906 Assert(!RTListIsEmpty(&pDiscard->ListLru));
2907
2908 /* Go over the allocation bitmap and mark all discarded sectors as unused. */
2909 uint64_t offStart = pBlock->Core.Key;
2910 uint32_t idxStart = 0;
2911 size_t cbLeft = pBlock->cbDiscard;
2912 bool fAllocated = ASMBitTest(pBlock->pbmAllocated, idxStart);
2913 uint32_t cSectors = (uint32_t)(pBlock->cbDiscard / 512);
2914
2915 while (cbLeft > 0)
2916 {
2917 int32_t idxEnd;
2918 size_t cbThis = cbLeft;
2919
2920 if (fAllocated)
2921 {
2922 /* Check for the first unallocated bit. */
2923 idxEnd = ASMBitNextClear(pBlock->pbmAllocated, cSectors, idxStart);
2924 if (idxEnd != -1)
2925 {
2926 cbThis = (idxEnd - idxStart) * 512;
2927 fAllocated = false;
2928 }
2929 }
2930 else
2931 {
2932 /* Mark as unused and check for the first set bit. */
2933 idxEnd = ASMBitNextSet(pBlock->pbmAllocated, cSectors, idxStart);
2934 if (idxEnd != -1)
2935 cbThis = (idxEnd - idxStart) * 512;
2936
2937 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2938 offStart, cbThis, NULL, NULL, &cbThis,
2939 NULL, VD_DISCARD_MARK_UNUSED);
2940 if ( RT_FAILURE(rc)
2941 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2942 break;
2943
2944 fAllocated = true;
2945 }
2946
2947 idxStart = idxEnd;
2948 offStart += cbThis;
2949 cbLeft -= cbThis;
2950 }
2951
2952 if ( RT_FAILURE(rc)
2953 && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2954 break;
2955
2956 PVDDISCARDBLOCK pBlockRemove = (PVDDISCARDBLOCK)RTAvlrU64RangeRemove(pDiscard->pTreeBlocks, pBlock->Core.Key);
2957 Assert(pBlockRemove == pBlock); NOREF(pBlockRemove);
2958 RTListNodeRemove(&pBlock->NodeLru);
2959
2960 pDiscard->cbDiscarding -= pBlock->cbDiscard;
2961 RTMemFree(pBlock->pbmAllocated);
2962 RTMemFree(pBlock);
2963 }
2964
2965 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
2966 rc = VINF_SUCCESS;
2967
2968 Assert(RT_FAILURE(rc) || pDiscard->cbDiscarding <= cbDiscardingNew);
2969
2970 LogFlowFunc(("returns rc=%Rrc\n", rc));
2971 return rc;
2972}
2973
2974/**
2975 * Async discard helper - discards the current range if there is no matching
2976 * block in the tree.
2977 *
2978 * @returns VBox status code.
2979 * @param pIoCtx The I/O context to operate on.
2980 */
2981static DECLCALLBACK(int) vdDiscardCurrentRangeAsync(PVDIOCTX pIoCtx)
2982{
2983 PVDISK pDisk = pIoCtx->pDisk;
2984 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
2985 uint64_t offStart = pIoCtx->Req.Discard.offCur;
2986 size_t cbThisDiscard = pIoCtx->Req.Discard.cbThisDiscard;
2987 void *pbmAllocated = NULL;
2988 size_t cbPreAllocated, cbPostAllocated;
2989 int rc = VINF_SUCCESS;
2990
2991 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
2992
2993 /* No block found, try to discard using the backend first. */
2994 rc = pDisk->pLast->Backend->pfnDiscard(pDisk->pLast->pBackendData, pIoCtx,
2995 offStart, cbThisDiscard, &cbPreAllocated,
2996 &cbPostAllocated, &cbThisDiscard,
2997 &pbmAllocated, 0);
2998 if (rc == VERR_VD_DISCARD_ALIGNMENT_NOT_MET)
2999 {
3000 /* Create new discard block. */
3001 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTMemAllocZ(sizeof(VDDISCARDBLOCK));
3002 if (pBlock)
3003 {
3004 pBlock->Core.Key = offStart - cbPreAllocated;
3005 pBlock->Core.KeyLast = offStart + cbThisDiscard + cbPostAllocated - 1;
3006 pBlock->cbDiscard = cbPreAllocated + cbThisDiscard + cbPostAllocated;
3007 pBlock->pbmAllocated = pbmAllocated;
3008 bool fInserted = RTAvlrU64Insert(pDiscard->pTreeBlocks, &pBlock->Core);
3009 Assert(fInserted); NOREF(fInserted);
3010
3011 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3012 pDiscard->cbDiscarding += pBlock->cbDiscard;
3013
3014 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3015 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3016 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3017 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3018
3019 if (pDiscard->cbDiscarding > VD_DISCARD_REMOVE_THRESHOLD)
3020 rc = vdDiscardRemoveBlocksAsync(pDisk, pIoCtx, VD_DISCARD_REMOVE_THRESHOLD);
3021 else
3022 rc = VINF_SUCCESS;
3023
3024 if (RT_SUCCESS(rc))
3025 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync; /* Next part. */
3026 }
3027 else
3028 {
3029 RTMemFree(pbmAllocated);
3030 rc = VERR_NO_MEMORY;
3031 }
3032 }
3033 else if ( RT_SUCCESS(rc)
3034 || rc == VERR_VD_ASYNC_IO_IN_PROGRESS) /* Save state and andvance to next range. */
3035 {
3036 Assert(pIoCtx->Req.Discard.cbDiscardLeft >= cbThisDiscard);
3037 pIoCtx->Req.Discard.cbDiscardLeft -= cbThisDiscard;
3038 pIoCtx->Req.Discard.offCur += cbThisDiscard;
3039 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3040 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3041 rc = VINF_SUCCESS;
3042 }
3043
3044 LogFlowFunc(("returns rc=%Rrc\n", rc));
3045 return rc;
3046}
3047
3048/**
3049 * Async discard helper - entry point.
3050 *
3051 * @returns VBox status code.
3052 * @param pIoCtx The I/O context to operate on.
3053 */
3054static DECLCALLBACK(int) vdDiscardHelperAsync(PVDIOCTX pIoCtx)
3055{
3056 int rc = VINF_SUCCESS;
3057 PVDISK pDisk = pIoCtx->pDisk;
3058 PCRTRANGE paRanges = pIoCtx->Req.Discard.paRanges;
3059 unsigned cRanges = pIoCtx->Req.Discard.cRanges;
3060 PVDDISCARDSTATE pDiscard = pDisk->pDiscard;
3061
3062 LogFlowFunc(("pIoCtx=%#p\n", pIoCtx));
3063
3064 /* Check if the I/O context processed all ranges. */
3065 if ( pIoCtx->Req.Discard.idxRange == cRanges
3066 && !pIoCtx->Req.Discard.cbDiscardLeft)
3067 {
3068 LogFlowFunc(("All ranges discarded, completing\n"));
3069 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDeferredReqs*/);
3070 return VINF_SUCCESS;
3071 }
3072
3073 if (pDisk->pIoCtxLockOwner != pIoCtx)
3074 rc = vdIoCtxLockDisk(pDisk, pIoCtx);
3075
3076 if (RT_SUCCESS(rc))
3077 {
3078 uint64_t offStart = pIoCtx->Req.Discard.offCur;
3079 size_t cbDiscardLeft = pIoCtx->Req.Discard.cbDiscardLeft;
3080 size_t cbThisDiscard;
3081
3082 pDisk->uOffsetStartLocked = offStart;
3083 pDisk->uOffsetEndLocked = offStart + cbDiscardLeft;
3084
3085 if (RT_UNLIKELY(!pDiscard))
3086 {
3087 pDiscard = vdDiscardStateCreate();
3088 if (!pDiscard)
3089 return VERR_NO_MEMORY;
3090
3091 pDisk->pDiscard = pDiscard;
3092 }
3093
3094 if (!pIoCtx->Req.Discard.cbDiscardLeft)
3095 {
3096 offStart = paRanges[pIoCtx->Req.Discard.idxRange].offStart;
3097 cbDiscardLeft = paRanges[pIoCtx->Req.Discard.idxRange].cbRange;
3098 LogFlowFunc(("New range descriptor loaded (%u) offStart=%llu cbDiscard=%zu\n",
3099 pIoCtx->Req.Discard.idxRange, offStart, cbDiscardLeft));
3100 pIoCtx->Req.Discard.idxRange++;
3101 }
3102
3103 /* Look for a matching block in the AVL tree first. */
3104 PVDDISCARDBLOCK pBlock = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, false);
3105 if (!pBlock || pBlock->Core.KeyLast < offStart)
3106 {
3107 PVDDISCARDBLOCK pBlockAbove = (PVDDISCARDBLOCK)RTAvlrU64GetBestFit(pDiscard->pTreeBlocks, offStart, true);
3108
3109 /* Clip range to remain in the current block. */
3110 if (pBlockAbove)
3111 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlockAbove->Core.KeyLast - offStart + 1);
3112 else
3113 cbThisDiscard = cbDiscardLeft;
3114
3115 Assert(!(cbThisDiscard % 512));
3116 pIoCtx->Req.Discard.pBlock = NULL;
3117 pIoCtx->pfnIoCtxTransferNext = vdDiscardCurrentRangeAsync;
3118 }
3119 else
3120 {
3121 /* Range lies partly in the block, update allocation bitmap. */
3122 int32_t idxStart, idxEnd;
3123
3124 cbThisDiscard = RT_MIN(cbDiscardLeft, pBlock->Core.KeyLast - offStart + 1);
3125
3126 AssertPtr(pBlock);
3127
3128 Assert(!(cbThisDiscard % 512));
3129 Assert(!((offStart - pBlock->Core.Key) % 512));
3130
3131 idxStart = (offStart - pBlock->Core.Key) / 512;
3132 idxEnd = idxStart + (int32_t)(cbThisDiscard / 512);
3133
3134 ASMBitClearRange(pBlock->pbmAllocated, idxStart, idxEnd);
3135
3136 cbDiscardLeft -= cbThisDiscard;
3137 offStart += cbThisDiscard;
3138
3139 /* Call the backend to discard the block if it is completely unallocated now. */
3140 if (ASMBitFirstSet((volatile void *)pBlock->pbmAllocated, (uint32_t)(pBlock->cbDiscard / 512)) == -1)
3141 {
3142 pIoCtx->Req.Discard.pBlock = pBlock;
3143 pIoCtx->pfnIoCtxTransferNext = vdDiscardWholeBlockAsync;
3144 rc = VINF_SUCCESS;
3145 }
3146 else
3147 {
3148 RTListNodeRemove(&pBlock->NodeLru);
3149 RTListPrepend(&pDiscard->ListLru, &pBlock->NodeLru);
3150
3151 /* Start with next range. */
3152 pIoCtx->pfnIoCtxTransferNext = vdDiscardHelperAsync;
3153 rc = VINF_SUCCESS;
3154 }
3155 }
3156
3157 /* Save state in the context. */
3158 pIoCtx->Req.Discard.offCur = offStart;
3159 pIoCtx->Req.Discard.cbDiscardLeft = cbDiscardLeft;
3160 pIoCtx->Req.Discard.cbThisDiscard = cbThisDiscard;
3161 }
3162
3163 LogFlowFunc(("returns rc=%Rrc\n", rc));
3164 return rc;
3165}
3166
3167/**
3168 * VD async I/O interface open callback.
3169 */
3170static DECLCALLBACK(int) vdIOOpenFallback(void *pvUser, const char *pszLocation,
3171 uint32_t fOpen, PFNVDCOMPLETED pfnCompleted,
3172 void **ppStorage)
3173{
3174 RT_NOREF1(pvUser);
3175 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)RTMemAllocZ(sizeof(VDIIOFALLBACKSTORAGE));
3176
3177 if (!pStorage)
3178 return VERR_NO_MEMORY;
3179
3180 pStorage->pfnCompleted = pfnCompleted;
3181
3182 /* Open the file. */
3183 int rc = RTFileOpen(&pStorage->File, pszLocation, fOpen);
3184 if (RT_SUCCESS(rc))
3185 {
3186 *ppStorage = pStorage;
3187 return VINF_SUCCESS;
3188 }
3189
3190 RTMemFree(pStorage);
3191 return rc;
3192}
3193
3194/**
3195 * VD async I/O interface close callback.
3196 */
3197static DECLCALLBACK(int) vdIOCloseFallback(void *pvUser, void *pvStorage)
3198{
3199 RT_NOREF1(pvUser);
3200 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3201
3202 RTFileClose(pStorage->File);
3203 RTMemFree(pStorage);
3204 return VINF_SUCCESS;
3205}
3206
3207static DECLCALLBACK(int) vdIODeleteFallback(void *pvUser, const char *pcszFilename)
3208{
3209 RT_NOREF1(pvUser);
3210 return RTFileDelete(pcszFilename);
3211}
3212
3213static DECLCALLBACK(int) vdIOMoveFallback(void *pvUser, const char *pcszSrc, const char *pcszDst, unsigned fMove)
3214{
3215 RT_NOREF1(pvUser);
3216 return RTFileMove(pcszSrc, pcszDst, fMove);
3217}
3218
3219static DECLCALLBACK(int) vdIOGetFreeSpaceFallback(void *pvUser, const char *pcszFilename, int64_t *pcbFreeSpace)
3220{
3221 RT_NOREF1(pvUser);
3222 return RTFsQuerySizes(pcszFilename, NULL, pcbFreeSpace, NULL, NULL);
3223}
3224
3225static DECLCALLBACK(int) vdIOGetModificationTimeFallback(void *pvUser, const char *pcszFilename, PRTTIMESPEC pModificationTime)
3226{
3227 RT_NOREF1(pvUser);
3228 RTFSOBJINFO info;
3229 int rc = RTPathQueryInfo(pcszFilename, &info, RTFSOBJATTRADD_NOTHING);
3230 if (RT_SUCCESS(rc))
3231 *pModificationTime = info.ModificationTime;
3232 return rc;
3233}
3234
3235/**
3236 * VD async I/O interface callback for retrieving the file size.
3237 */
3238static DECLCALLBACK(int) vdIOGetSizeFallback(void *pvUser, void *pvStorage, uint64_t *pcbSize)
3239{
3240 RT_NOREF1(pvUser);
3241 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3242
3243 return RTFileGetSize(pStorage->File, pcbSize);
3244}
3245
3246/**
3247 * VD async I/O interface callback for setting the file size.
3248 */
3249static DECLCALLBACK(int) vdIOSetSizeFallback(void *pvUser, void *pvStorage, uint64_t cbSize)
3250{
3251 RT_NOREF1(pvUser);
3252 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3253
3254 return RTFileSetSize(pStorage->File, cbSize);
3255}
3256
3257/**
3258 * VD async I/O interface callback for setting the file allocation size.
3259 */
3260static DECLCALLBACK(int) vdIOSetAllocationSizeFallback(void *pvUser, void *pvStorage, uint64_t cbSize,
3261 uint32_t fFlags)
3262{
3263 RT_NOREF2(pvUser, fFlags);
3264 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3265
3266 return RTFileSetAllocationSize(pStorage->File, cbSize, RTFILE_ALLOC_SIZE_F_DEFAULT);
3267}
3268
3269/**
3270 * VD async I/O interface callback for a synchronous write to the file.
3271 */
3272static DECLCALLBACK(int) vdIOWriteSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3273 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
3274{
3275 RT_NOREF1(pvUser);
3276 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3277
3278 return RTFileWriteAt(pStorage->File, uOffset, pvBuf, cbWrite, pcbWritten);
3279}
3280
3281/**
3282 * VD async I/O interface callback for a synchronous read from the file.
3283 */
3284static DECLCALLBACK(int) vdIOReadSyncFallback(void *pvUser, void *pvStorage, uint64_t uOffset,
3285 void *pvBuf, size_t cbRead, size_t *pcbRead)
3286{
3287 RT_NOREF1(pvUser);
3288 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3289
3290 return RTFileReadAt(pStorage->File, uOffset, pvBuf, cbRead, pcbRead);
3291}
3292
3293/**
3294 * VD async I/O interface callback for a synchronous flush of the file data.
3295 */
3296static DECLCALLBACK(int) vdIOFlushSyncFallback(void *pvUser, void *pvStorage)
3297{
3298 RT_NOREF1(pvUser);
3299 PVDIIOFALLBACKSTORAGE pStorage = (PVDIIOFALLBACKSTORAGE)pvStorage;
3300
3301 return RTFileFlush(pStorage->File);
3302}
3303
3304/**
3305 * VD async I/O interface callback for a asynchronous read from the file.
3306 */
3307static DECLCALLBACK(int) vdIOReadAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3308 PCRTSGSEG paSegments, size_t cSegments,
3309 size_t cbRead, void *pvCompletion,
3310 void **ppTask)
3311{
3312 RT_NOREF8(pvUser, pStorage, uOffset, paSegments, cSegments, cbRead, pvCompletion, ppTask);
3313 return VERR_NOT_IMPLEMENTED;
3314}
3315
3316/**
3317 * VD async I/O interface callback for a asynchronous write to the file.
3318 */
3319static DECLCALLBACK(int) vdIOWriteAsyncFallback(void *pvUser, void *pStorage, uint64_t uOffset,
3320 PCRTSGSEG paSegments, size_t cSegments,
3321 size_t cbWrite, void *pvCompletion,
3322 void **ppTask)
3323{
3324 RT_NOREF8(pvUser, pStorage, uOffset, paSegments, cSegments, cbWrite, pvCompletion, ppTask);
3325 return VERR_NOT_IMPLEMENTED;
3326}
3327
3328/**
3329 * VD async I/O interface callback for a asynchronous flush of the file data.
3330 */
3331static DECLCALLBACK(int) vdIOFlushAsyncFallback(void *pvUser, void *pStorage,
3332 void *pvCompletion, void **ppTask)
3333{
3334 RT_NOREF4(pvUser, pStorage, pvCompletion, ppTask);
3335 return VERR_NOT_IMPLEMENTED;
3336}
3337
3338/**
3339 * Internal - Continues an I/O context after
3340 * it was halted because of an active transfer.
3341 */
3342static int vdIoCtxContinue(PVDIOCTX pIoCtx, int rcReq)
3343{
3344 PVDISK pDisk = pIoCtx->pDisk;
3345 int rc = VINF_SUCCESS;
3346
3347 VD_IS_LOCKED(pDisk);
3348
3349 if (RT_FAILURE(rcReq))
3350 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
3351
3352 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_BLOCKED))
3353 {
3354 /* Continue the transfer */
3355 rc = vdIoCtxProcessLocked(pIoCtx);
3356
3357 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3358 && ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
3359 {
3360 LogFlowFunc(("I/O context completed pIoCtx=%#p\n", pIoCtx));
3361 bool fFreeCtx = RT_BOOL(!(pIoCtx->fFlags & VDIOCTX_FLAGS_DONT_FREE));
3362 if (pIoCtx->pIoCtxParent)
3363 {
3364 PVDIOCTX pIoCtxParent = pIoCtx->pIoCtxParent;
3365
3366 Assert(!pIoCtxParent->pIoCtxParent);
3367 if (RT_FAILURE(pIoCtx->rcReq))
3368 ASMAtomicCmpXchgS32(&pIoCtxParent->rcReq, pIoCtx->rcReq, VINF_SUCCESS);
3369
3370 ASMAtomicDecU32(&pIoCtxParent->cDataTransfersPending);
3371
3372 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE)
3373 {
3374 LogFlowFunc(("I/O context transferred %u bytes for the parent pIoCtxParent=%p\n",
3375 pIoCtx->Type.Child.cbTransferParent, pIoCtxParent));
3376
3377 /* Update the parent state. */
3378 Assert(pIoCtxParent->Req.Io.cbTransferLeft >= pIoCtx->Type.Child.cbTransferParent);
3379 ASMAtomicSubU32(&pIoCtxParent->Req.Io.cbTransferLeft, (uint32_t)pIoCtx->Type.Child.cbTransferParent);
3380 }
3381 else
3382 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH);
3383
3384 /*
3385 * A completed child write means that we finished growing the image.
3386 * We have to process any pending writes now.
3387 */
3388 vdIoCtxUnlockDisk(pDisk, pIoCtxParent, false /* fProcessDeferredReqs */);
3389
3390 /* Unblock the parent */
3391 pIoCtxParent->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3392
3393 rc = vdIoCtxProcessLocked(pIoCtxParent);
3394
3395 if ( rc == VINF_VD_ASYNC_IO_FINISHED
3396 && ASMAtomicCmpXchgBool(&pIoCtxParent->fComplete, true, false))
3397 {
3398 LogFlowFunc(("Parent I/O context completed pIoCtxParent=%#p rcReq=%Rrc\n", pIoCtxParent, pIoCtxParent->rcReq));
3399 bool fFreeParentCtx = RT_BOOL(!(pIoCtxParent->fFlags & VDIOCTX_FLAGS_DONT_FREE));
3400 vdIoCtxRootComplete(pDisk, pIoCtxParent);
3401 vdThreadFinishWrite(pDisk);
3402
3403 if (fFreeParentCtx)
3404 vdIoCtxFree(pDisk, pIoCtxParent);
3405 vdDiskProcessBlockedIoCtx(pDisk);
3406 }
3407 else if (!vdIoCtxIsDiskLockOwner(pDisk, pIoCtx))
3408 {
3409 /* Process any pending writes if the current request didn't caused another growing. */
3410 vdDiskProcessBlockedIoCtx(pDisk);
3411 }
3412 }
3413 else
3414 {
3415 if (pIoCtx->enmTxDir == VDIOCTXTXDIR_FLUSH)
3416 {
3417 vdIoCtxUnlockDisk(pDisk, pIoCtx, true /* fProcessDerredReqs */);
3418 vdThreadFinishWrite(pDisk);
3419 }
3420 else if ( pIoCtx->enmTxDir == VDIOCTXTXDIR_WRITE
3421 || pIoCtx->enmTxDir == VDIOCTXTXDIR_DISCARD)
3422 vdThreadFinishWrite(pDisk);
3423 else
3424 {
3425 Assert(pIoCtx->enmTxDir == VDIOCTXTXDIR_READ);
3426 vdThreadFinishRead(pDisk);
3427 }
3428
3429 LogFlowFunc(("I/O context completed pIoCtx=%#p rcReq=%Rrc\n", pIoCtx, pIoCtx->rcReq));
3430 vdIoCtxRootComplete(pDisk, pIoCtx);
3431 }
3432
3433 if (fFreeCtx)
3434 vdIoCtxFree(pDisk, pIoCtx);
3435 }
3436 }
3437
3438 return VINF_SUCCESS;
3439}
3440
3441/**
3442 * Internal - Called when user transfer completed.
3443 */
3444static int vdUserXferCompleted(PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
3445 PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3446 size_t cbTransfer, int rcReq)
3447{
3448 int rc = VINF_SUCCESS;
3449 PVDISK pDisk = pIoCtx->pDisk;
3450
3451 LogFlowFunc(("pIoStorage=%#p pIoCtx=%#p pfnComplete=%#p pvUser=%#p cbTransfer=%zu rcReq=%Rrc\n",
3452 pIoStorage, pIoCtx, pfnComplete, pvUser, cbTransfer, rcReq));
3453
3454 VD_IS_LOCKED(pDisk);
3455
3456 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbTransfer);
3457 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTransfer); Assert(cbTransfer == (uint32_t)cbTransfer);
3458 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
3459
3460 if (pfnComplete)
3461 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3462
3463 if (RT_SUCCESS(rc))
3464 rc = vdIoCtxContinue(pIoCtx, rcReq);
3465 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3466 rc = VINF_SUCCESS;
3467
3468 return rc;
3469}
3470
3471static void vdIoCtxContinueDeferredList(PVDIOSTORAGE pIoStorage, PRTLISTANCHOR pListWaiting,
3472 PFNVDXFERCOMPLETED pfnComplete, void *pvUser, int rcReq)
3473{
3474 LogFlowFunc(("pIoStorage=%#p pListWaiting=%#p pfnComplete=%#p pvUser=%#p rcReq=%Rrc\n",
3475 pIoStorage, pListWaiting, pfnComplete, pvUser, rcReq));
3476
3477 /* Go through the waiting list and continue the I/O contexts. */
3478 while (!RTListIsEmpty(pListWaiting))
3479 {
3480 int rc = VINF_SUCCESS;
3481 PVDIOCTXDEFERRED pDeferred = RTListGetFirst(pListWaiting, VDIOCTXDEFERRED, NodeDeferred);
3482 PVDIOCTX pIoCtx = pDeferred->pIoCtx;
3483 RTListNodeRemove(&pDeferred->NodeDeferred);
3484
3485 RTMemFree(pDeferred);
3486 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
3487
3488 if (pfnComplete)
3489 rc = pfnComplete(pIoStorage->pVDIo->pBackendData, pIoCtx, pvUser, rcReq);
3490
3491 LogFlow(("Completion callback for I/O context %#p returned %Rrc\n", pIoCtx, rc));
3492
3493 if (RT_SUCCESS(rc))
3494 {
3495 rc = vdIoCtxContinue(pIoCtx, rcReq);
3496 AssertRC(rc);
3497 }
3498 else
3499 Assert(rc == VERR_VD_ASYNC_IO_IN_PROGRESS);
3500 }
3501}
3502
3503/**
3504 * Internal - Called when a meta transfer completed.
3505 */
3506static int vdMetaXferCompleted(PVDIOSTORAGE pIoStorage, PFNVDXFERCOMPLETED pfnComplete, void *pvUser,
3507 PVDMETAXFER pMetaXfer, int rcReq)
3508{
3509 PVDISK pDisk = pIoStorage->pVDIo->pDisk;
3510 RTLISTNODE ListIoCtxWaiting;
3511 bool fFlush;
3512
3513 LogFlowFunc(("pIoStorage=%#p pfnComplete=%#p pvUser=%#p pMetaXfer=%#p rcReq=%Rrc\n",
3514 pIoStorage, pfnComplete, pvUser, pMetaXfer, rcReq));
3515
3516 VD_IS_LOCKED(pDisk);
3517
3518 fFlush = VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_FLUSH;
3519
3520 if (!fFlush)
3521 {
3522 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3523
3524 if (RT_FAILURE(rcReq))
3525 {
3526 /* Remove from the AVL tree. */
3527 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3528 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3529 Assert(fRemoved); NOREF(fRemoved);
3530 /* If this was a write check if there is a shadow buffer with updated data. */
3531 if (pMetaXfer->pbDataShw)
3532 {
3533 Assert(VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
3534 Assert(!RTListIsEmpty(&pMetaXfer->ListIoCtxShwWrites));
3535 RTListConcatenate(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxShwWrites);
3536 RTMemFree(pMetaXfer->pbDataShw);
3537 pMetaXfer->pbDataShw = NULL;
3538 }
3539 RTMemFree(pMetaXfer);
3540 }
3541 else
3542 {
3543 /* Increase the reference counter to make sure it doesn't go away before the last context is processed. */
3544 pMetaXfer->cRefs++;
3545 }
3546 }
3547 else
3548 RTListMove(&ListIoCtxWaiting, &pMetaXfer->ListIoCtxWaiting);
3549
3550 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
3551 vdIoCtxContinueDeferredList(pIoStorage, &ListIoCtxWaiting, pfnComplete, pvUser, rcReq);
3552
3553 /*
3554 * If there is a shadow buffer and the previous write was successful update with the
3555 * new data and trigger a new write.
3556 */
3557 if ( pMetaXfer->pbDataShw
3558 && RT_SUCCESS(rcReq)
3559 && VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
3560 {
3561 LogFlowFunc(("pMetaXfer=%#p Updating from shadow buffer and triggering new write\n", pMetaXfer));
3562 memcpy(pMetaXfer->abData, pMetaXfer->pbDataShw, pMetaXfer->cbMeta);
3563 RTMemFree(pMetaXfer->pbDataShw);
3564 pMetaXfer->pbDataShw = NULL;
3565 Assert(!RTListIsEmpty(&pMetaXfer->ListIoCtxShwWrites));
3566
3567 /* Setup a new I/O write. */
3568 PVDIOTASK pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvUser, pMetaXfer);
3569 if (RT_LIKELY(pIoTask))
3570 {
3571 void *pvTask = NULL;
3572 RTSGSEG Seg;
3573
3574 Seg.cbSeg = pMetaXfer->cbMeta;
3575 Seg.pvSeg = pMetaXfer->abData;
3576
3577 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_WRITE);
3578 rcReq = pIoStorage->pVDIo->pInterfaceIo->pfnWriteAsync(pIoStorage->pVDIo->pInterfaceIo->Core.pvUser,
3579 pIoStorage->pStorage,
3580 pMetaXfer->Core.Key, &Seg, 1,
3581 pMetaXfer->cbMeta, pIoTask,
3582 &pvTask);
3583 if ( RT_SUCCESS(rcReq)
3584 || rcReq != VERR_VD_ASYNC_IO_IN_PROGRESS)
3585 {
3586 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
3587 vdIoTaskFree(pDisk, pIoTask);
3588 }
3589 else
3590 RTListMove(&pMetaXfer->ListIoCtxWaiting, &pMetaXfer->ListIoCtxShwWrites);
3591 }
3592 else
3593 rcReq = VERR_NO_MEMORY;
3594
3595 /* Cleanup if there was an error or the request completed already. */
3596 if (rcReq != VERR_VD_ASYNC_IO_IN_PROGRESS)
3597 vdIoCtxContinueDeferredList(pIoStorage, &pMetaXfer->ListIoCtxShwWrites, pfnComplete, pvUser, rcReq);
3598 }
3599
3600 /* Remove if not used anymore. */
3601 if (!fFlush)
3602 {
3603 pMetaXfer->cRefs--;
3604 if (!pMetaXfer->cRefs && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting))
3605 {
3606 /* Remove from the AVL tree. */
3607 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
3608 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
3609 Assert(fRemoved); NOREF(fRemoved);
3610 RTMemFree(pMetaXfer);
3611 }
3612 }
3613 else if (fFlush)
3614 RTMemFree(pMetaXfer);
3615
3616 return VINF_SUCCESS;
3617}
3618
3619/**
3620 * Processes a list of waiting I/O tasks. The disk lock must be held by caller.
3621 *
3622 * @returns nothing.
3623 * @param pDisk The disk to process the list for.
3624 */
3625static void vdIoTaskProcessWaitingList(PVDISK pDisk)
3626{
3627 LogFlowFunc(("pDisk=%#p\n", pDisk));
3628
3629 VD_IS_LOCKED(pDisk);
3630
3631 PVDIOTASK pHead = ASMAtomicXchgPtrT(&pDisk->pIoTasksPendingHead, NULL, PVDIOTASK);
3632
3633 Log(("I/O task list cleared\n"));
3634
3635 /* Reverse order. */
3636 PVDIOTASK pCur = pHead;
3637 pHead = NULL;
3638 while (pCur)
3639 {
3640 PVDIOTASK pInsert = pCur;
3641 pCur = pCur->pNext;
3642 pInsert->pNext = pHead;
3643 pHead = pInsert;
3644 }
3645
3646 while (pHead)
3647 {
3648 PVDIOSTORAGE pIoStorage = pHead->pIoStorage;
3649
3650 if (!pHead->fMeta)
3651 vdUserXferCompleted(pIoStorage, pHead->Type.User.pIoCtx,
3652 pHead->pfnComplete, pHead->pvUser,
3653 pHead->Type.User.cbTransfer, pHead->rcReq);
3654 else
3655 vdMetaXferCompleted(pIoStorage, pHead->pfnComplete, pHead->pvUser,
3656 pHead->Type.Meta.pMetaXfer, pHead->rcReq);
3657
3658 pCur = pHead;
3659 pHead = pHead->pNext;
3660 vdIoTaskFree(pDisk, pCur);
3661 }
3662}
3663
3664/**
3665 * Process any I/O context on the halted list.
3666 *
3667 * @returns nothing.
3668 * @param pDisk The disk.
3669 */
3670static void vdIoCtxProcessHaltedList(PVDISK pDisk)
3671{
3672 LogFlowFunc(("pDisk=%#p\n", pDisk));
3673
3674 VD_IS_LOCKED(pDisk);
3675
3676 /* Get the waiting list and process it in FIFO order. */
3677 PVDIOCTX pIoCtxHead = ASMAtomicXchgPtrT(&pDisk->pIoCtxHaltedHead, NULL, PVDIOCTX);
3678
3679 /* Reverse it. */
3680 PVDIOCTX pCur = pIoCtxHead;
3681 pIoCtxHead = NULL;
3682 while (pCur)
3683 {
3684 PVDIOCTX pInsert = pCur;
3685 pCur = pCur->pIoCtxNext;
3686 pInsert->pIoCtxNext = pIoCtxHead;
3687 pIoCtxHead = pInsert;
3688 }
3689
3690 /* Process now. */
3691 pCur = pIoCtxHead;
3692 while (pCur)
3693 {
3694 PVDIOCTX pTmp = pCur;
3695
3696 pCur = pCur->pIoCtxNext;
3697 pTmp->pIoCtxNext = NULL;
3698
3699 /* Continue */
3700 pTmp->fFlags &= ~VDIOCTX_FLAGS_BLOCKED;
3701 vdIoCtxContinue(pTmp, pTmp->rcReq);
3702 }
3703}
3704
3705/**
3706 * Unlock the disk and process pending tasks.
3707 *
3708 * @returns VBox status code.
3709 * @param pDisk The disk to unlock.
3710 * @param pIoCtxRc The I/O context to get the status code from, optional.
3711 */
3712static int vdDiskUnlock(PVDISK pDisk, PVDIOCTX pIoCtxRc)
3713{
3714 int rc = VINF_SUCCESS;
3715
3716 VD_IS_LOCKED(pDisk);
3717
3718 /*
3719 * Process the list of waiting I/O tasks first
3720 * because they might complete I/O contexts.
3721 * Same for the list of halted I/O contexts.
3722 * Afterwards comes the list of new I/O contexts.
3723 */
3724 vdIoTaskProcessWaitingList(pDisk);
3725 vdIoCtxProcessHaltedList(pDisk);
3726 rc = vdDiskProcessWaitingIoCtx(pDisk, pIoCtxRc);
3727 ASMAtomicXchgBool(&pDisk->fLocked, false);
3728
3729 /*
3730 * Need to check for new I/O tasks and waiting I/O contexts now
3731 * again as other threads might added them while we processed
3732 * previous lists.
3733 */
3734 while ( ASMAtomicUoReadPtrT(&pDisk->pIoCtxHead, PVDIOCTX) != NULL
3735 || ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK) != NULL
3736 || ASMAtomicUoReadPtrT(&pDisk->pIoCtxHaltedHead, PVDIOCTX) != NULL)
3737 {
3738 /* Try lock disk again. */
3739 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
3740 {
3741 vdIoTaskProcessWaitingList(pDisk);
3742 vdIoCtxProcessHaltedList(pDisk);
3743 vdDiskProcessWaitingIoCtx(pDisk, NULL);
3744 ASMAtomicXchgBool(&pDisk->fLocked, false);
3745 }
3746 else /* Let the other thread everything when he unlocks the disk. */
3747 break;
3748 }
3749
3750 return rc;
3751}
3752
3753/**
3754 * Try to lock the disk to complete pressing of the I/O task.
3755 * The completion is deferred if the disk is locked already.
3756 *
3757 * @returns nothing.
3758 * @param pIoTask The I/O task to complete.
3759 */
3760static void vdXferTryLockDiskDeferIoTask(PVDIOTASK pIoTask)
3761{
3762 PVDIOSTORAGE pIoStorage = pIoTask->pIoStorage;
3763 PVDISK pDisk = pIoStorage->pVDIo->pDisk;
3764
3765 Log(("Deferring I/O task pIoTask=%p\n", pIoTask));
3766
3767 /* Put it on the waiting list. */
3768 PVDIOTASK pNext = ASMAtomicUoReadPtrT(&pDisk->pIoTasksPendingHead, PVDIOTASK);
3769 PVDIOTASK pHeadOld;
3770 pIoTask->pNext = pNext;
3771 while (!ASMAtomicCmpXchgExPtr(&pDisk->pIoTasksPendingHead, pIoTask, pNext, &pHeadOld))
3772 {
3773 pNext = pHeadOld;
3774 Assert(pNext != pIoTask);
3775 pIoTask->pNext = pNext;
3776 ASMNopPause();
3777 }
3778
3779 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
3780 {
3781 /* Release disk lock, it will take care of processing all lists. */
3782 vdDiskUnlock(pDisk, NULL);
3783 }
3784}
3785
3786static DECLCALLBACK(int) vdIOIntReqCompleted(void *pvUser, int rcReq)
3787{
3788 PVDIOTASK pIoTask = (PVDIOTASK)pvUser;
3789
3790 LogFlowFunc(("Task completed pIoTask=%#p\n", pIoTask));
3791
3792 pIoTask->rcReq = rcReq;
3793 vdXferTryLockDiskDeferIoTask(pIoTask);
3794 return VINF_SUCCESS;
3795}
3796
3797/**
3798 * VD I/O interface callback for opening a file.
3799 */
3800static DECLCALLBACK(int) vdIOIntOpen(void *pvUser, const char *pszLocation,
3801 unsigned uOpenFlags, PPVDIOSTORAGE ppIoStorage)
3802{
3803 int rc = VINF_SUCCESS;
3804 PVDIO pVDIo = (PVDIO)pvUser;
3805 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
3806
3807 if (!pIoStorage)
3808 return VERR_NO_MEMORY;
3809
3810 /* Create the AVl tree. */
3811 pIoStorage->pTreeMetaXfers = (PAVLRFOFFTREE)RTMemAllocZ(sizeof(AVLRFOFFTREE));
3812 if (pIoStorage->pTreeMetaXfers)
3813 {
3814 rc = pVDIo->pInterfaceIo->pfnOpen(pVDIo->pInterfaceIo->Core.pvUser,
3815 pszLocation, uOpenFlags,
3816 vdIOIntReqCompleted,
3817 &pIoStorage->pStorage);
3818 if (RT_SUCCESS(rc))
3819 {
3820 pIoStorage->pVDIo = pVDIo;
3821 *ppIoStorage = pIoStorage;
3822 return VINF_SUCCESS;
3823 }
3824
3825 RTMemFree(pIoStorage->pTreeMetaXfers);
3826 }
3827 else
3828 rc = VERR_NO_MEMORY;
3829
3830 RTMemFree(pIoStorage);
3831 return rc;
3832}
3833
3834static DECLCALLBACK(int) vdIOIntTreeMetaXferDestroy(PAVLRFOFFNODECORE pNode, void *pvUser)
3835{
3836 RT_NOREF2(pNode, pvUser);
3837 AssertMsgFailed(("Tree should be empty at this point!\n"));
3838 return VINF_SUCCESS;
3839}
3840
3841static DECLCALLBACK(int) vdIOIntClose(void *pvUser, PVDIOSTORAGE pIoStorage)
3842{
3843 int rc = VINF_SUCCESS;
3844 PVDIO pVDIo = (PVDIO)pvUser;
3845
3846 /* We free everything here, even if closing the file failed for some reason. */
3847 rc = pVDIo->pInterfaceIo->pfnClose(pVDIo->pInterfaceIo->Core.pvUser, pIoStorage->pStorage);
3848 RTAvlrFileOffsetDestroy(pIoStorage->pTreeMetaXfers, vdIOIntTreeMetaXferDestroy, NULL);
3849 RTMemFree(pIoStorage->pTreeMetaXfers);
3850 RTMemFree(pIoStorage);
3851 return rc;
3852}
3853
3854static DECLCALLBACK(int) vdIOIntDelete(void *pvUser, const char *pcszFilename)
3855{
3856 PVDIO pVDIo = (PVDIO)pvUser;
3857 return pVDIo->pInterfaceIo->pfnDelete(pVDIo->pInterfaceIo->Core.pvUser,
3858 pcszFilename);
3859}
3860
3861static DECLCALLBACK(int) vdIOIntMove(void *pvUser, const char *pcszSrc, const char *pcszDst,
3862 unsigned fMove)
3863{
3864 PVDIO pVDIo = (PVDIO)pvUser;
3865 return pVDIo->pInterfaceIo->pfnMove(pVDIo->pInterfaceIo->Core.pvUser,
3866 pcszSrc, pcszDst, fMove);
3867}
3868
3869static DECLCALLBACK(int) vdIOIntGetFreeSpace(void *pvUser, const char *pcszFilename,
3870 int64_t *pcbFreeSpace)
3871{
3872 PVDIO pVDIo = (PVDIO)pvUser;
3873 return pVDIo->pInterfaceIo->pfnGetFreeSpace(pVDIo->pInterfaceIo->Core.pvUser,
3874 pcszFilename, pcbFreeSpace);
3875}
3876
3877static DECLCALLBACK(int) vdIOIntGetModificationTime(void *pvUser, const char *pcszFilename,
3878 PRTTIMESPEC pModificationTime)
3879{
3880 PVDIO pVDIo = (PVDIO)pvUser;
3881 return pVDIo->pInterfaceIo->pfnGetModificationTime(pVDIo->pInterfaceIo->Core.pvUser,
3882 pcszFilename, pModificationTime);
3883}
3884
3885static DECLCALLBACK(int) vdIOIntGetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
3886 uint64_t *pcbSize)
3887{
3888 PVDIO pVDIo = (PVDIO)pvUser;
3889 return pVDIo->pInterfaceIo->pfnGetSize(pVDIo->pInterfaceIo->Core.pvUser,
3890 pIoStorage->pStorage, pcbSize);
3891}
3892
3893static DECLCALLBACK(int) vdIOIntSetSize(void *pvUser, PVDIOSTORAGE pIoStorage,
3894 uint64_t cbSize)
3895{
3896 PVDIO pVDIo = (PVDIO)pvUser;
3897 return pVDIo->pInterfaceIo->pfnSetSize(pVDIo->pInterfaceIo->Core.pvUser,
3898 pIoStorage->pStorage, cbSize);
3899}
3900
3901static DECLCALLBACK(int) vdIOIntSetAllocationSize(void *pvUser, PVDIOSTORAGE pIoStorage,
3902 uint64_t cbSize, uint32_t fFlags,
3903 PVDINTERFACEPROGRESS pIfProgress,
3904 unsigned uPercentStart, unsigned uPercentSpan)
3905{
3906 PVDIO pVDIo = (PVDIO)pvUser;
3907 int rc = pVDIo->pInterfaceIo->pfnSetAllocationSize(pVDIo->pInterfaceIo->Core.pvUser,
3908 pIoStorage->pStorage, cbSize, fFlags);
3909 if (rc == VERR_NOT_SUPPORTED)
3910 {
3911 /* Fallback if the underlying medium does not support optimized storage allocation. */
3912 uint64_t cbSizeCur = 0;
3913 rc = pVDIo->pInterfaceIo->pfnGetSize(pVDIo->pInterfaceIo->Core.pvUser,
3914 pIoStorage->pStorage, &cbSizeCur);
3915 if (RT_SUCCESS(rc))
3916 {
3917 if (cbSizeCur < cbSize)
3918 {
3919 const size_t cbBuf = 128 * _1K;
3920 void *pvBuf = RTMemTmpAllocZ(cbBuf);
3921 if (RT_LIKELY(pvBuf))
3922 {
3923 uint64_t cbFill = cbSize - cbSizeCur;
3924 uint64_t uOff = 0;
3925
3926 /* Write data to all blocks. */
3927 while ( uOff < cbFill
3928 && RT_SUCCESS(rc))
3929 {
3930 size_t cbChunk = (size_t)RT_MIN(cbFill - uOff, cbBuf);
3931
3932 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
3933 pIoStorage->pStorage, cbSizeCur + uOff,
3934 pvBuf, cbChunk, NULL);
3935 if (RT_SUCCESS(rc))
3936 {
3937 uOff += cbChunk;
3938
3939 rc = vdIfProgress(pIfProgress, uPercentStart + uOff * uPercentSpan / cbFill);
3940 }
3941 }
3942
3943 RTMemTmpFree(pvBuf);
3944 }
3945 else
3946 rc = VERR_NO_MEMORY;
3947 }
3948 else if (cbSizeCur > cbSize)
3949 rc = pVDIo->pInterfaceIo->pfnSetSize(pVDIo->pInterfaceIo->Core.pvUser,
3950 pIoStorage->pStorage, cbSize);
3951 }
3952 }
3953
3954 if (RT_SUCCESS(rc))
3955 rc = vdIfProgress(pIfProgress, uPercentStart + uPercentSpan);
3956
3957 return rc;
3958}
3959
3960static DECLCALLBACK(int) vdIOIntReadUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
3961 PVDIOCTX pIoCtx, size_t cbRead)
3962{
3963 int rc = VINF_SUCCESS;
3964 PVDIO pVDIo = (PVDIO)pvUser;
3965 PVDISK pDisk = pVDIo->pDisk;
3966
3967 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbRead=%u\n",
3968 pvUser, pIoStorage, uOffset, pIoCtx, cbRead));
3969
3970 /** @todo Enable check for sync I/O later. */
3971 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
3972 VD_IS_LOCKED(pDisk);
3973
3974 Assert(cbRead > 0);
3975
3976 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
3977 {
3978 RTSGSEG Seg;
3979 unsigned cSegments = 1;
3980 size_t cbTaskRead = 0;
3981
3982 /* Synchronous I/O contexts only have one buffer segment. */
3983 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
3984 ("Invalid number of buffer segments for synchronous I/O context"),
3985 VERR_INVALID_PARAMETER);
3986
3987 cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbRead);
3988 Assert(cbRead == cbTaskRead);
3989 Assert(cSegments == 1);
3990 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
3991 pIoStorage->pStorage, uOffset,
3992 Seg.pvSeg, cbRead, NULL);
3993 if (RT_SUCCESS(rc))
3994 {
3995 Assert(cbRead == (uint32_t)cbRead);
3996 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbRead);
3997 }
3998 }
3999 else
4000 {
4001 /* Build the S/G array and spawn a new I/O task */
4002 while (cbRead)
4003 {
4004 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4005 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4006 size_t cbTaskRead = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbRead);
4007
4008 Assert(cSegments > 0);
4009 Assert(cbTaskRead > 0);
4010 AssertMsg(cbTaskRead <= cbRead, ("Invalid number of bytes to read\n"));
4011
4012 LogFlow(("Reading %u bytes into %u segments\n", cbTaskRead, cSegments));
4013
4014#ifdef RT_STRICT
4015 for (unsigned i = 0; i < cSegments; i++)
4016 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4017 ("Segment %u is invalid\n", i));
4018#endif
4019
4020 Assert(cbTaskRead == (uint32_t)cbTaskRead);
4021 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, NULL, NULL, pIoCtx, (uint32_t)cbTaskRead);
4022
4023 if (!pIoTask)
4024 return VERR_NO_MEMORY;
4025
4026 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4027
4028 void *pvTask;
4029 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4030 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4031 pIoStorage->pStorage, uOffset,
4032 aSeg, cSegments, cbTaskRead, pIoTask,
4033 &pvTask);
4034 if (RT_SUCCESS(rc))
4035 {
4036 AssertMsg(cbTaskRead <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4037 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskRead);
4038 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4039 vdIoTaskFree(pDisk, pIoTask);
4040 }
4041 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4042 {
4043 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4044 vdIoTaskFree(pDisk, pIoTask);
4045 break;
4046 }
4047
4048 uOffset += cbTaskRead;
4049 cbRead -= cbTaskRead;
4050 }
4051 }
4052
4053 LogFlowFunc(("returns rc=%Rrc\n", rc));
4054 return rc;
4055}
4056
4057static DECLCALLBACK(int) vdIOIntWriteUser(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4058 PVDIOCTX pIoCtx, size_t cbWrite, PFNVDXFERCOMPLETED pfnComplete,
4059 void *pvCompleteUser)
4060{
4061 int rc = VINF_SUCCESS;
4062 PVDIO pVDIo = (PVDIO)pvUser;
4063 PVDISK pDisk = pVDIo->pDisk;
4064
4065 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pIoCtx=%#p cbWrite=%u\n",
4066 pvUser, pIoStorage, uOffset, pIoCtx, cbWrite));
4067
4068 /** @todo Enable check for sync I/O later. */
4069 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4070 VD_IS_LOCKED(pDisk);
4071
4072 Assert(cbWrite > 0);
4073
4074 if (pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4075 {
4076 RTSGSEG Seg;
4077 unsigned cSegments = 1;
4078 size_t cbTaskWrite = 0;
4079
4080 /* Synchronous I/O contexts only have one buffer segment. */
4081 AssertMsgReturn(pIoCtx->Req.Io.SgBuf.cSegs == 1,
4082 ("Invalid number of buffer segments for synchronous I/O context"),
4083 VERR_INVALID_PARAMETER);
4084
4085 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, &Seg, &cSegments, cbWrite);
4086 Assert(cbWrite == cbTaskWrite);
4087 Assert(cSegments == 1);
4088 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4089 pIoStorage->pStorage, uOffset,
4090 Seg.pvSeg, cbWrite, NULL);
4091 if (RT_SUCCESS(rc))
4092 {
4093 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbWrite);
4094 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbWrite);
4095 }
4096 }
4097 else
4098 {
4099 /* Build the S/G array and spawn a new I/O task */
4100 while (cbWrite)
4101 {
4102 RTSGSEG aSeg[VD_IO_TASK_SEGMENTS_MAX];
4103 unsigned cSegments = VD_IO_TASK_SEGMENTS_MAX;
4104 size_t cbTaskWrite = 0;
4105
4106 cbTaskWrite = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, aSeg, &cSegments, cbWrite);
4107
4108 Assert(cSegments > 0);
4109 Assert(cbTaskWrite > 0);
4110 AssertMsg(cbTaskWrite <= cbWrite, ("Invalid number of bytes to write\n"));
4111
4112 LogFlow(("Writing %u bytes from %u segments\n", cbTaskWrite, cSegments));
4113
4114#ifdef DEBUG
4115 for (unsigned i = 0; i < cSegments; i++)
4116 AssertMsg(aSeg[i].pvSeg && !(aSeg[i].cbSeg % 512),
4117 ("Segment %u is invalid\n", i));
4118#endif
4119
4120 Assert(cbTaskWrite == (uint32_t)cbTaskWrite);
4121 PVDIOTASK pIoTask = vdIoTaskUserAlloc(pIoStorage, pfnComplete, pvCompleteUser, pIoCtx, (uint32_t)cbTaskWrite);
4122
4123 if (!pIoTask)
4124 return VERR_NO_MEMORY;
4125
4126 ASMAtomicIncU32(&pIoCtx->cDataTransfersPending);
4127
4128 void *pvTask;
4129 Log(("Spawning pIoTask=%p pIoCtx=%p\n", pIoTask, pIoCtx));
4130 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4131 pIoStorage->pStorage,
4132 uOffset, aSeg, cSegments,
4133 cbTaskWrite, pIoTask, &pvTask);
4134 if (RT_SUCCESS(rc))
4135 {
4136 AssertMsg(cbTaskWrite <= pIoCtx->Req.Io.cbTransferLeft, ("Impossible!\n"));
4137 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbTaskWrite);
4138 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4139 vdIoTaskFree(pDisk, pIoTask);
4140 }
4141 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4142 {
4143 ASMAtomicDecU32(&pIoCtx->cDataTransfersPending);
4144 vdIoTaskFree(pDisk, pIoTask);
4145 break;
4146 }
4147
4148 uOffset += cbTaskWrite;
4149 cbWrite -= cbTaskWrite;
4150 }
4151 }
4152
4153 LogFlowFunc(("returns rc=%Rrc\n", rc));
4154 return rc;
4155}
4156
4157static DECLCALLBACK(int) vdIOIntReadMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4158 void *pvBuf, size_t cbRead, PVDIOCTX pIoCtx,
4159 PPVDMETAXFER ppMetaXfer, PFNVDXFERCOMPLETED pfnComplete,
4160 void *pvCompleteUser)
4161{
4162 PVDIO pVDIo = (PVDIO)pvUser;
4163 PVDISK pDisk = pVDIo->pDisk;
4164 int rc = VINF_SUCCESS;
4165 RTSGSEG Seg;
4166 PVDIOTASK pIoTask;
4167 PVDMETAXFER pMetaXfer = NULL;
4168 void *pvTask = NULL;
4169
4170 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbRead=%u\n",
4171 pvUser, pIoStorage, uOffset, pvBuf, cbRead));
4172
4173 AssertMsgReturn( pIoCtx
4174 || (!ppMetaXfer && !pfnComplete && !pvCompleteUser),
4175 ("A synchronous metadata read is requested but the parameters are wrong\n"),
4176 VERR_INVALID_POINTER);
4177
4178 /** @todo Enable check for sync I/O later. */
4179 if ( pIoCtx
4180 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4181 VD_IS_LOCKED(pDisk);
4182
4183 if ( !pIoCtx
4184 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4185 {
4186 /* Handle synchronous metadata I/O. */
4187 /** @todo Integrate with metadata transfers below. */
4188 rc = pVDIo->pInterfaceIo->pfnReadSync(pVDIo->pInterfaceIo->Core.pvUser,
4189 pIoStorage->pStorage, uOffset,
4190 pvBuf, cbRead, NULL);
4191 if (ppMetaXfer)
4192 *ppMetaXfer = NULL;
4193 }
4194 else
4195 {
4196 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4197 if (!pMetaXfer)
4198 {
4199#ifdef RT_STRICT
4200 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGetBestFit(pIoStorage->pTreeMetaXfers, uOffset, false /* fAbove */);
4201 AssertMsg(!pMetaXfer || (pMetaXfer->Core.Key + (RTFOFF)pMetaXfer->cbMeta <= (RTFOFF)uOffset),
4202 ("Overlapping meta transfers!\n"));
4203#endif
4204
4205 /* Allocate a new meta transfer. */
4206 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbRead);
4207 if (!pMetaXfer)
4208 return VERR_NO_MEMORY;
4209
4210 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4211 if (!pIoTask)
4212 {
4213 RTMemFree(pMetaXfer);
4214 return VERR_NO_MEMORY;
4215 }
4216
4217 Seg.cbSeg = cbRead;
4218 Seg.pvSeg = pMetaXfer->abData;
4219
4220 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_READ);
4221 rc = pVDIo->pInterfaceIo->pfnReadAsync(pVDIo->pInterfaceIo->Core.pvUser,
4222 pIoStorage->pStorage,
4223 uOffset, &Seg, 1,
4224 cbRead, pIoTask, &pvTask);
4225
4226 if (RT_SUCCESS(rc) || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4227 {
4228 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4229 Assert(fInserted); NOREF(fInserted);
4230 }
4231 else
4232 RTMemFree(pMetaXfer);
4233
4234 if (RT_SUCCESS(rc))
4235 {
4236 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4237 vdIoTaskFree(pDisk, pIoTask);
4238 }
4239 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS && !pfnComplete)
4240 rc = VERR_VD_NOT_ENOUGH_METADATA;
4241 }
4242
4243 Assert(VALID_PTR(pMetaXfer) || RT_FAILURE(rc));
4244
4245 if (RT_SUCCESS(rc) || rc == VERR_VD_NOT_ENOUGH_METADATA || rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4246 {
4247 /* If it is pending add the request to the list. */
4248 if (VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_READ)
4249 {
4250 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4251 AssertPtr(pDeferred);
4252
4253 RTListInit(&pDeferred->NodeDeferred);
4254 pDeferred->pIoCtx = pIoCtx;
4255
4256 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4257 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4258 rc = VERR_VD_NOT_ENOUGH_METADATA;
4259 }
4260 else
4261 {
4262 /* Transfer the data. */
4263 pMetaXfer->cRefs++;
4264 Assert(pMetaXfer->cbMeta >= cbRead);
4265 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4266 if (pMetaXfer->pbDataShw)
4267 memcpy(pvBuf, pMetaXfer->pbDataShw, cbRead);
4268 else
4269 memcpy(pvBuf, pMetaXfer->abData, cbRead);
4270 *ppMetaXfer = pMetaXfer;
4271 }
4272 }
4273 }
4274
4275 LogFlowFunc(("returns rc=%Rrc\n", rc));
4276 return rc;
4277}
4278
4279static DECLCALLBACK(int) vdIOIntWriteMeta(void *pvUser, PVDIOSTORAGE pIoStorage, uint64_t uOffset,
4280 const void *pvBuf, size_t cbWrite, PVDIOCTX pIoCtx,
4281 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4282{
4283 PVDIO pVDIo = (PVDIO)pvUser;
4284 PVDISK pDisk = pVDIo->pDisk;
4285 int rc = VINF_SUCCESS;
4286 RTSGSEG Seg;
4287 PVDIOTASK pIoTask;
4288 PVDMETAXFER pMetaXfer = NULL;
4289 bool fInTree = false;
4290 void *pvTask = NULL;
4291
4292 LogFlowFunc(("pvUser=%#p pIoStorage=%#p uOffset=%llu pvBuf=%#p cbWrite=%u\n",
4293 pvUser, pIoStorage, uOffset, pvBuf, cbWrite));
4294
4295 AssertMsgReturn( pIoCtx
4296 || (!pfnComplete && !pvCompleteUser),
4297 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4298 VERR_INVALID_POINTER);
4299
4300 /** @todo Enable check for sync I/O later. */
4301 if ( pIoCtx
4302 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4303 VD_IS_LOCKED(pDisk);
4304
4305 if ( !pIoCtx
4306 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4307 {
4308 /* Handle synchronous metadata I/O. */
4309 /** @todo Integrate with metadata transfers below. */
4310 rc = pVDIo->pInterfaceIo->pfnWriteSync(pVDIo->pInterfaceIo->Core.pvUser,
4311 pIoStorage->pStorage, uOffset,
4312 pvBuf, cbWrite, NULL);
4313 }
4314 else
4315 {
4316 pMetaXfer = (PVDMETAXFER)RTAvlrFileOffsetGet(pIoStorage->pTreeMetaXfers, uOffset);
4317 if (!pMetaXfer)
4318 {
4319 /* Allocate a new meta transfer. */
4320 pMetaXfer = vdMetaXferAlloc(pIoStorage, uOffset, cbWrite);
4321 if (!pMetaXfer)
4322 return VERR_NO_MEMORY;
4323 }
4324 else
4325 {
4326 Assert(pMetaXfer->cbMeta >= cbWrite);
4327 Assert(pMetaXfer->Core.Key == (RTFOFF)uOffset);
4328 fInTree = true;
4329 }
4330
4331 if (VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
4332 {
4333 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvCompleteUser, pMetaXfer);
4334 if (!pIoTask)
4335 {
4336 RTMemFree(pMetaXfer);
4337 return VERR_NO_MEMORY;
4338 }
4339
4340 memcpy(pMetaXfer->abData, pvBuf, cbWrite);
4341 Seg.cbSeg = cbWrite;
4342 Seg.pvSeg = pMetaXfer->abData;
4343
4344 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4345
4346 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_WRITE);
4347 rc = pVDIo->pInterfaceIo->pfnWriteAsync(pVDIo->pInterfaceIo->Core.pvUser,
4348 pIoStorage->pStorage,
4349 uOffset, &Seg, 1, cbWrite, pIoTask,
4350 &pvTask);
4351 if (RT_SUCCESS(rc))
4352 {
4353 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4354 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4355 vdIoTaskFree(pDisk, pIoTask);
4356 if (fInTree && !pMetaXfer->cRefs)
4357 {
4358 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4359 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4360 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n")); NOREF(fRemoved);
4361 RTMemFree(pMetaXfer);
4362 pMetaXfer = NULL;
4363 }
4364 }
4365 else if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4366 {
4367 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4368 AssertPtr(pDeferred);
4369
4370 RTListInit(&pDeferred->NodeDeferred);
4371 pDeferred->pIoCtx = pIoCtx;
4372
4373 if (!fInTree)
4374 {
4375 bool fInserted = RTAvlrFileOffsetInsert(pIoStorage->pTreeMetaXfers, &pMetaXfer->Core);
4376 Assert(fInserted); NOREF(fInserted);
4377 }
4378
4379 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4380 }
4381 else
4382 {
4383 RTMemFree(pMetaXfer);
4384 pMetaXfer = NULL;
4385 }
4386 }
4387 else
4388 {
4389 /* I/O is in progress, update shadow buffer and add to waiting list. */
4390 Assert(VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
4391 if (!pMetaXfer->pbDataShw)
4392 {
4393 /* Allocate shadow buffer and set initial state. */
4394 LogFlowFunc(("pMetaXfer=%#p Creating shadow buffer\n", pMetaXfer));
4395 pMetaXfer->pbDataShw = (uint8_t *)RTMemAlloc(pMetaXfer->cbMeta);
4396 if (RT_LIKELY(pMetaXfer->pbDataShw))
4397 memcpy(pMetaXfer->pbDataShw, pMetaXfer->abData, pMetaXfer->cbMeta);
4398 else
4399 rc = VERR_NO_MEMORY;
4400 }
4401
4402 if (RT_SUCCESS(rc))
4403 {
4404 /* Update with written data and append to waiting list. */
4405 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4406 if (pDeferred)
4407 {
4408 LogFlowFunc(("pMetaXfer=%#p Updating shadow buffer\n", pMetaXfer));
4409
4410 RTListInit(&pDeferred->NodeDeferred);
4411 pDeferred->pIoCtx = pIoCtx;
4412 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4413 memcpy(pMetaXfer->pbDataShw, pvBuf, cbWrite);
4414 RTListAppend(&pMetaXfer->ListIoCtxShwWrites, &pDeferred->NodeDeferred);
4415 }
4416 else
4417 {
4418 /*
4419 * Free shadow buffer if there is no one depending on it, i.e.
4420 * we just allocated it.
4421 */
4422 if (RTListIsEmpty(&pMetaXfer->ListIoCtxShwWrites))
4423 {
4424 RTMemFree(pMetaXfer->pbDataShw);
4425 pMetaXfer->pbDataShw = NULL;
4426 }
4427 rc = VERR_NO_MEMORY;
4428 }
4429 }
4430 }
4431 }
4432
4433 LogFlowFunc(("returns rc=%Rrc\n", rc));
4434 return rc;
4435}
4436
4437static DECLCALLBACK(void) vdIOIntMetaXferRelease(void *pvUser, PVDMETAXFER pMetaXfer)
4438{
4439 PVDIO pVDIo = (PVDIO)pvUser;
4440 PVDISK pDisk = pVDIo->pDisk;
4441 PVDIOSTORAGE pIoStorage;
4442
4443 /*
4444 * It is possible that we get called with a NULL metadata xfer handle
4445 * for synchronous I/O. Just exit.
4446 */
4447 if (!pMetaXfer)
4448 return;
4449
4450 pIoStorage = pMetaXfer->pIoStorage;
4451
4452 VD_IS_LOCKED(pDisk);
4453
4454 Assert( VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE
4455 || VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_WRITE);
4456 Assert(pMetaXfer->cRefs > 0);
4457
4458 pMetaXfer->cRefs--;
4459 if ( !pMetaXfer->cRefs
4460 && RTListIsEmpty(&pMetaXfer->ListIoCtxWaiting)
4461 && VDMETAXFER_TXDIR_GET(pMetaXfer->fFlags) == VDMETAXFER_TXDIR_NONE)
4462 {
4463 /* Free the meta data entry. */
4464 LogFlow(("Removing meta xfer=%#p\n", pMetaXfer));
4465 bool fRemoved = RTAvlrFileOffsetRemove(pIoStorage->pTreeMetaXfers, pMetaXfer->Core.Key) != NULL;
4466 AssertMsg(fRemoved, ("Metadata transfer wasn't removed\n")); NOREF(fRemoved);
4467
4468 RTMemFree(pMetaXfer);
4469 }
4470}
4471
4472static DECLCALLBACK(int) vdIOIntFlush(void *pvUser, PVDIOSTORAGE pIoStorage, PVDIOCTX pIoCtx,
4473 PFNVDXFERCOMPLETED pfnComplete, void *pvCompleteUser)
4474{
4475 PVDIO pVDIo = (PVDIO)pvUser;
4476 PVDISK pDisk = pVDIo->pDisk;
4477 int rc = VINF_SUCCESS;
4478 PVDIOTASK pIoTask;
4479 PVDMETAXFER pMetaXfer = NULL;
4480 void *pvTask = NULL;
4481
4482 LogFlowFunc(("pvUser=%#p pIoStorage=%#p pIoCtx=%#p\n",
4483 pvUser, pIoStorage, pIoCtx));
4484
4485 AssertMsgReturn( pIoCtx
4486 || (!pfnComplete && !pvCompleteUser),
4487 ("A synchronous metadata write is requested but the parameters are wrong\n"),
4488 VERR_INVALID_POINTER);
4489
4490 /** @todo Enable check for sync I/O later. */
4491 if ( pIoCtx
4492 && !(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4493 VD_IS_LOCKED(pDisk);
4494
4495 if (pVDIo->fIgnoreFlush)
4496 return VINF_SUCCESS;
4497
4498 if ( !pIoCtx
4499 || pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC)
4500 {
4501 /* Handle synchronous flushes. */
4502 /** @todo Integrate with metadata transfers below. */
4503 rc = pVDIo->pInterfaceIo->pfnFlushSync(pVDIo->pInterfaceIo->Core.pvUser,
4504 pIoStorage->pStorage);
4505 }
4506 else
4507 {
4508 /* Allocate a new meta transfer. */
4509 pMetaXfer = vdMetaXferAlloc(pIoStorage, 0, 0);
4510 if (!pMetaXfer)
4511 return VERR_NO_MEMORY;
4512
4513 pIoTask = vdIoTaskMetaAlloc(pIoStorage, pfnComplete, pvUser, pMetaXfer);
4514 if (!pIoTask)
4515 {
4516 RTMemFree(pMetaXfer);
4517 return VERR_NO_MEMORY;
4518 }
4519
4520 ASMAtomicIncU32(&pIoCtx->cMetaTransfersPending);
4521
4522 PVDIOCTXDEFERRED pDeferred = (PVDIOCTXDEFERRED)RTMemAllocZ(sizeof(VDIOCTXDEFERRED));
4523 AssertPtr(pDeferred);
4524
4525 RTListInit(&pDeferred->NodeDeferred);
4526 pDeferred->pIoCtx = pIoCtx;
4527
4528 RTListAppend(&pMetaXfer->ListIoCtxWaiting, &pDeferred->NodeDeferred);
4529 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_FLUSH);
4530 rc = pVDIo->pInterfaceIo->pfnFlushAsync(pVDIo->pInterfaceIo->Core.pvUser,
4531 pIoStorage->pStorage,
4532 pIoTask, &pvTask);
4533 if (RT_SUCCESS(rc))
4534 {
4535 VDMETAXFER_TXDIR_SET(pMetaXfer->fFlags, VDMETAXFER_TXDIR_NONE);
4536 ASMAtomicDecU32(&pIoCtx->cMetaTransfersPending);
4537 vdIoTaskFree(pDisk, pIoTask);
4538 RTMemFree(pDeferred);
4539 RTMemFree(pMetaXfer);
4540 }
4541 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
4542 RTMemFree(pMetaXfer);
4543 }
4544
4545 LogFlowFunc(("returns rc=%Rrc\n", rc));
4546 return rc;
4547}
4548
4549static DECLCALLBACK(size_t) vdIOIntIoCtxCopyTo(void *pvUser, PVDIOCTX pIoCtx,
4550 const void *pvBuf, size_t cbBuf)
4551{
4552 PVDIO pVDIo = (PVDIO)pvUser;
4553 PVDISK pDisk = pVDIo->pDisk;
4554 size_t cbCopied = 0;
4555
4556 /** @todo Enable check for sync I/O later. */
4557 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4558 VD_IS_LOCKED(pDisk);
4559
4560 cbCopied = vdIoCtxCopyTo(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4561 Assert(cbCopied == cbBuf);
4562
4563 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCopied); - triggers with vdCopyHelper/dmgRead.
4564 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4565
4566 return cbCopied;
4567}
4568
4569static DECLCALLBACK(size_t) vdIOIntIoCtxCopyFrom(void *pvUser, PVDIOCTX pIoCtx,
4570 void *pvBuf, size_t cbBuf)
4571{
4572 PVDIO pVDIo = (PVDIO)pvUser;
4573 PVDISK pDisk = pVDIo->pDisk;
4574 size_t cbCopied = 0;
4575
4576 /** @todo Enable check for sync I/O later. */
4577 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4578 VD_IS_LOCKED(pDisk);
4579
4580 cbCopied = vdIoCtxCopyFrom(pIoCtx, (uint8_t *)pvBuf, cbBuf);
4581 Assert(cbCopied == cbBuf);
4582
4583 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft > cbCopied); - triggers with vdCopyHelper/dmgRead.
4584 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCopied);
4585
4586 return cbCopied;
4587}
4588
4589static DECLCALLBACK(size_t) vdIOIntIoCtxSet(void *pvUser, PVDIOCTX pIoCtx, int ch, size_t cb)
4590{
4591 PVDIO pVDIo = (PVDIO)pvUser;
4592 PVDISK pDisk = pVDIo->pDisk;
4593 size_t cbSet = 0;
4594
4595 /** @todo Enable check for sync I/O later. */
4596 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4597 VD_IS_LOCKED(pDisk);
4598
4599 cbSet = vdIoCtxSet(pIoCtx, ch, cb);
4600 Assert(cbSet == cb);
4601
4602 /// @todo Assert(pIoCtx->Req.Io.cbTransferLeft >= cbSet); - triggers with vdCopyHelper/dmgRead.
4603 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbSet);
4604
4605 return cbSet;
4606}
4607
4608static DECLCALLBACK(size_t) vdIOIntIoCtxSegArrayCreate(void *pvUser, PVDIOCTX pIoCtx,
4609 PRTSGSEG paSeg, unsigned *pcSeg,
4610 size_t cbData)
4611{
4612 PVDIO pVDIo = (PVDIO)pvUser;
4613 PVDISK pDisk = pVDIo->pDisk;
4614 size_t cbCreated = 0;
4615
4616 /** @todo It is possible that this gets called from a filter plugin
4617 * outside of the disk lock. Refine assertion or remove completely. */
4618#if 0
4619 /** @todo Enable check for sync I/O later. */
4620 if (!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC))
4621 VD_IS_LOCKED(pDisk);
4622#else
4623 NOREF(pDisk);
4624#endif
4625
4626 cbCreated = RTSgBufSegArrayCreate(&pIoCtx->Req.Io.SgBuf, paSeg, pcSeg, cbData);
4627 Assert(!paSeg || cbData == cbCreated);
4628
4629 return cbCreated;
4630}
4631
4632static DECLCALLBACK(void) vdIOIntIoCtxCompleted(void *pvUser, PVDIOCTX pIoCtx, int rcReq,
4633 size_t cbCompleted)
4634{
4635 PVDIO pVDIo = (PVDIO)pvUser;
4636 PVDISK pDisk = pVDIo->pDisk;
4637
4638 LogFlowFunc(("pvUser=%#p pIoCtx=%#p rcReq=%Rrc cbCompleted=%zu\n",
4639 pvUser, pIoCtx, rcReq, cbCompleted));
4640
4641 /*
4642 * Grab the disk critical section to avoid races with other threads which
4643 * might still modify the I/O context.
4644 * Example is that iSCSI is doing an asynchronous write but calls us already
4645 * while the other thread is still hanging in vdWriteHelperAsync and couldn't update
4646 * the blocked state yet.
4647 * It can overwrite the state to true before we call vdIoCtxContinue and the
4648 * the request would hang indefinite.
4649 */
4650 ASMAtomicCmpXchgS32(&pIoCtx->rcReq, rcReq, VINF_SUCCESS);
4651 Assert(pIoCtx->Req.Io.cbTransferLeft >= cbCompleted);
4652 ASMAtomicSubU32(&pIoCtx->Req.Io.cbTransferLeft, (uint32_t)cbCompleted);
4653
4654 /* Set next transfer function if the current one finished.
4655 * @todo: Find a better way to prevent vdIoCtxContinue from calling the current helper again. */
4656 if (!pIoCtx->Req.Io.cbTransferLeft)
4657 {
4658 pIoCtx->pfnIoCtxTransfer = pIoCtx->pfnIoCtxTransferNext;
4659 pIoCtx->pfnIoCtxTransferNext = NULL;
4660 }
4661
4662 vdIoCtxAddToWaitingList(&pDisk->pIoCtxHaltedHead, pIoCtx);
4663 if (ASMAtomicCmpXchgBool(&pDisk->fLocked, true, false))
4664 {
4665 /* Immediately drop the lock again, it will take care of processing the list. */
4666 vdDiskUnlock(pDisk, NULL);
4667 }
4668}
4669
4670static DECLCALLBACK(bool) vdIOIntIoCtxIsSynchronous(void *pvUser, PVDIOCTX pIoCtx)
4671{
4672 NOREF(pvUser);
4673 return !!(pIoCtx->fFlags & VDIOCTX_FLAGS_SYNC);
4674}
4675
4676static DECLCALLBACK(bool) vdIOIntIoCtxIsZero(void *pvUser, PVDIOCTX pIoCtx, size_t cbCheck,
4677 bool fAdvance)
4678{
4679 NOREF(pvUser);
4680
4681 bool fIsZero = RTSgBufIsZero(&pIoCtx->Req.Io.SgBuf, cbCheck);
4682 if (fIsZero && fAdvance)
4683 RTSgBufAdvance(&pIoCtx->Req.Io.SgBuf, cbCheck);
4684
4685 return fIsZero;
4686}
4687
4688static DECLCALLBACK(size_t) vdIOIntIoCtxGetDataUnitSize(void *pvUser, PVDIOCTX pIoCtx)
4689{
4690 RT_NOREF1(pIoCtx);
4691 PVDIO pVDIo = (PVDIO)pvUser;
4692 PVDISK pDisk = pVDIo->pDisk;
4693 size_t cbSector = 0;
4694
4695 PVDIMAGE pImage = vdGetImageByNumber(pDisk, VD_LAST_IMAGE);
4696 AssertPtrReturn(pImage, 0);
4697
4698 PCVDREGIONLIST pRegionList = NULL;
4699 int rc = pImage->Backend->pfnQueryRegions(pImage->pBackendData, &pRegionList);
4700 if (RT_SUCCESS(rc))
4701 {
4702 cbSector = pRegionList->aRegions[0].cbBlock;
4703
4704 AssertPtr(pImage->Backend->pfnRegionListRelease);
4705 pImage->Backend->pfnRegionListRelease(pImage->pBackendData, pRegionList);
4706 }
4707
4708 return cbSector;
4709}
4710
4711/**
4712 * VD I/O interface callback for opening a file (limited version for VDGetFormat).
4713 */
4714static DECLCALLBACK(int) vdIOIntOpenLimited(void *pvUser, const char *pszLocation,
4715 uint32_t fOpen, PPVDIOSTORAGE ppIoStorage)
4716{
4717 int rc = VINF_SUCCESS;
4718 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4719 PVDIOSTORAGE pIoStorage = (PVDIOSTORAGE)RTMemAllocZ(sizeof(VDIOSTORAGE));
4720
4721 if (!pIoStorage)
4722 return VERR_NO_MEMORY;
4723
4724 rc = pInterfaceIo->pfnOpen(NULL, pszLocation, fOpen, NULL, &pIoStorage->pStorage);
4725 if (RT_SUCCESS(rc))
4726 *ppIoStorage = pIoStorage;
4727 else
4728 RTMemFree(pIoStorage);
4729
4730 return rc;
4731}
4732
4733static DECLCALLBACK(int) vdIOIntCloseLimited(void *pvUser, PVDIOSTORAGE pIoStorage)
4734{
4735 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4736 int rc = pInterfaceIo->pfnClose(NULL, pIoStorage->pStorage);
4737
4738 RTMemFree(pIoStorage);
4739 return rc;
4740}
4741
4742static DECLCALLBACK(int) vdIOIntDeleteLimited(void *pvUser, const char *pcszFilename)
4743{
4744 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4745 return pInterfaceIo->pfnDelete(NULL, pcszFilename);
4746}
4747
4748static DECLCALLBACK(int) vdIOIntMoveLimited(void *pvUser, const char *pcszSrc,
4749 const char *pcszDst, unsigned fMove)
4750{
4751 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4752 return pInterfaceIo->pfnMove(NULL, pcszSrc, pcszDst, fMove);
4753}
4754
4755static DECLCALLBACK(int) vdIOIntGetFreeSpaceLimited(void *pvUser, const char *pcszFilename,
4756 int64_t *pcbFreeSpace)
4757{
4758 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4759 return pInterfaceIo->pfnGetFreeSpace(NULL, pcszFilename, pcbFreeSpace);
4760}
4761
4762static DECLCALLBACK(int) vdIOIntGetModificationTimeLimited(void *pvUser,
4763 const char *pcszFilename,
4764 PRTTIMESPEC pModificationTime)
4765{
4766 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4767 return pInterfaceIo->pfnGetModificationTime(NULL, pcszFilename, pModificationTime);
4768}
4769
4770static DECLCALLBACK(int) vdIOIntGetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4771 uint64_t *pcbSize)
4772{
4773 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4774 return pInterfaceIo->pfnGetSize(NULL, pIoStorage->pStorage, pcbSize);
4775}
4776
4777static DECLCALLBACK(int) vdIOIntSetSizeLimited(void *pvUser, PVDIOSTORAGE pIoStorage,
4778 uint64_t cbSize)
4779{
4780 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4781 return pInterfaceIo->pfnSetSize(NULL, pIoStorage->pStorage, cbSize);
4782}
4783
4784static DECLCALLBACK(int) vdIOIntWriteUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
4785 uint64_t uOffset, PVDIOCTX pIoCtx,
4786 size_t cbWrite,
4787 PFNVDXFERCOMPLETED pfnComplete,
4788 void *pvCompleteUser)
4789{
4790 NOREF(pvUser);
4791 NOREF(pStorage);
4792 NOREF(uOffset);
4793 NOREF(pIoCtx);
4794 NOREF(cbWrite);
4795 NOREF(pfnComplete);
4796 NOREF(pvCompleteUser);
4797 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
4798}
4799
4800static DECLCALLBACK(int) vdIOIntReadUserLimited(void *pvUser, PVDIOSTORAGE pStorage,
4801 uint64_t uOffset, PVDIOCTX pIoCtx,
4802 size_t cbRead)
4803{
4804 NOREF(pvUser);
4805 NOREF(pStorage);
4806 NOREF(uOffset);
4807 NOREF(pIoCtx);
4808 NOREF(cbRead);
4809 AssertMsgFailedReturn(("This needs to be implemented when called\n"), VERR_NOT_IMPLEMENTED);
4810}
4811
4812static DECLCALLBACK(int) vdIOIntWriteMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
4813 uint64_t uOffset, const void *pvBuffer,
4814 size_t cbBuffer, PVDIOCTX pIoCtx,
4815 PFNVDXFERCOMPLETED pfnComplete,
4816 void *pvCompleteUser)
4817{
4818 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4819
4820 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
4821 ("Async I/O not implemented for the limited interface"),
4822 VERR_NOT_SUPPORTED);
4823
4824 return pInterfaceIo->pfnWriteSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
4825}
4826
4827static DECLCALLBACK(int) vdIOIntReadMetaLimited(void *pvUser, PVDIOSTORAGE pStorage,
4828 uint64_t uOffset, void *pvBuffer,
4829 size_t cbBuffer, PVDIOCTX pIoCtx,
4830 PPVDMETAXFER ppMetaXfer,
4831 PFNVDXFERCOMPLETED pfnComplete,
4832 void *pvCompleteUser)
4833{
4834 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4835
4836 AssertMsgReturn(!pIoCtx && !ppMetaXfer && !pfnComplete && !pvCompleteUser,
4837 ("Async I/O not implemented for the limited interface"),
4838 VERR_NOT_SUPPORTED);
4839
4840 return pInterfaceIo->pfnReadSync(NULL, pStorage->pStorage, uOffset, pvBuffer, cbBuffer, NULL);
4841}
4842
4843#if 0 /* unsed */
4844static int vdIOIntMetaXferReleaseLimited(void *pvUser, PVDMETAXFER pMetaXfer)
4845{
4846 /* This is a NOP in this case. */
4847 NOREF(pvUser);
4848 NOREF(pMetaXfer);
4849 return VINF_SUCCESS;
4850}
4851#endif
4852
4853static DECLCALLBACK(int) vdIOIntFlushLimited(void *pvUser, PVDIOSTORAGE pStorage,
4854 PVDIOCTX pIoCtx,
4855 PFNVDXFERCOMPLETED pfnComplete,
4856 void *pvCompleteUser)
4857{
4858 PVDINTERFACEIO pInterfaceIo = (PVDINTERFACEIO)pvUser;
4859
4860 AssertMsgReturn(!pIoCtx && !pfnComplete && !pvCompleteUser,
4861 ("Async I/O not implemented for the limited interface"),
4862 VERR_NOT_SUPPORTED);
4863
4864 return pInterfaceIo->pfnFlushSync(NULL, pStorage->pStorage);
4865}
4866
4867/**
4868 * internal: send output to the log (unconditionally).
4869 */
4870static DECLCALLBACK(int) vdLogMessage(void *pvUser, const char *pszFormat, va_list args)
4871{
4872 NOREF(pvUser);
4873 RTLogPrintfV(pszFormat, args);
4874 return VINF_SUCCESS;
4875}
4876
4877DECLINLINE(int) vdMessageWrapper(PVDISK pDisk, const char *pszFormat, ...)
4878{
4879 va_list va;
4880 va_start(va, pszFormat);
4881 int rc = pDisk->pInterfaceError->pfnMessage(pDisk->pInterfaceError->Core.pvUser,
4882 pszFormat, va);
4883 va_end(va);
4884 return rc;
4885}
4886
4887
4888/**
4889 * internal: adjust PCHS geometry
4890 */
4891static void vdFixupPCHSGeometry(PVDGEOMETRY pPCHS, uint64_t cbSize)
4892{
4893 /* Fix broken PCHS geometry. Can happen for two reasons: either the backend
4894 * mixes up PCHS and LCHS, or the application used to create the source
4895 * image has put garbage in it. Additionally, if the PCHS geometry covers
4896 * more than the image size, set it back to the default. */
4897 if ( pPCHS->cHeads > 16
4898 || pPCHS->cSectors > 63
4899 || pPCHS->cCylinders == 0
4900 || (uint64_t)pPCHS->cHeads * pPCHS->cSectors * pPCHS->cCylinders * 512 > cbSize)
4901 {
4902 Assert(!(RT_MIN(cbSize / 512 / 16 / 63, 16383) - (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383)));
4903 pPCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / 16 / 63, 16383);
4904 pPCHS->cHeads = 16;
4905 pPCHS->cSectors = 63;
4906 }
4907}
4908
4909/**
4910 * internal: adjust PCHS geometry
4911 */
4912static void vdFixupLCHSGeometry(PVDGEOMETRY pLCHS, uint64_t cbSize)
4913{
4914 /* Fix broken LCHS geometry. Can happen for two reasons: either the backend
4915 * mixes up PCHS and LCHS, or the application used to create the source
4916 * image has put garbage in it. The fix in this case is to clear the LCHS
4917 * geometry to trigger autodetection when it is used next. If the geometry
4918 * already says "please autodetect" (cylinders=0) keep it. */
4919 if ( ( pLCHS->cHeads > 255
4920 || pLCHS->cHeads == 0
4921 || pLCHS->cSectors > 63
4922 || pLCHS->cSectors == 0)
4923 && pLCHS->cCylinders != 0)
4924 {
4925 pLCHS->cCylinders = 0;
4926 pLCHS->cHeads = 0;
4927 pLCHS->cSectors = 0;
4928 }
4929 /* Always recompute the number of cylinders stored in the LCHS
4930 * geometry if it isn't set to "autotedetect" at the moment.
4931 * This is very useful if the destination image size is
4932 * larger or smaller than the source image size. Do not modify
4933 * the number of heads and sectors. Windows guests hate it. */
4934 if ( pLCHS->cCylinders != 0
4935 && pLCHS->cHeads != 0 /* paranoia */
4936 && pLCHS->cSectors != 0 /* paranoia */)
4937 {
4938 Assert(!(RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024) - (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024)));
4939 pLCHS->cCylinders = (uint32_t)RT_MIN(cbSize / 512 / pLCHS->cHeads / pLCHS->cSectors, 1024);
4940 }
4941}
4942
4943/**
4944 * Sets the I/O callbacks of the given interface to the fallback methods
4945 *
4946 * @returns nothing.
4947 * @param pIfIo The I/O interface to setup.
4948 */
4949static void vdIfIoFallbackCallbacksSetup(PVDINTERFACEIO pIfIo)
4950{
4951 pIfIo->pfnOpen = vdIOOpenFallback;
4952 pIfIo->pfnClose = vdIOCloseFallback;
4953 pIfIo->pfnDelete = vdIODeleteFallback;
4954 pIfIo->pfnMove = vdIOMoveFallback;
4955 pIfIo->pfnGetFreeSpace = vdIOGetFreeSpaceFallback;
4956 pIfIo->pfnGetModificationTime = vdIOGetModificationTimeFallback;
4957 pIfIo->pfnGetSize = vdIOGetSizeFallback;
4958 pIfIo->pfnSetSize = vdIOSetSizeFallback;
4959 pIfIo->pfnSetAllocationSize = vdIOSetAllocationSizeFallback;
4960 pIfIo->pfnReadSync = vdIOReadSyncFallback;
4961 pIfIo->pfnWriteSync = vdIOWriteSyncFallback;
4962 pIfIo->pfnFlushSync = vdIOFlushSyncFallback;
4963 pIfIo->pfnReadAsync = vdIOReadAsyncFallback;
4964 pIfIo->pfnWriteAsync = vdIOWriteAsyncFallback;
4965 pIfIo->pfnFlushAsync = vdIOFlushAsyncFallback;
4966}
4967
4968/**
4969 * Sets the internal I/O callbacks of the given interface.
4970 *
4971 * @returns nothing.
4972 * @param pIfIoInt The internal I/O interface to setup.
4973 */
4974static void vdIfIoIntCallbacksSetup(PVDINTERFACEIOINT pIfIoInt)
4975{
4976 pIfIoInt->pfnOpen = vdIOIntOpen;
4977 pIfIoInt->pfnClose = vdIOIntClose;
4978 pIfIoInt->pfnDelete = vdIOIntDelete;
4979 pIfIoInt->pfnMove = vdIOIntMove;
4980 pIfIoInt->pfnGetFreeSpace = vdIOIntGetFreeSpace;
4981 pIfIoInt->pfnGetModificationTime = vdIOIntGetModificationTime;
4982 pIfIoInt->pfnGetSize = vdIOIntGetSize;
4983 pIfIoInt->pfnSetSize = vdIOIntSetSize;
4984 pIfIoInt->pfnSetAllocationSize = vdIOIntSetAllocationSize;
4985 pIfIoInt->pfnReadUser = vdIOIntReadUser;
4986 pIfIoInt->pfnWriteUser = vdIOIntWriteUser;
4987 pIfIoInt->pfnReadMeta = vdIOIntReadMeta;
4988 pIfIoInt->pfnWriteMeta = vdIOIntWriteMeta;
4989 pIfIoInt->pfnMetaXferRelease = vdIOIntMetaXferRelease;
4990 pIfIoInt->pfnFlush = vdIOIntFlush;
4991 pIfIoInt->pfnIoCtxCopyFrom = vdIOIntIoCtxCopyFrom;
4992 pIfIoInt->pfnIoCtxCopyTo = vdIOIntIoCtxCopyTo;
4993 pIfIoInt->pfnIoCtxSet = vdIOIntIoCtxSet;
4994 pIfIoInt->pfnIoCtxSegArrayCreate = vdIOIntIoCtxSegArrayCreate;
4995 pIfIoInt->pfnIoCtxCompleted = vdIOIntIoCtxCompleted;
4996 pIfIoInt->pfnIoCtxIsSynchronous = vdIOIntIoCtxIsSynchronous;
4997 pIfIoInt->pfnIoCtxIsZero = vdIOIntIoCtxIsZero;
4998 pIfIoInt->pfnIoCtxGetDataUnitSize = vdIOIntIoCtxGetDataUnitSize;
4999}
5000
5001/**
5002 * Internally used completion handler for synchronous I/O contexts.
5003 */
5004static DECLCALLBACK(void) vdIoCtxSyncComplete(void *pvUser1, void *pvUser2, int rcReq)
5005{
5006 RT_NOREF2(pvUser1, rcReq);
5007 RTSEMEVENT hEvent = (RTSEMEVENT)pvUser2;
5008
5009 RTSemEventSignal(hEvent);
5010}
5011
5012/**
5013 * Initializes HDD backends.
5014 *
5015 * @returns VBox status code.
5016 */
5017VBOXDDU_DECL(int) VDInit(void)
5018{
5019 int rc = vdPluginInit();
5020 LogRel(("VD: VDInit finished with %Rrc\n", rc));
5021 return rc;
5022}
5023
5024/**
5025 * Destroys loaded HDD backends.
5026 *
5027 * @returns VBox status code.
5028 */
5029VBOXDDU_DECL(int) VDShutdown(void)
5030{
5031 return vdPluginTerm();
5032}
5033
5034/**
5035 * Loads a single plugin given by filename.
5036 *
5037 * @returns VBox status code.
5038 * @param pszFilename The plugin filename to load.
5039 */
5040VBOXDDU_DECL(int) VDPluginLoadFromFilename(const char *pszFilename)
5041{
5042 if (!vdPluginIsInitialized())
5043 {
5044 int rc = VDInit();
5045 if (RT_FAILURE(rc))
5046 return rc;
5047 }
5048
5049 return vdPluginLoadFromFilename(pszFilename);
5050}
5051
5052/**
5053 * Load all plugins from a given path.
5054 *
5055 * @returns VBox statuse code.
5056 * @param pszPath The path to load plugins from.
5057 */
5058VBOXDDU_DECL(int) VDPluginLoadFromPath(const char *pszPath)
5059{
5060 if (!vdPluginIsInitialized())
5061 {
5062 int rc = VDInit();
5063 if (RT_FAILURE(rc))
5064 return rc;
5065 }
5066
5067 return vdPluginLoadFromPath(pszPath);
5068}
5069
5070/**
5071 * Unloads a single plugin given by filename.
5072 *
5073 * @returns VBox status code.
5074 * @param pszFilename The plugin filename to unload.
5075 */
5076VBOXDDU_DECL(int) VDPluginUnloadFromFilename(const char *pszFilename)
5077{
5078 if (!vdPluginIsInitialized())
5079 {
5080 int rc = VDInit();
5081 if (RT_FAILURE(rc))
5082 return rc;
5083 }
5084
5085 return vdPluginUnloadFromFilename(pszFilename);
5086}
5087
5088/**
5089 * Unload all plugins from a given path.
5090 *
5091 * @returns VBox statuse code.
5092 * @param pszPath The path to unload plugins from.
5093 */
5094VBOXDDU_DECL(int) VDPluginUnloadFromPath(const char *pszPath)
5095{
5096 if (!vdPluginIsInitialized())
5097 {
5098 int rc = VDInit();
5099 if (RT_FAILURE(rc))
5100 return rc;
5101 }
5102
5103 return vdPluginUnloadFromPath(pszPath);
5104}
5105
5106/**
5107 * Lists all HDD backends and their capabilities in a caller-provided buffer.
5108 *
5109 * @returns VBox status code.
5110 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5111 * @param cEntriesAlloc Number of list entries available.
5112 * @param pEntries Pointer to array for the entries.
5113 * @param pcEntriesUsed Number of entries returned.
5114 */
5115VBOXDDU_DECL(int) VDBackendInfo(unsigned cEntriesAlloc, PVDBACKENDINFO pEntries,
5116 unsigned *pcEntriesUsed)
5117{
5118 int rc = VINF_SUCCESS;
5119
5120 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5121 /* Check arguments. */
5122 AssertMsgReturn(cEntriesAlloc,
5123 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5124 VERR_INVALID_PARAMETER);
5125 AssertMsgReturn(VALID_PTR(pEntries),
5126 ("pEntries=%#p\n", pEntries),
5127 VERR_INVALID_PARAMETER);
5128 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5129 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5130 VERR_INVALID_PARAMETER);
5131 if (!vdPluginIsInitialized())
5132 VDInit();
5133
5134 uint32_t cBackends = vdGetImageBackendCount();
5135 if (cEntriesAlloc < cBackends)
5136 {
5137 *pcEntriesUsed = cBackends;
5138 return VERR_BUFFER_OVERFLOW;
5139 }
5140
5141 for (unsigned i = 0; i < cBackends; i++)
5142 {
5143 PCVDIMAGEBACKEND pBackend;
5144 rc = vdQueryImageBackend(i, &pBackend);
5145 AssertRC(rc);
5146
5147 pEntries[i].pszBackend = pBackend->pszBackendName;
5148 pEntries[i].uBackendCaps = pBackend->uBackendCaps;
5149 pEntries[i].paFileExtensions = pBackend->paFileExtensions;
5150 pEntries[i].paConfigInfo = pBackend->paConfigInfo;
5151 pEntries[i].pfnComposeLocation = pBackend->pfnComposeLocation;
5152 pEntries[i].pfnComposeName = pBackend->pfnComposeName;
5153 }
5154
5155 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cBackends));
5156 *pcEntriesUsed = cBackends;
5157 return rc;
5158}
5159
5160/**
5161 * Lists the capabilities of a backend identified by its name.
5162 *
5163 * @returns VBox status code.
5164 * @param pszBackend The backend name.
5165 * @param pEntry Pointer to an entry.
5166 */
5167VBOXDDU_DECL(int) VDBackendInfoOne(const char *pszBackend, PVDBACKENDINFO pEntry)
5168{
5169 LogFlowFunc(("pszBackend=%#p pEntry=%#p\n", pszBackend, pEntry));
5170 /* Check arguments. */
5171 AssertMsgReturn(VALID_PTR(pszBackend),
5172 ("pszBackend=%#p\n", pszBackend),
5173 VERR_INVALID_PARAMETER);
5174 AssertMsgReturn(VALID_PTR(pEntry),
5175 ("pEntry=%#p\n", pEntry),
5176 VERR_INVALID_PARAMETER);
5177 if (!vdPluginIsInitialized())
5178 VDInit();
5179
5180 PCVDIMAGEBACKEND pBackend;
5181 int rc = vdFindImageBackend(pszBackend, &pBackend);
5182 if (RT_SUCCESS(rc))
5183 {
5184 pEntry->pszBackend = pBackend->pszBackendName;
5185 pEntry->uBackendCaps = pBackend->uBackendCaps;
5186 pEntry->paFileExtensions = pBackend->paFileExtensions;
5187 pEntry->paConfigInfo = pBackend->paConfigInfo;
5188 }
5189
5190 return rc;
5191}
5192
5193/**
5194 * Lists all filters and their capabilities in a caller-provided buffer.
5195 *
5196 * @return VBox status code.
5197 * VERR_BUFFER_OVERFLOW if not enough space is passed.
5198 * @param cEntriesAlloc Number of list entries available.
5199 * @param pEntries Pointer to array for the entries.
5200 * @param pcEntriesUsed Number of entries returned.
5201 */
5202VBOXDDU_DECL(int) VDFilterInfo(unsigned cEntriesAlloc, PVDFILTERINFO pEntries,
5203 unsigned *pcEntriesUsed)
5204{
5205 int rc = VINF_SUCCESS;
5206
5207 LogFlowFunc(("cEntriesAlloc=%u pEntries=%#p pcEntriesUsed=%#p\n", cEntriesAlloc, pEntries, pcEntriesUsed));
5208 /* Check arguments. */
5209 AssertMsgReturn(cEntriesAlloc,
5210 ("cEntriesAlloc=%u\n", cEntriesAlloc),
5211 VERR_INVALID_PARAMETER);
5212 AssertMsgReturn(VALID_PTR(pEntries),
5213 ("pEntries=%#p\n", pEntries),
5214 VERR_INVALID_PARAMETER);
5215 AssertMsgReturn(VALID_PTR(pcEntriesUsed),
5216 ("pcEntriesUsed=%#p\n", pcEntriesUsed),
5217 VERR_INVALID_PARAMETER);
5218 if (!vdPluginIsInitialized())
5219 VDInit();
5220
5221 uint32_t cBackends = vdGetFilterBackendCount();
5222 if (cEntriesAlloc < cBackends)
5223 {
5224 *pcEntriesUsed = cBackends;
5225 return VERR_BUFFER_OVERFLOW;
5226 }
5227
5228 for (unsigned i = 0; i < cBackends; i++)
5229 {
5230 PCVDFILTERBACKEND pBackend;
5231 rc = vdQueryFilterBackend(i, &pBackend);
5232 pEntries[i].pszFilter = pBackend->pszBackendName;
5233 pEntries[i].paConfigInfo = pBackend->paConfigInfo;
5234 }
5235
5236 LogFlowFunc(("returns %Rrc *pcEntriesUsed=%u\n", rc, cBackends));
5237 *pcEntriesUsed = cBackends;
5238 return rc;
5239}
5240
5241/**
5242 * Lists the capabilities of a filter identified by its name.
5243 *
5244 * @return VBox status code.
5245 * @param pszFilter The filter name (case insensitive).
5246 * @param pEntry Pointer to an entry.
5247 */
5248VBOXDDU_DECL(int) VDFilterInfoOne(const char *pszFilter, PVDFILTERINFO pEntry)
5249{
5250 LogFlowFunc(("pszFilter=%#p pEntry=%#p\n", pszFilter, pEntry));
5251 /* Check arguments. */
5252 AssertMsgReturn(VALID_PTR(pszFilter),
5253 ("pszFilter=%#p\n", pszFilter),
5254 VERR_INVALID_PARAMETER);
5255 AssertMsgReturn(VALID_PTR(pEntry),
5256 ("pEntry=%#p\n", pEntry),
5257 VERR_INVALID_PARAMETER);
5258 if (!vdPluginIsInitialized())
5259 VDInit();
5260
5261 PCVDFILTERBACKEND pBackend;
5262 int rc = vdFindFilterBackend(pszFilter, &pBackend);
5263 if (RT_SUCCESS(rc))
5264 {
5265 pEntry->pszFilter = pBackend->pszBackendName;
5266 pEntry->paConfigInfo = pBackend->paConfigInfo;
5267 }
5268
5269 return rc;
5270}
5271
5272/**
5273 * Allocates and initializes an empty HDD container.
5274 * No image files are opened.
5275 *
5276 * @returns VBox status code.
5277 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5278 * @param enmType Type of the image container.
5279 * @param ppDisk Where to store the reference to HDD container.
5280 */
5281VBOXDDU_DECL(int) VDCreate(PVDINTERFACE pVDIfsDisk, VDTYPE enmType, PVDISK *ppDisk)
5282{
5283 int rc = VINF_SUCCESS;
5284 PVDISK pDisk = NULL;
5285
5286 LogFlowFunc(("pVDIfsDisk=%#p\n", pVDIfsDisk));
5287 do
5288 {
5289 /* Check arguments. */
5290 AssertMsgBreakStmt(VALID_PTR(ppDisk),
5291 ("ppDisk=%#p\n", ppDisk),
5292 rc = VERR_INVALID_PARAMETER);
5293
5294 pDisk = (PVDISK)RTMemAllocZ(sizeof(VDISK));
5295 if (pDisk)
5296 {
5297 pDisk->u32Signature = VDISK_SIGNATURE;
5298 pDisk->enmType = enmType;
5299 pDisk->cImages = 0;
5300 pDisk->pBase = NULL;
5301 pDisk->pLast = NULL;
5302 pDisk->cbSize = 0;
5303 pDisk->PCHSGeometry.cCylinders = 0;
5304 pDisk->PCHSGeometry.cHeads = 0;
5305 pDisk->PCHSGeometry.cSectors = 0;
5306 pDisk->LCHSGeometry.cCylinders = 0;
5307 pDisk->LCHSGeometry.cHeads = 0;
5308 pDisk->LCHSGeometry.cSectors = 0;
5309 pDisk->pVDIfsDisk = pVDIfsDisk;
5310 pDisk->pInterfaceError = NULL;
5311 pDisk->pInterfaceThreadSync = NULL;
5312 pDisk->pIoCtxLockOwner = NULL;
5313 pDisk->pIoCtxHead = NULL;
5314 pDisk->fLocked = false;
5315 pDisk->hMemCacheIoCtx = NIL_RTMEMCACHE;
5316 pDisk->hMemCacheIoTask = NIL_RTMEMCACHE;
5317 RTListInit(&pDisk->ListFilterChainWrite);
5318 RTListInit(&pDisk->ListFilterChainRead);
5319
5320 /* Create the I/O ctx cache */
5321 rc = RTMemCacheCreate(&pDisk->hMemCacheIoCtx, sizeof(VDIOCTX), 0, UINT32_MAX,
5322 NULL, NULL, NULL, 0);
5323 if (RT_FAILURE(rc))
5324 break;
5325
5326 /* Create the I/O task cache */
5327 rc = RTMemCacheCreate(&pDisk->hMemCacheIoTask, sizeof(VDIOTASK), 0, UINT32_MAX,
5328 NULL, NULL, NULL, 0);
5329 if (RT_FAILURE(rc))
5330 break;
5331
5332 pDisk->pInterfaceError = VDIfErrorGet(pVDIfsDisk);
5333 pDisk->pInterfaceThreadSync = VDIfThreadSyncGet(pVDIfsDisk);
5334
5335 *ppDisk = pDisk;
5336 }
5337 else
5338 {
5339 rc = VERR_NO_MEMORY;
5340 break;
5341 }
5342 } while (0);
5343
5344 if ( RT_FAILURE(rc)
5345 && pDisk)
5346 {
5347 if (pDisk->hMemCacheIoCtx != NIL_RTMEMCACHE)
5348 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5349 if (pDisk->hMemCacheIoTask != NIL_RTMEMCACHE)
5350 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5351 }
5352
5353 LogFlowFunc(("returns %Rrc (pDisk=%#p)\n", rc, pDisk));
5354 return rc;
5355}
5356
5357/**
5358 * Destroys HDD container.
5359 * If container has opened image files they will be closed.
5360 *
5361 * @returns VBox status code.
5362 * @param pDisk Pointer to HDD container.
5363 */
5364VBOXDDU_DECL(int) VDDestroy(PVDISK pDisk)
5365{
5366 int rc = VINF_SUCCESS;
5367 LogFlowFunc(("pDisk=%#p\n", pDisk));
5368 do
5369 {
5370 /* sanity check */
5371 AssertPtrBreak(pDisk);
5372 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5373 Assert(!pDisk->fLocked);
5374
5375 rc = VDCloseAll(pDisk);
5376 int rc2 = VDFilterRemoveAll(pDisk);
5377 if (RT_SUCCESS(rc))
5378 rc = rc2;
5379
5380 RTMemCacheDestroy(pDisk->hMemCacheIoCtx);
5381 RTMemCacheDestroy(pDisk->hMemCacheIoTask);
5382 RTMemFree(pDisk);
5383 } while (0);
5384 LogFlowFunc(("returns %Rrc\n", rc));
5385 return rc;
5386}
5387
5388/**
5389 * Try to get the backend name which can use this image.
5390 *
5391 * @returns VBox status code.
5392 * VINF_SUCCESS if a plugin was found.
5393 * ppszFormat contains the string which can be used as backend name.
5394 * VERR_NOT_SUPPORTED if no backend was found.
5395 * @param pVDIfsDisk Pointer to the per-disk VD interface list.
5396 * @param pVDIfsImage Pointer to the per-image VD interface list.
5397 * @param pszFilename Name of the image file for which the backend is queried.
5398 * @param ppszFormat Receives pointer of the UTF-8 string which contains the format name.
5399 * The returned pointer must be freed using RTStrFree().
5400 */
5401VBOXDDU_DECL(int) VDGetFormat(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
5402 const char *pszFilename, char **ppszFormat, VDTYPE *penmType)
5403{
5404 int rc = VERR_NOT_SUPPORTED;
5405 VDINTERFACEIOINT VDIfIoInt;
5406 VDINTERFACEIO VDIfIoFallback;
5407 PVDINTERFACEIO pInterfaceIo;
5408
5409 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
5410 /* Check arguments. */
5411 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
5412 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5413 VERR_INVALID_PARAMETER);
5414 AssertMsgReturn(VALID_PTR(ppszFormat),
5415 ("ppszFormat=%#p\n", ppszFormat),
5416 VERR_INVALID_PARAMETER);
5417 AssertMsgReturn(VALID_PTR(penmType),
5418 ("penmType=%#p\n", penmType),
5419 VERR_INVALID_PARAMETER);
5420
5421 if (!vdPluginIsInitialized())
5422 VDInit();
5423
5424 pInterfaceIo = VDIfIoGet(pVDIfsImage);
5425 if (!pInterfaceIo)
5426 {
5427 /*
5428 * Caller doesn't provide an I/O interface, create our own using the
5429 * native file API.
5430 */
5431 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
5432 pInterfaceIo = &VDIfIoFallback;
5433 }
5434
5435 /* Set up the internal I/O interface. */
5436 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
5437 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
5438 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
5439 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
5440 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
5441 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
5442 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
5443 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
5444 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
5445 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
5446 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
5447 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
5448 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
5449 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
5450 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5451 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
5452 AssertRC(rc);
5453
5454 /* Find the backend supporting this file format. */
5455 for (unsigned i = 0; i < vdGetImageBackendCount(); i++)
5456 {
5457 PCVDIMAGEBACKEND pBackend;
5458 rc = vdQueryImageBackend(i, &pBackend);
5459 AssertRC(rc);
5460
5461 if (pBackend->pfnProbe)
5462 {
5463 rc = pBackend->pfnProbe(pszFilename, pVDIfsDisk, pVDIfsImage, penmType);
5464 if ( RT_SUCCESS(rc)
5465 /* The correct backend has been found, but there is a small
5466 * incompatibility so that the file cannot be used. Stop here
5467 * and signal success - the actual open will of course fail,
5468 * but that will create a really sensible error message. */
5469
5470 /** @todo r=bird: this bit of code is _certifiably_ _insane_ as it allows
5471 * simple stuff like VERR_EOF to pass thru. I've just amended it with
5472 * disallowing VERR_EOF too, but someone needs to pick up the courage to
5473 * fix this stuff properly or at least update the docs!
5474 * (Parallels returns VERR_EOF, btw.) */
5475
5476 || ( rc != VERR_VD_GEN_INVALID_HEADER
5477 && rc != VERR_VD_VDI_INVALID_HEADER
5478 && rc != VERR_VD_VMDK_INVALID_HEADER
5479 && rc != VERR_VD_ISCSI_INVALID_HEADER
5480 && rc != VERR_VD_VHD_INVALID_HEADER
5481 && rc != VERR_VD_RAW_INVALID_HEADER
5482 && rc != VERR_VD_RAW_SIZE_MODULO_512
5483 && rc != VERR_VD_RAW_SIZE_MODULO_2048
5484 && rc != VERR_VD_RAW_SIZE_OPTICAL_TOO_SMALL
5485 && rc != VERR_VD_RAW_SIZE_FLOPPY_TOO_BIG
5486 && rc != VERR_VD_PARALLELS_INVALID_HEADER
5487 && rc != VERR_VD_DMG_INVALID_HEADER
5488 && rc != VERR_EOF /* bird for viso */
5489 ))
5490 {
5491 /* Copy the name into the new string. */
5492 char *pszFormat = RTStrDup(pBackend->pszBackendName);
5493 if (!pszFormat)
5494 {
5495 rc = VERR_NO_MEMORY;
5496 break;
5497 }
5498 *ppszFormat = pszFormat;
5499 /* Do not consider the typical file access errors as success,
5500 * which allows the caller to deal with such issues. */
5501 if ( rc != VERR_ACCESS_DENIED
5502 && rc != VERR_PATH_NOT_FOUND
5503 && rc != VERR_FILE_NOT_FOUND)
5504 rc = VINF_SUCCESS;
5505 break;
5506 }
5507 rc = VERR_NOT_SUPPORTED;
5508 }
5509 }
5510
5511 /* Try the cache backends. */
5512 if (rc == VERR_NOT_SUPPORTED)
5513 {
5514 for (unsigned i = 0; i < vdGetCacheBackendCount(); i++)
5515 {
5516 PCVDCACHEBACKEND pBackend;
5517 rc = vdQueryCacheBackend(i, &pBackend);
5518 AssertRC(rc);
5519
5520 if (pBackend->pfnProbe)
5521 {
5522 rc = pBackend->pfnProbe(pszFilename, pVDIfsDisk, pVDIfsImage);
5523 if ( RT_SUCCESS(rc)
5524 || (rc != VERR_VD_GEN_INVALID_HEADER))
5525 {
5526 /* Copy the name into the new string. */
5527 char *pszFormat = RTStrDup(pBackend->pszBackendName);
5528 if (!pszFormat)
5529 {
5530 rc = VERR_NO_MEMORY;
5531 break;
5532 }
5533 *ppszFormat = pszFormat;
5534 rc = VINF_SUCCESS;
5535 break;
5536 }
5537 rc = VERR_NOT_SUPPORTED;
5538 }
5539 }
5540 }
5541
5542 LogFlowFunc(("returns %Rrc *ppszFormat=\"%s\"\n", rc, *ppszFormat));
5543 return rc;
5544}
5545
5546/**
5547 * Opens an image file.
5548 *
5549 * The first opened image file in HDD container must have a base image type,
5550 * others (next opened images) must be a differencing or undo images.
5551 * Linkage is checked for differencing image to be in consistence with the previously opened image.
5552 * When another differencing image is opened and the last image was opened in read/write access
5553 * mode, then the last image is reopened in read-only with deny write sharing mode. This allows
5554 * other processes to use images in read-only mode too.
5555 *
5556 * Note that the image is opened in read-only mode if a read/write open is not possible.
5557 * Use VDIsReadOnly to check open mode.
5558 *
5559 * @returns VBox status code.
5560 * @param pDisk Pointer to HDD container.
5561 * @param pszBackend Name of the image file backend to use.
5562 * @param pszFilename Name of the image file to open.
5563 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5564 * @param pVDIfsImage Pointer to the per-image VD interface list.
5565 */
5566VBOXDDU_DECL(int) VDOpen(PVDISK pDisk, const char *pszBackend,
5567 const char *pszFilename, unsigned uOpenFlags,
5568 PVDINTERFACE pVDIfsImage)
5569{
5570 int rc = VINF_SUCCESS;
5571 int rc2;
5572 bool fLockWrite = false;
5573 PVDIMAGE pImage = NULL;
5574
5575 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsImage=%#p\n",
5576 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsImage));
5577
5578 do
5579 {
5580 /* sanity check */
5581 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5582 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5583
5584 /* Check arguments. */
5585 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5586 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5587 rc = VERR_INVALID_PARAMETER);
5588 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5589 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5590 rc = VERR_INVALID_PARAMETER);
5591 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5592 ("uOpenFlags=%#x\n", uOpenFlags),
5593 rc = VERR_INVALID_PARAMETER);
5594 AssertMsgBreakStmt( !(uOpenFlags & VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS)
5595 || (uOpenFlags & VD_OPEN_FLAGS_READONLY),
5596 ("uOpenFlags=%#x\n", uOpenFlags),
5597 rc = VERR_INVALID_PARAMETER);
5598
5599 /*
5600 * Destroy the current discard state first which might still have pending blocks
5601 * for the currently opened image which will be switched to readonly mode.
5602 */
5603 /* Lock disk for writing, as we modify pDisk information below. */
5604 rc2 = vdThreadStartWrite(pDisk);
5605 AssertRC(rc2);
5606 fLockWrite = true;
5607 rc = vdDiscardStateDestroy(pDisk);
5608 if (RT_FAILURE(rc))
5609 break;
5610 rc2 = vdThreadFinishWrite(pDisk);
5611 AssertRC(rc2);
5612 fLockWrite = false;
5613
5614 /* Set up image descriptor. */
5615 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
5616 if (!pImage)
5617 {
5618 rc = VERR_NO_MEMORY;
5619 break;
5620 }
5621 pImage->pszFilename = RTStrDup(pszFilename);
5622 if (!pImage->pszFilename)
5623 {
5624 rc = VERR_NO_MEMORY;
5625 break;
5626 }
5627
5628 pImage->VDIo.pDisk = pDisk;
5629 pImage->pVDIfsImage = pVDIfsImage;
5630
5631 rc = vdFindImageBackend(pszBackend, &pImage->Backend);
5632 if (RT_FAILURE(rc))
5633 break;
5634 if (!pImage->Backend)
5635 {
5636 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5637 N_("VD: unknown backend name '%s'"), pszBackend);
5638 break;
5639 }
5640
5641 /*
5642 * Fail if the backend can't do async I/O but the
5643 * flag is set.
5644 */
5645 if ( !(pImage->Backend->uBackendCaps & VD_CAP_ASYNC)
5646 && (uOpenFlags & VD_OPEN_FLAGS_ASYNC_IO))
5647 {
5648 rc = vdError(pDisk, VERR_NOT_SUPPORTED, RT_SRC_POS,
5649 N_("VD: Backend '%s' does not support async I/O"), pszBackend);
5650 break;
5651 }
5652
5653 /*
5654 * Fail if the backend doesn't support the discard operation but the
5655 * flag is set.
5656 */
5657 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DISCARD)
5658 && (uOpenFlags & VD_OPEN_FLAGS_DISCARD))
5659 {
5660 rc = vdError(pDisk, VERR_VD_DISCARD_NOT_SUPPORTED, RT_SRC_POS,
5661 N_("VD: Backend '%s' does not support discard"), pszBackend);
5662 break;
5663 }
5664
5665 /* Set up the I/O interface. */
5666 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
5667 if (!pImage->VDIo.pInterfaceIo)
5668 {
5669 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
5670 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
5671 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
5672 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
5673 }
5674
5675 /* Set up the internal I/O interface. */
5676 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
5677 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
5678 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5679 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
5680 AssertRC(rc);
5681
5682 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
5683 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
5684 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5685 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5686 pDisk->pVDIfsDisk,
5687 pImage->pVDIfsImage,
5688 pDisk->enmType,
5689 &pImage->pBackendData);
5690 /*
5691 * If the image is corrupted and there is a repair method try to repair it
5692 * first if it was openend in read-write mode and open again afterwards.
5693 */
5694 if ( RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED)
5695 && !(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5696 && pImage->Backend->pfnRepair)
5697 {
5698 rc = pImage->Backend->pfnRepair(pszFilename, pDisk->pVDIfsDisk, pImage->pVDIfsImage, 0 /* fFlags */);
5699 if (RT_SUCCESS(rc))
5700 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5701 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS),
5702 pDisk->pVDIfsDisk,
5703 pImage->pVDIfsImage,
5704 pDisk->enmType,
5705 &pImage->pBackendData);
5706 else
5707 {
5708 rc = vdError(pDisk, rc, RT_SRC_POS,
5709 N_("VD: error %Rrc repairing corrupted image file '%s'"), rc, pszFilename);
5710 break;
5711 }
5712 }
5713 else if (RT_UNLIKELY(rc == VERR_VD_IMAGE_CORRUPTED))
5714 {
5715 rc = vdError(pDisk, rc, RT_SRC_POS,
5716 N_("VD: Image file '%s' is corrupted and can't be opened"), pszFilename);
5717 break;
5718 }
5719
5720 /* If the open in read-write mode failed, retry in read-only mode. */
5721 if (RT_FAILURE(rc))
5722 {
5723 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5724 && ( rc == VERR_ACCESS_DENIED
5725 || rc == VERR_PERMISSION_DENIED
5726 || rc == VERR_WRITE_PROTECT
5727 || rc == VERR_SHARING_VIOLATION
5728 || rc == VERR_FILE_LOCK_FAILED))
5729 rc = pImage->Backend->pfnOpen(pImage->pszFilename,
5730 (uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS))
5731 | VD_OPEN_FLAGS_READONLY,
5732 pDisk->pVDIfsDisk,
5733 pImage->pVDIfsImage,
5734 pDisk->enmType,
5735 &pImage->pBackendData);
5736 if (RT_FAILURE(rc))
5737 {
5738 rc = vdError(pDisk, rc, RT_SRC_POS,
5739 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
5740 break;
5741 }
5742 }
5743
5744 /* Lock disk for writing, as we modify pDisk information below. */
5745 rc2 = vdThreadStartWrite(pDisk);
5746 AssertRC(rc2);
5747 fLockWrite = true;
5748
5749 pImage->VDIo.pBackendData = pImage->pBackendData;
5750
5751 /* Check image type. As the image itself has only partial knowledge
5752 * whether it's a base image or not, this info is derived here. The
5753 * base image can be fixed or normal, all others must be normal or
5754 * diff images. Some image formats don't distinguish between normal
5755 * and diff images, so this must be corrected here. */
5756 unsigned uImageFlags;
5757 uImageFlags = pImage->Backend->pfnGetImageFlags(pImage->pBackendData);
5758 if (RT_FAILURE(rc))
5759 uImageFlags = VD_IMAGE_FLAGS_NONE;
5760 if ( RT_SUCCESS(rc)
5761 && !(uOpenFlags & VD_OPEN_FLAGS_INFO))
5762 {
5763 if ( pDisk->cImages == 0
5764 && (uImageFlags & VD_IMAGE_FLAGS_DIFF))
5765 {
5766 rc = VERR_VD_INVALID_TYPE;
5767 break;
5768 }
5769 else if (pDisk->cImages != 0)
5770 {
5771 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5772 {
5773 rc = VERR_VD_INVALID_TYPE;
5774 break;
5775 }
5776 else
5777 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5778 }
5779 }
5780
5781 /* Ensure we always get correct diff information, even if the backend
5782 * doesn't actually have a stored flag for this. It must not return
5783 * bogus information for the parent UUID if it is not a diff image. */
5784 RTUUID parentUuid;
5785 RTUuidClear(&parentUuid);
5786 rc2 = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, &parentUuid);
5787 if (RT_SUCCESS(rc2) && !RTUuidIsNull(&parentUuid))
5788 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
5789
5790 pImage->uImageFlags = uImageFlags;
5791
5792 /* Force sane optimization settings. It's not worth avoiding writes
5793 * to fixed size images. The overhead would have almost no payback. */
5794 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
5795 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
5796
5797 /** @todo optionally check UUIDs */
5798
5799 /* Cache disk information. */
5800 pDisk->cbSize = vdImageGetSize(pImage);
5801
5802 /* Cache PCHS geometry. */
5803 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
5804 &pDisk->PCHSGeometry);
5805 if (RT_FAILURE(rc2))
5806 {
5807 pDisk->PCHSGeometry.cCylinders = 0;
5808 pDisk->PCHSGeometry.cHeads = 0;
5809 pDisk->PCHSGeometry.cSectors = 0;
5810 }
5811 else
5812 {
5813 /* Make sure the PCHS geometry is properly clipped. */
5814 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
5815 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
5816 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
5817 }
5818
5819 /* Cache LCHS geometry. */
5820 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
5821 &pDisk->LCHSGeometry);
5822 if (RT_FAILURE(rc2))
5823 {
5824 pDisk->LCHSGeometry.cCylinders = 0;
5825 pDisk->LCHSGeometry.cHeads = 0;
5826 pDisk->LCHSGeometry.cSectors = 0;
5827 }
5828 else
5829 {
5830 /* Make sure the LCHS geometry is properly clipped. */
5831 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
5832 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
5833 }
5834
5835 if (pDisk->cImages != 0)
5836 {
5837 /* Switch previous image to read-only mode. */
5838 unsigned uOpenFlagsPrevImg;
5839 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
5840 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
5841 {
5842 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
5843 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
5844 }
5845 }
5846
5847 if (RT_SUCCESS(rc))
5848 {
5849 /* Image successfully opened, make it the last image. */
5850 vdAddImageToList(pDisk, pImage);
5851 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
5852 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
5853 }
5854 else
5855 {
5856 /* Error detected, but image opened. Close image. */
5857 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
5858 AssertRC(rc2);
5859 pImage->pBackendData = NULL;
5860 }
5861 } while (0);
5862
5863 if (RT_UNLIKELY(fLockWrite))
5864 {
5865 rc2 = vdThreadFinishWrite(pDisk);
5866 AssertRC(rc2);
5867 }
5868
5869 if (RT_FAILURE(rc))
5870 {
5871 if (pImage)
5872 {
5873 if (pImage->pszFilename)
5874 RTStrFree(pImage->pszFilename);
5875 RTMemFree(pImage);
5876 }
5877 }
5878
5879 LogFlowFunc(("returns %Rrc\n", rc));
5880 return rc;
5881}
5882
5883/**
5884 * Opens a cache image.
5885 *
5886 * @return VBox status code.
5887 * @param pDisk Pointer to the HDD container which should use the cache image.
5888 * @param pszBackend Name of the cache file backend to use (case insensitive).
5889 * @param pszFilename Name of the cache image to open.
5890 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
5891 * @param pVDIfsCache Pointer to the per-cache VD interface list.
5892 */
5893VBOXDDU_DECL(int) VDCacheOpen(PVDISK pDisk, const char *pszBackend,
5894 const char *pszFilename, unsigned uOpenFlags,
5895 PVDINTERFACE pVDIfsCache)
5896{
5897 int rc = VINF_SUCCESS;
5898 int rc2;
5899 bool fLockWrite = false;
5900 PVDCACHE pCache = NULL;
5901
5902 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uOpenFlags=%#x, pVDIfsCache=%#p\n",
5903 pDisk, pszBackend, pszFilename, uOpenFlags, pVDIfsCache));
5904
5905 do
5906 {
5907 /* sanity check */
5908 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
5909 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
5910
5911 /* Check arguments. */
5912 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
5913 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
5914 rc = VERR_INVALID_PARAMETER);
5915 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
5916 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
5917 rc = VERR_INVALID_PARAMETER);
5918 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
5919 ("uOpenFlags=%#x\n", uOpenFlags),
5920 rc = VERR_INVALID_PARAMETER);
5921
5922 /* Set up image descriptor. */
5923 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
5924 if (!pCache)
5925 {
5926 rc = VERR_NO_MEMORY;
5927 break;
5928 }
5929 pCache->pszFilename = RTStrDup(pszFilename);
5930 if (!pCache->pszFilename)
5931 {
5932 rc = VERR_NO_MEMORY;
5933 break;
5934 }
5935
5936 pCache->VDIo.pDisk = pDisk;
5937 pCache->pVDIfsCache = pVDIfsCache;
5938
5939 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
5940 if (RT_FAILURE(rc))
5941 break;
5942 if (!pCache->Backend)
5943 {
5944 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
5945 N_("VD: unknown backend name '%s'"), pszBackend);
5946 break;
5947 }
5948
5949 /* Set up the I/O interface. */
5950 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
5951 if (!pCache->VDIo.pInterfaceIo)
5952 {
5953 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
5954 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
5955 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
5956 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
5957 }
5958
5959 /* Set up the internal I/O interface. */
5960 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
5961 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
5962 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
5963 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
5964 AssertRC(rc);
5965
5966 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
5967 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
5968 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
5969 pDisk->pVDIfsDisk,
5970 pCache->pVDIfsCache,
5971 &pCache->pBackendData);
5972 /* If the open in read-write mode failed, retry in read-only mode. */
5973 if (RT_FAILURE(rc))
5974 {
5975 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY)
5976 && ( rc == VERR_ACCESS_DENIED
5977 || rc == VERR_PERMISSION_DENIED
5978 || rc == VERR_WRITE_PROTECT
5979 || rc == VERR_SHARING_VIOLATION
5980 || rc == VERR_FILE_LOCK_FAILED))
5981 rc = pCache->Backend->pfnOpen(pCache->pszFilename,
5982 (uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME)
5983 | VD_OPEN_FLAGS_READONLY,
5984 pDisk->pVDIfsDisk,
5985 pCache->pVDIfsCache,
5986 &pCache->pBackendData);
5987 if (RT_FAILURE(rc))
5988 {
5989 rc = vdError(pDisk, rc, RT_SRC_POS,
5990 N_("VD: error %Rrc opening image file '%s'"), rc, pszFilename);
5991 break;
5992 }
5993 }
5994
5995 /* Lock disk for writing, as we modify pDisk information below. */
5996 rc2 = vdThreadStartWrite(pDisk);
5997 AssertRC(rc2);
5998 fLockWrite = true;
5999
6000 /*
6001 * Check that the modification UUID of the cache and last image
6002 * match. If not the image was modified in-between without the cache.
6003 * The cache might contain stale data.
6004 */
6005 RTUUID UuidImage, UuidCache;
6006
6007 rc = pCache->Backend->pfnGetModificationUuid(pCache->pBackendData,
6008 &UuidCache);
6009 if (RT_SUCCESS(rc))
6010 {
6011 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6012 &UuidImage);
6013 if (RT_SUCCESS(rc))
6014 {
6015 if (RTUuidCompare(&UuidImage, &UuidCache))
6016 rc = VERR_VD_CACHE_NOT_UP_TO_DATE;
6017 }
6018 }
6019
6020 /*
6021 * We assume that the user knows what he is doing if one of the images
6022 * doesn't support the modification uuid.
6023 */
6024 if (rc == VERR_NOT_SUPPORTED)
6025 rc = VINF_SUCCESS;
6026
6027 if (RT_SUCCESS(rc))
6028 {
6029 /* Cache successfully opened, make it the current one. */
6030 if (!pDisk->pCache)
6031 pDisk->pCache = pCache;
6032 else
6033 rc = VERR_VD_CACHE_ALREADY_EXISTS;
6034 }
6035
6036 if (RT_FAILURE(rc))
6037 {
6038 /* Error detected, but image opened. Close image. */
6039 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
6040 AssertRC(rc2);
6041 pCache->pBackendData = NULL;
6042 }
6043 } while (0);
6044
6045 if (RT_UNLIKELY(fLockWrite))
6046 {
6047 rc2 = vdThreadFinishWrite(pDisk);
6048 AssertRC(rc2);
6049 }
6050
6051 if (RT_FAILURE(rc))
6052 {
6053 if (pCache)
6054 {
6055 if (pCache->pszFilename)
6056 RTStrFree(pCache->pszFilename);
6057 RTMemFree(pCache);
6058 }
6059 }
6060
6061 LogFlowFunc(("returns %Rrc\n", rc));
6062 return rc;
6063}
6064
6065VBOXDDU_DECL(int) VDFilterAdd(PVDISK pDisk, const char *pszFilter, uint32_t fFlags,
6066 PVDINTERFACE pVDIfsFilter)
6067{
6068 int rc = VINF_SUCCESS;
6069 int rc2;
6070 bool fLockWrite = false;
6071 PVDFILTER pFilter = NULL;
6072
6073 LogFlowFunc(("pDisk=%#p pszFilter=\"%s\" pVDIfsFilter=%#p\n",
6074 pDisk, pszFilter, pVDIfsFilter));
6075
6076 do
6077 {
6078 /* sanity check */
6079 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6080 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6081
6082 /* Check arguments. */
6083 AssertMsgBreakStmt(VALID_PTR(pszFilter) && *pszFilter,
6084 ("pszFilter=%#p \"%s\"\n", pszFilter, pszFilter),
6085 rc = VERR_INVALID_PARAMETER);
6086
6087 AssertMsgBreakStmt(!(fFlags & ~VD_FILTER_FLAGS_MASK),
6088 ("Invalid flags set (fFlags=%#x)\n", fFlags),
6089 rc = VERR_INVALID_PARAMETER);
6090
6091 /* Set up image descriptor. */
6092 pFilter = (PVDFILTER)RTMemAllocZ(sizeof(VDFILTER));
6093 if (!pFilter)
6094 {
6095 rc = VERR_NO_MEMORY;
6096 break;
6097 }
6098
6099 rc = vdFindFilterBackend(pszFilter, &pFilter->pBackend);
6100 if (RT_FAILURE(rc))
6101 break;
6102 if (!pFilter->pBackend)
6103 {
6104 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6105 N_("VD: unknown filter backend name '%s'"), pszFilter);
6106 break;
6107 }
6108
6109 pFilter->VDIo.pDisk = pDisk;
6110 pFilter->pVDIfsFilter = pVDIfsFilter;
6111
6112 /* Set up the internal I/O interface. */
6113 AssertBreakStmt(!VDIfIoIntGet(pVDIfsFilter), rc = VERR_INVALID_PARAMETER);
6114 vdIfIoIntCallbacksSetup(&pFilter->VDIo.VDIfIoInt);
6115 rc = VDInterfaceAdd(&pFilter->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6116 &pFilter->VDIo, sizeof(VDINTERFACEIOINT), &pFilter->pVDIfsFilter);
6117 AssertRC(rc);
6118
6119 rc = pFilter->pBackend->pfnCreate(pDisk->pVDIfsDisk, fFlags & VD_FILTER_FLAGS_INFO,
6120 pFilter->pVDIfsFilter, &pFilter->pvBackendData);
6121 if (RT_FAILURE(rc))
6122 break;
6123
6124 /* Lock disk for writing, as we modify pDisk information below. */
6125 rc2 = vdThreadStartWrite(pDisk);
6126 AssertRC(rc2);
6127 fLockWrite = true;
6128
6129 /* Add filter to chains. */
6130 if (fFlags & VD_FILTER_FLAGS_WRITE)
6131 {
6132 RTListAppend(&pDisk->ListFilterChainWrite, &pFilter->ListNodeChainWrite);
6133 vdFilterRetain(pFilter);
6134 }
6135
6136 if (fFlags & VD_FILTER_FLAGS_READ)
6137 {
6138 RTListAppend(&pDisk->ListFilterChainRead, &pFilter->ListNodeChainRead);
6139 vdFilterRetain(pFilter);
6140 }
6141 } while (0);
6142
6143 if (RT_UNLIKELY(fLockWrite))
6144 {
6145 rc2 = vdThreadFinishWrite(pDisk);
6146 AssertRC(rc2);
6147 }
6148
6149 if (RT_FAILURE(rc))
6150 {
6151 if (pFilter)
6152 RTMemFree(pFilter);
6153 }
6154
6155 LogFlowFunc(("returns %Rrc\n", rc));
6156 return rc;
6157}
6158
6159/**
6160 * Creates and opens a new base image file.
6161 *
6162 * @returns VBox status code.
6163 * @param pDisk Pointer to HDD container.
6164 * @param pszBackend Name of the image file backend to use.
6165 * @param pszFilename Name of the image file to create.
6166 * @param cbSize Image size in bytes.
6167 * @param uImageFlags Flags specifying special image features.
6168 * @param pszComment Pointer to image comment. NULL is ok.
6169 * @param pPCHSGeometry Pointer to physical disk geometry <= (16383,16,63). Not NULL.
6170 * @param pLCHSGeometry Pointer to logical disk geometry <= (x,255,63). Not NULL.
6171 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6172 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6173 * @param pVDIfsImage Pointer to the per-image VD interface list.
6174 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6175 */
6176VBOXDDU_DECL(int) VDCreateBase(PVDISK pDisk, const char *pszBackend,
6177 const char *pszFilename, uint64_t cbSize,
6178 unsigned uImageFlags, const char *pszComment,
6179 PCVDGEOMETRY pPCHSGeometry,
6180 PCVDGEOMETRY pLCHSGeometry,
6181 PCRTUUID pUuid, unsigned uOpenFlags,
6182 PVDINTERFACE pVDIfsImage,
6183 PVDINTERFACE pVDIfsOperation)
6184{
6185 int rc = VINF_SUCCESS;
6186 int rc2;
6187 bool fLockWrite = false, fLockRead = false;
6188 PVDIMAGE pImage = NULL;
6189 RTUUID uuid;
6190
6191 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" PCHS=%u/%u/%u LCHS=%u/%u/%u Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6192 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment,
6193 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6194 pPCHSGeometry->cSectors, pLCHSGeometry->cCylinders,
6195 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors, pUuid,
6196 uOpenFlags, pVDIfsImage, pVDIfsOperation));
6197
6198 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6199
6200 do
6201 {
6202 /* sanity check */
6203 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6204 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6205
6206 /* Check arguments. */
6207 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6208 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6209 rc = VERR_INVALID_PARAMETER);
6210 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6211 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6212 rc = VERR_INVALID_PARAMETER);
6213 AssertMsgBreakStmt(cbSize,
6214 ("cbSize=%llu\n", cbSize),
6215 rc = VERR_INVALID_PARAMETER);
6216 if (cbSize % 512)
6217 {
6218 rc = vdError(pDisk, VERR_VD_INVALID_SIZE, RT_SRC_POS,
6219 N_("VD: The given disk size %llu is not aligned on a sector boundary (512 bytes)"), cbSize);
6220 break;
6221 }
6222 AssertMsgBreakStmt( ((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0)
6223 || ((uImageFlags & (VD_IMAGE_FLAGS_FIXED | VD_IMAGE_FLAGS_DIFF)) != VD_IMAGE_FLAGS_FIXED),
6224 ("uImageFlags=%#x\n", uImageFlags),
6225 rc = VERR_INVALID_PARAMETER);
6226 /* The PCHS geometry fields may be 0 to leave it for later. */
6227 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
6228 && pPCHSGeometry->cHeads <= 16
6229 && pPCHSGeometry->cSectors <= 63,
6230 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
6231 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
6232 pPCHSGeometry->cSectors),
6233 rc = VERR_INVALID_PARAMETER);
6234 /* The LCHS geometry fields may be 0 to leave it to later autodetection. */
6235 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
6236 && pLCHSGeometry->cHeads <= 255
6237 && pLCHSGeometry->cSectors <= 63,
6238 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
6239 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
6240 pLCHSGeometry->cSectors),
6241 rc = VERR_INVALID_PARAMETER);
6242 /* The UUID may be NULL. */
6243 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6244 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6245 rc = VERR_INVALID_PARAMETER);
6246 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6247 ("uOpenFlags=%#x\n", uOpenFlags),
6248 rc = VERR_INVALID_PARAMETER);
6249
6250 /* Check state. Needs a temporary read lock. Holding the write lock
6251 * all the time would be blocking other activities for too long. */
6252 rc2 = vdThreadStartRead(pDisk);
6253 AssertRC(rc2);
6254 fLockRead = true;
6255 AssertMsgBreakStmt(pDisk->cImages == 0,
6256 ("Create base image cannot be done with other images open\n"),
6257 rc = VERR_VD_INVALID_STATE);
6258 rc2 = vdThreadFinishRead(pDisk);
6259 AssertRC(rc2);
6260 fLockRead = false;
6261
6262 /* Set up image descriptor. */
6263 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6264 if (!pImage)
6265 {
6266 rc = VERR_NO_MEMORY;
6267 break;
6268 }
6269 pImage->pszFilename = RTStrDup(pszFilename);
6270 if (!pImage->pszFilename)
6271 {
6272 rc = VERR_NO_MEMORY;
6273 break;
6274 }
6275 pImage->VDIo.pDisk = pDisk;
6276 pImage->pVDIfsImage = pVDIfsImage;
6277
6278 /* Set up the I/O interface. */
6279 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6280 if (!pImage->VDIo.pInterfaceIo)
6281 {
6282 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6283 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6284 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6285 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6286 }
6287
6288 /* Set up the internal I/O interface. */
6289 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6290 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6291 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6292 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6293 AssertRC(rc);
6294
6295 rc = vdFindImageBackend(pszBackend, &pImage->Backend);
6296 if (RT_FAILURE(rc))
6297 break;
6298 if (!pImage->Backend)
6299 {
6300 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6301 N_("VD: unknown backend name '%s'"), pszBackend);
6302 break;
6303 }
6304 if (!(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6305 | VD_CAP_CREATE_DYNAMIC)))
6306 {
6307 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6308 N_("VD: backend '%s' cannot create base images"), pszBackend);
6309 break;
6310 }
6311 if ( ( (uImageFlags & VD_VMDK_IMAGE_FLAGS_SPLIT_2G)
6312 && !(pImage->Backend->uBackendCaps & VD_CAP_CREATE_SPLIT_2G))
6313 || ( (uImageFlags & VD_VMDK_IMAGE_FLAGS_STREAM_OPTIMIZED)
6314 && RTStrICmp(pszBackend, "VMDK")))
6315 {
6316 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6317 N_("VD: backend '%s' does not support the selected image variant"), pszBackend);
6318 break;
6319 }
6320
6321 /* Create UUID if the caller didn't specify one. */
6322 if (!pUuid)
6323 {
6324 rc = RTUuidCreate(&uuid);
6325 if (RT_FAILURE(rc))
6326 {
6327 rc = vdError(pDisk, rc, RT_SRC_POS,
6328 N_("VD: cannot generate UUID for image '%s'"),
6329 pszFilename);
6330 break;
6331 }
6332 pUuid = &uuid;
6333 }
6334
6335 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6336 uImageFlags &= ~VD_IMAGE_FLAGS_DIFF;
6337 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6338 rc = pImage->Backend->pfnCreate(pImage->pszFilename, cbSize,
6339 uImageFlags, pszComment, pPCHSGeometry,
6340 pLCHSGeometry, pUuid,
6341 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6342 0, 99,
6343 pDisk->pVDIfsDisk,
6344 pImage->pVDIfsImage,
6345 pVDIfsOperation,
6346 pDisk->enmType,
6347 &pImage->pBackendData);
6348
6349 if (RT_SUCCESS(rc))
6350 {
6351 pImage->VDIo.pBackendData = pImage->pBackendData;
6352 pImage->uImageFlags = uImageFlags;
6353
6354 /* Force sane optimization settings. It's not worth avoiding writes
6355 * to fixed size images. The overhead would have almost no payback. */
6356 if (uImageFlags & VD_IMAGE_FLAGS_FIXED)
6357 pImage->uOpenFlags |= VD_OPEN_FLAGS_HONOR_SAME;
6358
6359 /* Lock disk for writing, as we modify pDisk information below. */
6360 rc2 = vdThreadStartWrite(pDisk);
6361 AssertRC(rc2);
6362 fLockWrite = true;
6363
6364 /** @todo optionally check UUIDs */
6365
6366 /* Re-check state, as the lock wasn't held and another image
6367 * creation call could have been done by another thread. */
6368 AssertMsgStmt(pDisk->cImages == 0,
6369 ("Create base image cannot be done with other images open\n"),
6370 rc = VERR_VD_INVALID_STATE);
6371 }
6372
6373 if (RT_SUCCESS(rc))
6374 {
6375 /* Cache disk information. */
6376 pDisk->cbSize = vdImageGetSize(pImage);
6377
6378 /* Cache PCHS geometry. */
6379 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
6380 &pDisk->PCHSGeometry);
6381 if (RT_FAILURE(rc2))
6382 {
6383 pDisk->PCHSGeometry.cCylinders = 0;
6384 pDisk->PCHSGeometry.cHeads = 0;
6385 pDisk->PCHSGeometry.cSectors = 0;
6386 }
6387 else
6388 {
6389 /* Make sure the CHS geometry is properly clipped. */
6390 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
6391 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
6392 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
6393 }
6394
6395 /* Cache LCHS geometry. */
6396 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
6397 &pDisk->LCHSGeometry);
6398 if (RT_FAILURE(rc2))
6399 {
6400 pDisk->LCHSGeometry.cCylinders = 0;
6401 pDisk->LCHSGeometry.cHeads = 0;
6402 pDisk->LCHSGeometry.cSectors = 0;
6403 }
6404 else
6405 {
6406 /* Make sure the CHS geometry is properly clipped. */
6407 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
6408 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
6409 }
6410
6411 /* Image successfully opened, make it the last image. */
6412 vdAddImageToList(pDisk, pImage);
6413 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6414 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6415 }
6416 else
6417 {
6418 /* Error detected, image may or may not be opened. Close and delete
6419 * image if it was opened. */
6420 if (pImage->pBackendData)
6421 {
6422 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6423 AssertRC(rc2);
6424 pImage->pBackendData = NULL;
6425 }
6426 }
6427 } while (0);
6428
6429 if (RT_UNLIKELY(fLockWrite))
6430 {
6431 rc2 = vdThreadFinishWrite(pDisk);
6432 AssertRC(rc2);
6433 }
6434 else if (RT_UNLIKELY(fLockRead))
6435 {
6436 rc2 = vdThreadFinishRead(pDisk);
6437 AssertRC(rc2);
6438 }
6439
6440 if (RT_FAILURE(rc))
6441 {
6442 if (pImage)
6443 {
6444 if (pImage->pszFilename)
6445 RTStrFree(pImage->pszFilename);
6446 RTMemFree(pImage);
6447 }
6448 }
6449
6450 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6451 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6452
6453 LogFlowFunc(("returns %Rrc\n", rc));
6454 return rc;
6455}
6456
6457/**
6458 * Creates and opens a new differencing image file in HDD container.
6459 * See comments for VDOpen function about differencing images.
6460 *
6461 * @returns VBox status code.
6462 * @param pDisk Pointer to HDD container.
6463 * @param pszBackend Name of the image file backend to use.
6464 * @param pszFilename Name of the differencing image file to create.
6465 * @param uImageFlags Flags specifying special image features.
6466 * @param pszComment Pointer to image comment. NULL is ok.
6467 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6468 * @param pParentUuid New parent UUID of the image. If NULL, the UUID is queried automatically.
6469 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6470 * @param pVDIfsImage Pointer to the per-image VD interface list.
6471 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6472 */
6473VBOXDDU_DECL(int) VDCreateDiff(PVDISK pDisk, const char *pszBackend,
6474 const char *pszFilename, unsigned uImageFlags,
6475 const char *pszComment, PCRTUUID pUuid,
6476 PCRTUUID pParentUuid, unsigned uOpenFlags,
6477 PVDINTERFACE pVDIfsImage,
6478 PVDINTERFACE pVDIfsOperation)
6479{
6480 int rc = VINF_SUCCESS;
6481 int rc2;
6482 bool fLockWrite = false, fLockRead = false;
6483 PVDIMAGE pImage = NULL;
6484 RTUUID uuid;
6485
6486 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6487 pDisk, pszBackend, pszFilename, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsImage, pVDIfsOperation));
6488
6489 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6490
6491 do
6492 {
6493 /* sanity check */
6494 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6495 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6496
6497 /* Check arguments. */
6498 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6499 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6500 rc = VERR_INVALID_PARAMETER);
6501 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6502 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6503 rc = VERR_INVALID_PARAMETER);
6504 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6505 ("uImageFlags=%#x\n", uImageFlags),
6506 rc = VERR_INVALID_PARAMETER);
6507 /* The UUID may be NULL. */
6508 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6509 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6510 rc = VERR_INVALID_PARAMETER);
6511 /* The parent UUID may be NULL. */
6512 AssertMsgBreakStmt(pParentUuid == NULL || VALID_PTR(pParentUuid),
6513 ("pParentUuid=%#p ParentUUID=%RTuuid\n", pParentUuid, pParentUuid),
6514 rc = VERR_INVALID_PARAMETER);
6515 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6516 ("uOpenFlags=%#x\n", uOpenFlags),
6517 rc = VERR_INVALID_PARAMETER);
6518
6519 /* Check state. Needs a temporary read lock. Holding the write lock
6520 * all the time would be blocking other activities for too long. */
6521 rc2 = vdThreadStartRead(pDisk);
6522 AssertRC(rc2);
6523 fLockRead = true;
6524 AssertMsgBreakStmt(pDisk->cImages != 0,
6525 ("Create diff image cannot be done without other images open\n"),
6526 rc = VERR_VD_INVALID_STATE);
6527 rc2 = vdThreadFinishRead(pDisk);
6528 AssertRC(rc2);
6529 fLockRead = false;
6530
6531 /*
6532 * Destroy the current discard state first which might still have pending blocks
6533 * for the currently opened image which will be switched to readonly mode.
6534 */
6535 /* Lock disk for writing, as we modify pDisk information below. */
6536 rc2 = vdThreadStartWrite(pDisk);
6537 AssertRC(rc2);
6538 fLockWrite = true;
6539 rc = vdDiscardStateDestroy(pDisk);
6540 if (RT_FAILURE(rc))
6541 break;
6542 rc2 = vdThreadFinishWrite(pDisk);
6543 AssertRC(rc2);
6544 fLockWrite = false;
6545
6546 /* Set up image descriptor. */
6547 pImage = (PVDIMAGE)RTMemAllocZ(sizeof(VDIMAGE));
6548 if (!pImage)
6549 {
6550 rc = VERR_NO_MEMORY;
6551 break;
6552 }
6553 pImage->pszFilename = RTStrDup(pszFilename);
6554 if (!pImage->pszFilename)
6555 {
6556 rc = VERR_NO_MEMORY;
6557 break;
6558 }
6559
6560 rc = vdFindImageBackend(pszBackend, &pImage->Backend);
6561 if (RT_FAILURE(rc))
6562 break;
6563 if (!pImage->Backend)
6564 {
6565 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6566 N_("VD: unknown backend name '%s'"), pszBackend);
6567 break;
6568 }
6569 if ( !(pImage->Backend->uBackendCaps & VD_CAP_DIFF)
6570 || !(pImage->Backend->uBackendCaps & ( VD_CAP_CREATE_FIXED
6571 | VD_CAP_CREATE_DYNAMIC)))
6572 {
6573 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6574 N_("VD: backend '%s' cannot create diff images"), pszBackend);
6575 break;
6576 }
6577
6578 pImage->VDIo.pDisk = pDisk;
6579 pImage->pVDIfsImage = pVDIfsImage;
6580
6581 /* Set up the I/O interface. */
6582 pImage->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsImage);
6583 if (!pImage->VDIo.pInterfaceIo)
6584 {
6585 vdIfIoFallbackCallbacksSetup(&pImage->VDIo.VDIfIo);
6586 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6587 pDisk, sizeof(VDINTERFACEIO), &pVDIfsImage);
6588 pImage->VDIo.pInterfaceIo = &pImage->VDIo.VDIfIo;
6589 }
6590
6591 /* Set up the internal I/O interface. */
6592 AssertBreakStmt(!VDIfIoIntGet(pVDIfsImage), rc = VERR_INVALID_PARAMETER);
6593 vdIfIoIntCallbacksSetup(&pImage->VDIo.VDIfIoInt);
6594 rc = VDInterfaceAdd(&pImage->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6595 &pImage->VDIo, sizeof(VDINTERFACEIOINT), &pImage->pVDIfsImage);
6596 AssertRC(rc);
6597
6598 /* Create UUID if the caller didn't specify one. */
6599 if (!pUuid)
6600 {
6601 rc = RTUuidCreate(&uuid);
6602 if (RT_FAILURE(rc))
6603 {
6604 rc = vdError(pDisk, rc, RT_SRC_POS,
6605 N_("VD: cannot generate UUID for image '%s'"),
6606 pszFilename);
6607 break;
6608 }
6609 pUuid = &uuid;
6610 }
6611
6612 pImage->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6613 pImage->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6614 uImageFlags |= VD_IMAGE_FLAGS_DIFF;
6615 rc = pImage->Backend->pfnCreate(pImage->pszFilename, pDisk->cbSize,
6616 uImageFlags | VD_IMAGE_FLAGS_DIFF,
6617 pszComment, &pDisk->PCHSGeometry,
6618 &pDisk->LCHSGeometry, pUuid,
6619 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6620 0, 99,
6621 pDisk->pVDIfsDisk,
6622 pImage->pVDIfsImage,
6623 pVDIfsOperation,
6624 pDisk->enmType,
6625 &pImage->pBackendData);
6626
6627 if (RT_SUCCESS(rc))
6628 {
6629 pImage->VDIo.pBackendData = pImage->pBackendData;
6630 pImage->uImageFlags = uImageFlags;
6631
6632 /* Lock disk for writing, as we modify pDisk information below. */
6633 rc2 = vdThreadStartWrite(pDisk);
6634 AssertRC(rc2);
6635 fLockWrite = true;
6636
6637 /* Switch previous image to read-only mode. */
6638 unsigned uOpenFlagsPrevImg;
6639 uOpenFlagsPrevImg = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
6640 if (!(uOpenFlagsPrevImg & VD_OPEN_FLAGS_READONLY))
6641 {
6642 uOpenFlagsPrevImg |= VD_OPEN_FLAGS_READONLY;
6643 rc = pDisk->pLast->Backend->pfnSetOpenFlags(pDisk->pLast->pBackendData, uOpenFlagsPrevImg);
6644 }
6645
6646 /** @todo optionally check UUIDs */
6647
6648 /* Re-check state, as the lock wasn't held and another image
6649 * creation call could have been done by another thread. */
6650 AssertMsgStmt(pDisk->cImages != 0,
6651 ("Create diff image cannot be done without other images open\n"),
6652 rc = VERR_VD_INVALID_STATE);
6653 }
6654
6655 if (RT_SUCCESS(rc))
6656 {
6657 RTUUID Uuid;
6658 RTTIMESPEC ts;
6659
6660 if (pParentUuid && !RTUuidIsNull(pParentUuid))
6661 {
6662 Uuid = *pParentUuid;
6663 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6664 }
6665 else
6666 {
6667 rc2 = pDisk->pLast->Backend->pfnGetUuid(pDisk->pLast->pBackendData,
6668 &Uuid);
6669 if (RT_SUCCESS(rc2))
6670 pImage->Backend->pfnSetParentUuid(pImage->pBackendData, &Uuid);
6671 }
6672 rc2 = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6673 &Uuid);
6674 if (RT_SUCCESS(rc2))
6675 pImage->Backend->pfnSetParentModificationUuid(pImage->pBackendData,
6676 &Uuid);
6677 if (pDisk->pLast->Backend->pfnGetTimestamp)
6678 rc2 = pDisk->pLast->Backend->pfnGetTimestamp(pDisk->pLast->pBackendData,
6679 &ts);
6680 else
6681 rc2 = VERR_NOT_IMPLEMENTED;
6682 if (RT_SUCCESS(rc2) && pImage->Backend->pfnSetParentTimestamp)
6683 pImage->Backend->pfnSetParentTimestamp(pImage->pBackendData, &ts);
6684
6685 if (pImage->Backend->pfnSetParentFilename)
6686 rc2 = pImage->Backend->pfnSetParentFilename(pImage->pBackendData, pDisk->pLast->pszFilename);
6687 }
6688
6689 if (RT_SUCCESS(rc))
6690 {
6691 /* Image successfully opened, make it the last image. */
6692 vdAddImageToList(pDisk, pImage);
6693 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
6694 pDisk->uModified = VD_IMAGE_MODIFIED_FIRST;
6695 }
6696 else
6697 {
6698 /* Error detected, but image opened. Close and delete image. */
6699 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, true);
6700 AssertRC(rc2);
6701 pImage->pBackendData = NULL;
6702 }
6703 } while (0);
6704
6705 if (RT_UNLIKELY(fLockWrite))
6706 {
6707 rc2 = vdThreadFinishWrite(pDisk);
6708 AssertRC(rc2);
6709 }
6710 else if (RT_UNLIKELY(fLockRead))
6711 {
6712 rc2 = vdThreadFinishRead(pDisk);
6713 AssertRC(rc2);
6714 }
6715
6716 if (RT_FAILURE(rc))
6717 {
6718 if (pImage)
6719 {
6720 if (pImage->pszFilename)
6721 RTStrFree(pImage->pszFilename);
6722 RTMemFree(pImage);
6723 }
6724 }
6725
6726 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6727 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6728
6729 LogFlowFunc(("returns %Rrc\n", rc));
6730 return rc;
6731}
6732
6733
6734/**
6735 * Creates and opens new cache image file in HDD container.
6736 *
6737 * @return VBox status code.
6738 * @param pDisk Name of the cache file backend to use (case insensitive).
6739 * @param pszFilename Name of the differencing cache file to create.
6740 * @param cbSize Maximum size of the cache.
6741 * @param uImageFlags Flags specifying special cache features.
6742 * @param pszComment Pointer to image comment. NULL is ok.
6743 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
6744 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
6745 * @param pVDIfsCache Pointer to the per-cache VD interface list.
6746 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6747 */
6748VBOXDDU_DECL(int) VDCreateCache(PVDISK pDisk, const char *pszBackend,
6749 const char *pszFilename, uint64_t cbSize,
6750 unsigned uImageFlags, const char *pszComment,
6751 PCRTUUID pUuid, unsigned uOpenFlags,
6752 PVDINTERFACE pVDIfsCache, PVDINTERFACE pVDIfsOperation)
6753{
6754 int rc = VINF_SUCCESS;
6755 int rc2;
6756 bool fLockWrite = false, fLockRead = false;
6757 PVDCACHE pCache = NULL;
6758 RTUUID uuid;
6759
6760 LogFlowFunc(("pDisk=%#p pszBackend=\"%s\" pszFilename=\"%s\" cbSize=%llu uImageFlags=%#x pszComment=\"%s\" Uuid=%RTuuid uOpenFlags=%#x pVDIfsImage=%#p pVDIfsOperation=%#p\n",
6761 pDisk, pszBackend, pszFilename, cbSize, uImageFlags, pszComment, pUuid, uOpenFlags, pVDIfsCache, pVDIfsOperation));
6762
6763 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6764
6765 do
6766 {
6767 /* sanity check */
6768 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6769 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6770
6771 /* Check arguments. */
6772 AssertMsgBreakStmt(VALID_PTR(pszBackend) && *pszBackend,
6773 ("pszBackend=%#p \"%s\"\n", pszBackend, pszBackend),
6774 rc = VERR_INVALID_PARAMETER);
6775 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
6776 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
6777 rc = VERR_INVALID_PARAMETER);
6778 AssertMsgBreakStmt(cbSize,
6779 ("cbSize=%llu\n", cbSize),
6780 rc = VERR_INVALID_PARAMETER);
6781 AssertMsgBreakStmt((uImageFlags & ~VD_IMAGE_FLAGS_MASK) == 0,
6782 ("uImageFlags=%#x\n", uImageFlags),
6783 rc = VERR_INVALID_PARAMETER);
6784 /* The UUID may be NULL. */
6785 AssertMsgBreakStmt(pUuid == NULL || VALID_PTR(pUuid),
6786 ("pUuid=%#p UUID=%RTuuid\n", pUuid, pUuid),
6787 rc = VERR_INVALID_PARAMETER);
6788 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
6789 ("uOpenFlags=%#x\n", uOpenFlags),
6790 rc = VERR_INVALID_PARAMETER);
6791
6792 /* Check state. Needs a temporary read lock. Holding the write lock
6793 * all the time would be blocking other activities for too long. */
6794 rc2 = vdThreadStartRead(pDisk);
6795 AssertRC(rc2);
6796 fLockRead = true;
6797 AssertMsgBreakStmt(!pDisk->pCache,
6798 ("Create cache image cannot be done with a cache already attached\n"),
6799 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6800 rc2 = vdThreadFinishRead(pDisk);
6801 AssertRC(rc2);
6802 fLockRead = false;
6803
6804 /* Set up image descriptor. */
6805 pCache = (PVDCACHE)RTMemAllocZ(sizeof(VDCACHE));
6806 if (!pCache)
6807 {
6808 rc = VERR_NO_MEMORY;
6809 break;
6810 }
6811 pCache->pszFilename = RTStrDup(pszFilename);
6812 if (!pCache->pszFilename)
6813 {
6814 rc = VERR_NO_MEMORY;
6815 break;
6816 }
6817
6818 rc = vdFindCacheBackend(pszBackend, &pCache->Backend);
6819 if (RT_FAILURE(rc))
6820 break;
6821 if (!pCache->Backend)
6822 {
6823 rc = vdError(pDisk, VERR_INVALID_PARAMETER, RT_SRC_POS,
6824 N_("VD: unknown backend name '%s'"), pszBackend);
6825 break;
6826 }
6827
6828 pCache->VDIo.pDisk = pDisk;
6829 pCache->pVDIfsCache = pVDIfsCache;
6830
6831 /* Set up the I/O interface. */
6832 pCache->VDIo.pInterfaceIo = VDIfIoGet(pVDIfsCache);
6833 if (!pCache->VDIo.pInterfaceIo)
6834 {
6835 vdIfIoFallbackCallbacksSetup(&pCache->VDIo.VDIfIo);
6836 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIo.Core, "VD_IO", VDINTERFACETYPE_IO,
6837 pDisk, sizeof(VDINTERFACEIO), &pVDIfsCache);
6838 pCache->VDIo.pInterfaceIo = &pCache->VDIo.VDIfIo;
6839 }
6840
6841 /* Set up the internal I/O interface. */
6842 AssertBreakStmt(!VDIfIoIntGet(pVDIfsCache), rc = VERR_INVALID_PARAMETER);
6843 vdIfIoIntCallbacksSetup(&pCache->VDIo.VDIfIoInt);
6844 rc = VDInterfaceAdd(&pCache->VDIo.VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
6845 &pCache->VDIo, sizeof(VDINTERFACEIOINT), &pCache->pVDIfsCache);
6846 AssertRC(rc);
6847
6848 /* Create UUID if the caller didn't specify one. */
6849 if (!pUuid)
6850 {
6851 rc = RTUuidCreate(&uuid);
6852 if (RT_FAILURE(rc))
6853 {
6854 rc = vdError(pDisk, rc, RT_SRC_POS,
6855 N_("VD: cannot generate UUID for image '%s'"),
6856 pszFilename);
6857 break;
6858 }
6859 pUuid = &uuid;
6860 }
6861
6862 pCache->uOpenFlags = uOpenFlags & VD_OPEN_FLAGS_HONOR_SAME;
6863 pCache->VDIo.fIgnoreFlush = (uOpenFlags & VD_OPEN_FLAGS_IGNORE_FLUSH) != 0;
6864 rc = pCache->Backend->pfnCreate(pCache->pszFilename, cbSize,
6865 uImageFlags,
6866 pszComment, pUuid,
6867 uOpenFlags & ~VD_OPEN_FLAGS_HONOR_SAME,
6868 0, 99,
6869 pDisk->pVDIfsDisk,
6870 pCache->pVDIfsCache,
6871 pVDIfsOperation,
6872 &pCache->pBackendData);
6873
6874 if (RT_SUCCESS(rc))
6875 {
6876 /* Lock disk for writing, as we modify pDisk information below. */
6877 rc2 = vdThreadStartWrite(pDisk);
6878 AssertRC(rc2);
6879 fLockWrite = true;
6880
6881 pCache->VDIo.pBackendData = pCache->pBackendData;
6882
6883 /* Re-check state, as the lock wasn't held and another image
6884 * creation call could have been done by another thread. */
6885 AssertMsgStmt(!pDisk->pCache,
6886 ("Create cache image cannot be done with another cache open\n"),
6887 rc = VERR_VD_CACHE_ALREADY_EXISTS);
6888 }
6889
6890 if ( RT_SUCCESS(rc)
6891 && pDisk->pLast)
6892 {
6893 RTUUID UuidModification;
6894
6895 /* Set same modification Uuid as the last image. */
6896 rc = pDisk->pLast->Backend->pfnGetModificationUuid(pDisk->pLast->pBackendData,
6897 &UuidModification);
6898 if (RT_SUCCESS(rc))
6899 {
6900 rc = pCache->Backend->pfnSetModificationUuid(pCache->pBackendData,
6901 &UuidModification);
6902 }
6903
6904 if (rc == VERR_NOT_SUPPORTED)
6905 rc = VINF_SUCCESS;
6906 }
6907
6908 if (RT_SUCCESS(rc))
6909 {
6910 /* Cache successfully created. */
6911 pDisk->pCache = pCache;
6912 }
6913 else
6914 {
6915 /* Error detected, but image opened. Close and delete image. */
6916 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, true);
6917 AssertRC(rc2);
6918 pCache->pBackendData = NULL;
6919 }
6920 } while (0);
6921
6922 if (RT_UNLIKELY(fLockWrite))
6923 {
6924 rc2 = vdThreadFinishWrite(pDisk);
6925 AssertRC(rc2);
6926 }
6927 else if (RT_UNLIKELY(fLockRead))
6928 {
6929 rc2 = vdThreadFinishRead(pDisk);
6930 AssertRC(rc2);
6931 }
6932
6933 if (RT_FAILURE(rc))
6934 {
6935 if (pCache)
6936 {
6937 if (pCache->pszFilename)
6938 RTStrFree(pCache->pszFilename);
6939 RTMemFree(pCache);
6940 }
6941 }
6942
6943 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
6944 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
6945
6946 LogFlowFunc(("returns %Rrc\n", rc));
6947 return rc;
6948}
6949
6950/**
6951 * Merges two images (not necessarily with direct parent/child relationship).
6952 * As a side effect the source image and potentially the other images which
6953 * are also merged to the destination are deleted from both the disk and the
6954 * images in the HDD container.
6955 *
6956 * @returns VBox status code.
6957 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
6958 * @param pDisk Pointer to HDD container.
6959 * @param nImageFrom Name of the image file to merge from.
6960 * @param nImageTo Name of the image file to merge to.
6961 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
6962 */
6963VBOXDDU_DECL(int) VDMerge(PVDISK pDisk, unsigned nImageFrom,
6964 unsigned nImageTo, PVDINTERFACE pVDIfsOperation)
6965{
6966 int rc = VINF_SUCCESS;
6967 int rc2;
6968 bool fLockWrite = false, fLockRead = false;
6969 void *pvBuf = NULL;
6970
6971 LogFlowFunc(("pDisk=%#p nImageFrom=%u nImageTo=%u pVDIfsOperation=%#p\n",
6972 pDisk, nImageFrom, nImageTo, pVDIfsOperation));
6973
6974 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
6975
6976 do
6977 {
6978 /* sanity check */
6979 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
6980 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
6981
6982 /* For simplicity reasons lock for writing as the image reopen below
6983 * might need it. After all the reopen is usually needed. */
6984 rc2 = vdThreadStartWrite(pDisk);
6985 AssertRC(rc2);
6986 fLockWrite = true;
6987 PVDIMAGE pImageFrom = vdGetImageByNumber(pDisk, nImageFrom);
6988 PVDIMAGE pImageTo = vdGetImageByNumber(pDisk, nImageTo);
6989 if (!pImageFrom || !pImageTo)
6990 {
6991 rc = VERR_VD_IMAGE_NOT_FOUND;
6992 break;
6993 }
6994 AssertBreakStmt(pImageFrom != pImageTo, rc = VERR_INVALID_PARAMETER);
6995
6996 /* Make sure destination image is writable. */
6997 unsigned uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
6998 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
6999 {
7000 /*
7001 * Clear skip consistency checks because the image is made writable now and
7002 * skipping consistency checks is only possible for readonly images.
7003 */
7004 uOpenFlags &= ~(VD_OPEN_FLAGS_READONLY | VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS);
7005 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7006 uOpenFlags);
7007 if (RT_FAILURE(rc))
7008 break;
7009 }
7010
7011 /* Get size of destination image. */
7012 uint64_t cbSize = vdImageGetSize(pImageTo);
7013 rc2 = vdThreadFinishWrite(pDisk);
7014 AssertRC(rc2);
7015 fLockWrite = false;
7016
7017 /* Allocate tmp buffer. */
7018 pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
7019 if (!pvBuf)
7020 {
7021 rc = VERR_NO_MEMORY;
7022 break;
7023 }
7024
7025 /* Merging is done directly on the images itself. This potentially
7026 * causes trouble if the disk is full in the middle of operation. */
7027 if (nImageFrom < nImageTo)
7028 {
7029 /* Merge parent state into child. This means writing all not
7030 * allocated blocks in the destination image which are allocated in
7031 * the images to be merged. */
7032 uint64_t uOffset = 0;
7033 uint64_t cbRemaining = cbSize;
7034 do
7035 {
7036 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7037 RTSGSEG SegmentBuf;
7038 RTSGBUF SgBuf;
7039 VDIOCTX IoCtx;
7040
7041 SegmentBuf.pvSeg = pvBuf;
7042 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7043 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7044 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7045 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7046
7047 /* Need to hold the write lock during a read-write operation. */
7048 rc2 = vdThreadStartWrite(pDisk);
7049 AssertRC(rc2);
7050 fLockWrite = true;
7051
7052 rc = pImageTo->Backend->pfnRead(pImageTo->pBackendData,
7053 uOffset, cbThisRead,
7054 &IoCtx, &cbThisRead);
7055 if (rc == VERR_VD_BLOCK_FREE)
7056 {
7057 /* Search for image with allocated block. Do not attempt to
7058 * read more than the previous reads marked as valid.
7059 * Otherwise this would return stale data when different
7060 * block sizes are used for the images. */
7061 for (PVDIMAGE pCurrImage = pImageTo->pPrev;
7062 pCurrImage != NULL && pCurrImage != pImageFrom->pPrev && rc == VERR_VD_BLOCK_FREE;
7063 pCurrImage = pCurrImage->pPrev)
7064 {
7065 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7066 uOffset, cbThisRead,
7067 &IoCtx, &cbThisRead);
7068 }
7069
7070 if (rc != VERR_VD_BLOCK_FREE)
7071 {
7072 if (RT_FAILURE(rc))
7073 break;
7074 /* Updating the cache is required because this might be a live merge. */
7075 rc = vdWriteHelperEx(pDisk, pImageTo, pImageFrom->pPrev,
7076 uOffset, pvBuf, cbThisRead,
7077 VDIOCTX_FLAGS_READ_UPDATE_CACHE, 0);
7078 if (RT_FAILURE(rc))
7079 break;
7080 }
7081 else
7082 rc = VINF_SUCCESS;
7083 }
7084 else if (RT_FAILURE(rc))
7085 break;
7086
7087 rc2 = vdThreadFinishWrite(pDisk);
7088 AssertRC(rc2);
7089 fLockWrite = false;
7090
7091 uOffset += cbThisRead;
7092 cbRemaining -= cbThisRead;
7093
7094 if (pIfProgress && pIfProgress->pfnProgress)
7095 {
7096 /** @todo r=klaus: this can update the progress to the same
7097 * percentage over and over again if the image format makes
7098 * relatively small increments. */
7099 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7100 uOffset * 99 / cbSize);
7101 if (RT_FAILURE(rc))
7102 break;
7103 }
7104 } while (uOffset < cbSize);
7105 }
7106 else
7107 {
7108 /*
7109 * We may need to update the parent uuid of the child coming after
7110 * the last image to be merged. We have to reopen it read/write.
7111 *
7112 * This is done before we do the actual merge to prevent an
7113 * inconsistent chain if the mode change fails for some reason.
7114 */
7115 if (pImageFrom->pNext)
7116 {
7117 PVDIMAGE pImageChild = pImageFrom->pNext;
7118
7119 /* Take the write lock. */
7120 rc2 = vdThreadStartWrite(pDisk);
7121 AssertRC(rc2);
7122 fLockWrite = true;
7123
7124 /* We need to open the image in read/write mode. */
7125 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7126
7127 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
7128 {
7129 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
7130 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7131 uOpenFlags);
7132 if (RT_FAILURE(rc))
7133 break;
7134 }
7135
7136 rc2 = vdThreadFinishWrite(pDisk);
7137 AssertRC(rc2);
7138 fLockWrite = false;
7139 }
7140
7141 /* If the merge is from the last image we have to relay all writes
7142 * to the merge destination as well, so that concurrent writes
7143 * (in case of a live merge) are handled correctly. */
7144 if (!pImageFrom->pNext)
7145 {
7146 /* Take the write lock. */
7147 rc2 = vdThreadStartWrite(pDisk);
7148 AssertRC(rc2);
7149 fLockWrite = true;
7150
7151 pDisk->pImageRelay = pImageTo;
7152
7153 rc2 = vdThreadFinishWrite(pDisk);
7154 AssertRC(rc2);
7155 fLockWrite = false;
7156 }
7157
7158 /* Merge child state into parent. This means writing all blocks
7159 * which are allocated in the image up to the source image to the
7160 * destination image. */
7161 uint64_t uOffset = 0;
7162 uint64_t cbRemaining = cbSize;
7163 do
7164 {
7165 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
7166 RTSGSEG SegmentBuf;
7167 RTSGBUF SgBuf;
7168 VDIOCTX IoCtx;
7169
7170 rc = VERR_VD_BLOCK_FREE;
7171
7172 SegmentBuf.pvSeg = pvBuf;
7173 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
7174 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
7175 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
7176 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
7177
7178 /* Need to hold the write lock during a read-write operation. */
7179 rc2 = vdThreadStartWrite(pDisk);
7180 AssertRC(rc2);
7181 fLockWrite = true;
7182
7183 /* Search for image with allocated block. Do not attempt to
7184 * read more than the previous reads marked as valid. Otherwise
7185 * this would return stale data when different block sizes are
7186 * used for the images. */
7187 for (PVDIMAGE pCurrImage = pImageFrom;
7188 pCurrImage != NULL && pCurrImage != pImageTo && rc == VERR_VD_BLOCK_FREE;
7189 pCurrImage = pCurrImage->pPrev)
7190 {
7191 rc = pCurrImage->Backend->pfnRead(pCurrImage->pBackendData,
7192 uOffset, cbThisRead,
7193 &IoCtx, &cbThisRead);
7194 }
7195
7196 if (rc != VERR_VD_BLOCK_FREE)
7197 {
7198 if (RT_FAILURE(rc))
7199 break;
7200 rc = vdWriteHelper(pDisk, pImageTo, uOffset, pvBuf,
7201 cbThisRead, VDIOCTX_FLAGS_READ_UPDATE_CACHE);
7202 if (RT_FAILURE(rc))
7203 break;
7204 }
7205 else
7206 rc = VINF_SUCCESS;
7207
7208 rc2 = vdThreadFinishWrite(pDisk);
7209 AssertRC(rc2);
7210 fLockWrite = false;
7211
7212 uOffset += cbThisRead;
7213 cbRemaining -= cbThisRead;
7214
7215 if (pIfProgress && pIfProgress->pfnProgress)
7216 {
7217 /** @todo r=klaus: this can update the progress to the same
7218 * percentage over and over again if the image format makes
7219 * relatively small increments. */
7220 rc = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
7221 uOffset * 99 / cbSize);
7222 if (RT_FAILURE(rc))
7223 break;
7224 }
7225 } while (uOffset < cbSize);
7226
7227 /* In case we set up a "write proxy" image above we must clear
7228 * this again now to prevent stray writes. Failure or not. */
7229 if (!pImageFrom->pNext)
7230 {
7231 /* Take the write lock. */
7232 rc2 = vdThreadStartWrite(pDisk);
7233 AssertRC(rc2);
7234 fLockWrite = true;
7235
7236 pDisk->pImageRelay = NULL;
7237
7238 rc2 = vdThreadFinishWrite(pDisk);
7239 AssertRC(rc2);
7240 fLockWrite = false;
7241 }
7242 }
7243
7244 /*
7245 * Leave in case of an error to avoid corrupted data in the image chain
7246 * (includes cancelling the operation by the user).
7247 */
7248 if (RT_FAILURE(rc))
7249 break;
7250
7251 /* Need to hold the write lock while finishing the merge. */
7252 rc2 = vdThreadStartWrite(pDisk);
7253 AssertRC(rc2);
7254 fLockWrite = true;
7255
7256 /* Update parent UUID so that image chain is consistent.
7257 * The two attempts work around the problem that some backends
7258 * (e.g. iSCSI) do not support UUIDs, so we exploit the fact that
7259 * so far there can only be one such image in the chain. */
7260 /** @todo needs a better long-term solution, passing the UUID
7261 * knowledge from the caller or some such */
7262 RTUUID Uuid;
7263 PVDIMAGE pImageChild = NULL;
7264 if (nImageFrom < nImageTo)
7265 {
7266 if (pImageFrom->pPrev)
7267 {
7268 /* plan A: ask the parent itself for its UUID */
7269 rc = pImageFrom->pPrev->Backend->pfnGetUuid(pImageFrom->pPrev->pBackendData,
7270 &Uuid);
7271 if (RT_FAILURE(rc))
7272 {
7273 /* plan B: ask the child of the parent for parent UUID */
7274 rc = pImageFrom->Backend->pfnGetParentUuid(pImageFrom->pBackendData,
7275 &Uuid);
7276 }
7277 AssertRC(rc);
7278 }
7279 else
7280 RTUuidClear(&Uuid);
7281 rc = pImageTo->Backend->pfnSetParentUuid(pImageTo->pBackendData,
7282 &Uuid);
7283 AssertRC(rc);
7284 }
7285 else
7286 {
7287 /* Update the parent uuid of the child of the last merged image. */
7288 if (pImageFrom->pNext)
7289 {
7290 /* plan A: ask the parent itself for its UUID */
7291 rc = pImageTo->Backend->pfnGetUuid(pImageTo->pBackendData,
7292 &Uuid);
7293 if (RT_FAILURE(rc))
7294 {
7295 /* plan B: ask the child of the parent for parent UUID */
7296 rc = pImageTo->pNext->Backend->pfnGetParentUuid(pImageTo->pNext->pBackendData,
7297 &Uuid);
7298 }
7299 AssertRC(rc);
7300
7301 rc = pImageFrom->Backend->pfnSetParentUuid(pImageFrom->pNext->pBackendData,
7302 &Uuid);
7303 AssertRC(rc);
7304
7305 pImageChild = pImageFrom->pNext;
7306 }
7307 }
7308
7309 /* Delete the no longer needed images. */
7310 PVDIMAGE pImg = pImageFrom, pTmp;
7311 while (pImg != pImageTo)
7312 {
7313 if (nImageFrom < nImageTo)
7314 pTmp = pImg->pNext;
7315 else
7316 pTmp = pImg->pPrev;
7317 vdRemoveImageFromList(pDisk, pImg);
7318 pImg->Backend->pfnClose(pImg->pBackendData, true);
7319 RTMemFree(pImg->pszFilename);
7320 RTMemFree(pImg);
7321 pImg = pTmp;
7322 }
7323
7324 /* Make sure destination image is back to read only if necessary. */
7325 if (pImageTo != pDisk->pLast)
7326 {
7327 uOpenFlags = pImageTo->Backend->pfnGetOpenFlags(pImageTo->pBackendData);
7328 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7329 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7330 uOpenFlags);
7331 if (RT_FAILURE(rc))
7332 break;
7333 }
7334
7335 /*
7336 * Make sure the child is readonly
7337 * for the child -> parent merge direction
7338 * if necessary.
7339 */
7340 if ( nImageFrom > nImageTo
7341 && pImageChild
7342 && pImageChild != pDisk->pLast)
7343 {
7344 uOpenFlags = pImageChild->Backend->pfnGetOpenFlags(pImageChild->pBackendData);
7345 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
7346 rc = pImageChild->Backend->pfnSetOpenFlags(pImageChild->pBackendData,
7347 uOpenFlags);
7348 if (RT_FAILURE(rc))
7349 break;
7350 }
7351 } while (0);
7352
7353 if (RT_UNLIKELY(fLockWrite))
7354 {
7355 rc2 = vdThreadFinishWrite(pDisk);
7356 AssertRC(rc2);
7357 }
7358 else if (RT_UNLIKELY(fLockRead))
7359 {
7360 rc2 = vdThreadFinishRead(pDisk);
7361 AssertRC(rc2);
7362 }
7363
7364 if (pvBuf)
7365 RTMemTmpFree(pvBuf);
7366
7367 if (RT_SUCCESS(rc) && pIfProgress && pIfProgress->pfnProgress)
7368 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7369
7370 LogFlowFunc(("returns %Rrc\n", rc));
7371 return rc;
7372}
7373
7374/**
7375 * Copies an image from one HDD container to another - extended version.
7376 * The copy is opened in the target HDD container.
7377 * It is possible to convert between different image formats, because the
7378 * backend for the destination may be different from the source.
7379 * If both the source and destination reference the same HDD container,
7380 * then the image is moved (by copying/deleting or renaming) to the new location.
7381 * The source container is unchanged if the move operation fails, otherwise
7382 * the image at the new location is opened in the same way as the old one was.
7383 *
7384 * @note The read/write accesses across disks are not synchronized, just the
7385 * accesses to each disk. Once there is a use case which requires a defined
7386 * read/write behavior in this situation this needs to be extended.
7387 *
7388 * @returns VBox status code.
7389 * @retval VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7390 * @param pDiskFrom Pointer to source HDD container.
7391 * @param nImage Image number, counts from 0. 0 is always base image of container.
7392 * @param pDiskTo Pointer to destination HDD container.
7393 * @param pszBackend Name of the image file backend to use (may be NULL to use the same as the source, case insensitive).
7394 * @param pszFilename New name of the image (may be NULL to specify that the
7395 * copy destination is the destination container, or
7396 * if pDiskFrom == pDiskTo, i.e. when moving).
7397 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7398 * @param cbSize New image size (0 means leave unchanged).
7399 * @param nImageFromSame todo
7400 * @param nImageToSame todo
7401 * @param uImageFlags Flags specifying special destination image features.
7402 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7403 * This parameter is used if and only if a true copy is created.
7404 * In all rename/move cases or copy to existing image cases the modification UUIDs are copied over.
7405 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7406 * Only used if the destination image is created.
7407 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7408 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7409 * destination image.
7410 * @param pDstVDIfsOperation Pointer to the per-operation VD interface list,
7411 * for the destination operation.
7412 */
7413VBOXDDU_DECL(int) VDCopyEx(PVDISK pDiskFrom, unsigned nImage, PVDISK pDiskTo,
7414 const char *pszBackend, const char *pszFilename,
7415 bool fMoveByRename, uint64_t cbSize,
7416 unsigned nImageFromSame, unsigned nImageToSame,
7417 unsigned uImageFlags, PCRTUUID pDstUuid,
7418 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7419 PVDINTERFACE pDstVDIfsImage,
7420 PVDINTERFACE pDstVDIfsOperation)
7421{
7422 int rc = VINF_SUCCESS;
7423 int rc2;
7424 bool fLockReadFrom = false, fLockWriteFrom = false, fLockWriteTo = false;
7425 PVDIMAGE pImageTo = NULL;
7426
7427 LogFlowFunc(("pDiskFrom=%#p nImage=%u pDiskTo=%#p pszBackend=\"%s\" pszFilename=\"%s\" fMoveByRename=%d cbSize=%llu nImageFromSame=%u nImageToSame=%u uImageFlags=%#x pDstUuid=%#p uOpenFlags=%#x pVDIfsOperation=%#p pDstVDIfsImage=%#p pDstVDIfsOperation=%#p\n",
7428 pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename, cbSize, nImageFromSame, nImageToSame, uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation, pDstVDIfsImage, pDstVDIfsOperation));
7429
7430 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7431 PVDINTERFACEPROGRESS pDstIfProgress = VDIfProgressGet(pDstVDIfsOperation);
7432
7433 do {
7434 /* Check arguments. */
7435 AssertMsgBreakStmt(VALID_PTR(pDiskFrom), ("pDiskFrom=%#p\n", pDiskFrom),
7436 rc = VERR_INVALID_PARAMETER);
7437 AssertMsg(pDiskFrom->u32Signature == VDISK_SIGNATURE,
7438 ("u32Signature=%08x\n", pDiskFrom->u32Signature));
7439
7440 rc2 = vdThreadStartRead(pDiskFrom);
7441 AssertRC(rc2);
7442 fLockReadFrom = true;
7443 PVDIMAGE pImageFrom = vdGetImageByNumber(pDiskFrom, nImage);
7444 AssertPtrBreakStmt(pImageFrom, rc = VERR_VD_IMAGE_NOT_FOUND);
7445 AssertMsgBreakStmt(VALID_PTR(pDiskTo), ("pDiskTo=%#p\n", pDiskTo),
7446 rc = VERR_INVALID_PARAMETER);
7447 AssertMsg(pDiskTo->u32Signature == VDISK_SIGNATURE,
7448 ("u32Signature=%08x\n", pDiskTo->u32Signature));
7449 AssertMsgBreakStmt( (nImageFromSame < nImage || nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7450 && (nImageToSame < pDiskTo->cImages || nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7451 && ( (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN && nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7452 || (nImageFromSame != VD_IMAGE_CONTENT_UNKNOWN && nImageToSame != VD_IMAGE_CONTENT_UNKNOWN)),
7453 ("nImageFromSame=%u nImageToSame=%u\n", nImageFromSame, nImageToSame),
7454 rc = VERR_INVALID_PARAMETER);
7455
7456 /* Move the image. */
7457 if (pDiskFrom == pDiskTo)
7458 {
7459 /* Rename only works when backends are the same, are file based
7460 * and the rename method is implemented. */
7461 if ( fMoveByRename
7462 && !RTStrICmp(pszBackend, pImageFrom->Backend->pszBackendName)
7463 && pImageFrom->Backend->uBackendCaps & VD_CAP_FILE
7464 && pImageFrom->Backend->pfnRename)
7465 {
7466 rc2 = vdThreadFinishRead(pDiskFrom);
7467 AssertRC(rc2);
7468 fLockReadFrom = false;
7469
7470 rc2 = vdThreadStartWrite(pDiskFrom);
7471 AssertRC(rc2);
7472 fLockWriteFrom = true;
7473 rc = pImageFrom->Backend->pfnRename(pImageFrom->pBackendData, pszFilename ? pszFilename : pImageFrom->pszFilename);
7474 break;
7475 }
7476
7477 /** @todo Moving (including shrinking/growing) of the image is
7478 * requested, but the rename attempt failed or it wasn't possible.
7479 * Must now copy image to temp location. */
7480 AssertReleaseMsgFailed(("VDCopy: moving by copy/delete not implemented\n"));
7481 }
7482
7483 /* pszFilename is allowed to be NULL, as this indicates copy to the existing image. */
7484 AssertMsgBreakStmt(pszFilename == NULL || (VALID_PTR(pszFilename) && *pszFilename),
7485 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
7486 rc = VERR_INVALID_PARAMETER);
7487
7488 uint64_t cbSizeFrom;
7489 cbSizeFrom = vdImageGetSize(pImageFrom);
7490 if (cbSizeFrom == 0)
7491 {
7492 rc = VERR_VD_VALUE_NOT_FOUND;
7493 break;
7494 }
7495
7496 VDGEOMETRY PCHSGeometryFrom = {0, 0, 0};
7497 VDGEOMETRY LCHSGeometryFrom = {0, 0, 0};
7498 pImageFrom->Backend->pfnGetPCHSGeometry(pImageFrom->pBackendData, &PCHSGeometryFrom);
7499 pImageFrom->Backend->pfnGetLCHSGeometry(pImageFrom->pBackendData, &LCHSGeometryFrom);
7500
7501 RTUUID ImageUuid, ImageModificationUuid;
7502 if (pDiskFrom != pDiskTo)
7503 {
7504 if (pDstUuid)
7505 ImageUuid = *pDstUuid;
7506 else
7507 RTUuidCreate(&ImageUuid);
7508 }
7509 else
7510 {
7511 rc = pImageFrom->Backend->pfnGetUuid(pImageFrom->pBackendData, &ImageUuid);
7512 if (RT_FAILURE(rc))
7513 RTUuidCreate(&ImageUuid);
7514 }
7515 rc = pImageFrom->Backend->pfnGetModificationUuid(pImageFrom->pBackendData, &ImageModificationUuid);
7516 if (RT_FAILURE(rc))
7517 RTUuidClear(&ImageModificationUuid);
7518
7519 char szComment[1024];
7520 rc = pImageFrom->Backend->pfnGetComment(pImageFrom->pBackendData, szComment, sizeof(szComment));
7521 if (RT_FAILURE(rc))
7522 szComment[0] = '\0';
7523 else
7524 szComment[sizeof(szComment) - 1] = '\0';
7525
7526 rc2 = vdThreadFinishRead(pDiskFrom);
7527 AssertRC(rc2);
7528 fLockReadFrom = false;
7529
7530 rc2 = vdThreadStartRead(pDiskTo);
7531 AssertRC(rc2);
7532 unsigned cImagesTo = pDiskTo->cImages;
7533 rc2 = vdThreadFinishRead(pDiskTo);
7534 AssertRC(rc2);
7535
7536 if (pszFilename)
7537 {
7538 if (cbSize == 0)
7539 cbSize = cbSizeFrom;
7540
7541 /* Create destination image with the properties of source image. */
7542 /** @todo replace the VDCreateDiff/VDCreateBase calls by direct
7543 * calls to the backend. Unifies the code and reduces the API
7544 * dependencies. Would also make the synchronization explicit. */
7545 if (cImagesTo > 0)
7546 {
7547 rc = VDCreateDiff(pDiskTo, pszBackend, pszFilename,
7548 uImageFlags, szComment, &ImageUuid,
7549 NULL /* pParentUuid */,
7550 uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7551 pDstVDIfsImage, NULL);
7552
7553 rc2 = vdThreadStartWrite(pDiskTo);
7554 AssertRC(rc2);
7555 fLockWriteTo = true;
7556 } else {
7557 /** @todo hack to force creation of a fixed image for
7558 * the RAW backend, which can't handle anything else. */
7559 if (!RTStrICmp(pszBackend, "RAW"))
7560 uImageFlags |= VD_IMAGE_FLAGS_FIXED;
7561
7562 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7563 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7564
7565 rc = VDCreateBase(pDiskTo, pszBackend, pszFilename, cbSize,
7566 uImageFlags, szComment,
7567 &PCHSGeometryFrom, &LCHSGeometryFrom,
7568 NULL, uOpenFlags & ~VD_OPEN_FLAGS_READONLY,
7569 pDstVDIfsImage, NULL);
7570
7571 rc2 = vdThreadStartWrite(pDiskTo);
7572 AssertRC(rc2);
7573 fLockWriteTo = true;
7574
7575 if (RT_SUCCESS(rc) && !RTUuidIsNull(&ImageUuid))
7576 pDiskTo->pLast->Backend->pfnSetUuid(pDiskTo->pLast->pBackendData, &ImageUuid);
7577 }
7578 if (RT_FAILURE(rc))
7579 break;
7580
7581 pImageTo = pDiskTo->pLast;
7582 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7583
7584 cbSize = RT_MIN(cbSize, cbSizeFrom);
7585 }
7586 else
7587 {
7588 pImageTo = pDiskTo->pLast;
7589 AssertPtrBreakStmt(pImageTo, rc = VERR_VD_IMAGE_NOT_FOUND);
7590
7591 uint64_t cbSizeTo;
7592 cbSizeTo = vdImageGetSize(pImageTo);
7593 if (cbSizeTo == 0)
7594 {
7595 rc = VERR_VD_VALUE_NOT_FOUND;
7596 break;
7597 }
7598
7599 if (cbSize == 0)
7600 cbSize = RT_MIN(cbSizeFrom, cbSizeTo);
7601
7602 vdFixupPCHSGeometry(&PCHSGeometryFrom, cbSize);
7603 vdFixupLCHSGeometry(&LCHSGeometryFrom, cbSize);
7604
7605 /* Update the geometry in the destination image. */
7606 pImageTo->Backend->pfnSetPCHSGeometry(pImageTo->pBackendData, &PCHSGeometryFrom);
7607 pImageTo->Backend->pfnSetLCHSGeometry(pImageTo->pBackendData, &LCHSGeometryFrom);
7608 }
7609
7610 rc2 = vdThreadFinishWrite(pDiskTo);
7611 AssertRC(rc2);
7612 fLockWriteTo = false;
7613
7614 /* Whether we can take the optimized copy path (false) or not.
7615 * Don't optimize if the image existed or if it is a child image. */
7616 bool fSuppressRedundantIo = ( !(pszFilename == NULL || cImagesTo > 0)
7617 || (nImageToSame != VD_IMAGE_CONTENT_UNKNOWN));
7618 unsigned cImagesFromReadBack, cImagesToReadBack;
7619
7620 if (nImageFromSame == VD_IMAGE_CONTENT_UNKNOWN)
7621 cImagesFromReadBack = 0;
7622 else
7623 {
7624 if (nImage == VD_LAST_IMAGE)
7625 cImagesFromReadBack = pDiskFrom->cImages - nImageFromSame - 1;
7626 else
7627 cImagesFromReadBack = nImage - nImageFromSame;
7628 }
7629
7630 if (nImageToSame == VD_IMAGE_CONTENT_UNKNOWN)
7631 cImagesToReadBack = 0;
7632 else
7633 cImagesToReadBack = pDiskTo->cImages - nImageToSame - 1;
7634
7635 /* Copy the data. */
7636 rc = vdCopyHelper(pDiskFrom, pImageFrom, pDiskTo, cbSize,
7637 cImagesFromReadBack, cImagesToReadBack,
7638 fSuppressRedundantIo, pIfProgress, pDstIfProgress);
7639
7640 if (RT_SUCCESS(rc))
7641 {
7642 rc2 = vdThreadStartWrite(pDiskTo);
7643 AssertRC(rc2);
7644 fLockWriteTo = true;
7645
7646 /* Only set modification UUID if it is non-null, since the source
7647 * backend might not provide a valid modification UUID. */
7648 if (!RTUuidIsNull(&ImageModificationUuid))
7649 pImageTo->Backend->pfnSetModificationUuid(pImageTo->pBackendData, &ImageModificationUuid);
7650
7651 /* Set the requested open flags if they differ from the value
7652 * required for creating the image and copying the contents. */
7653 if ( pImageTo && pszFilename
7654 && uOpenFlags != (uOpenFlags & ~VD_OPEN_FLAGS_READONLY))
7655 rc = pImageTo->Backend->pfnSetOpenFlags(pImageTo->pBackendData,
7656 uOpenFlags);
7657 }
7658 } while (0);
7659
7660 if (RT_FAILURE(rc) && pImageTo && pszFilename)
7661 {
7662 /* Take the write lock only if it is not taken. Not worth making the
7663 * above code even more complicated. */
7664 if (RT_UNLIKELY(!fLockWriteTo))
7665 {
7666 rc2 = vdThreadStartWrite(pDiskTo);
7667 AssertRC(rc2);
7668 fLockWriteTo = true;
7669 }
7670 /* Error detected, but new image created. Remove image from list. */
7671 vdRemoveImageFromList(pDiskTo, pImageTo);
7672
7673 /* Close and delete image. */
7674 rc2 = pImageTo->Backend->pfnClose(pImageTo->pBackendData, true);
7675 AssertRC(rc2);
7676 pImageTo->pBackendData = NULL;
7677
7678 /* Free remaining resources. */
7679 if (pImageTo->pszFilename)
7680 RTStrFree(pImageTo->pszFilename);
7681
7682 RTMemFree(pImageTo);
7683 }
7684
7685 if (RT_UNLIKELY(fLockWriteTo))
7686 {
7687 rc2 = vdThreadFinishWrite(pDiskTo);
7688 AssertRC(rc2);
7689 }
7690 if (RT_UNLIKELY(fLockWriteFrom))
7691 {
7692 rc2 = vdThreadFinishWrite(pDiskFrom);
7693 AssertRC(rc2);
7694 }
7695 else if (RT_UNLIKELY(fLockReadFrom))
7696 {
7697 rc2 = vdThreadFinishRead(pDiskFrom);
7698 AssertRC(rc2);
7699 }
7700
7701 if (RT_SUCCESS(rc))
7702 {
7703 if (pIfProgress && pIfProgress->pfnProgress)
7704 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7705 if (pDstIfProgress && pDstIfProgress->pfnProgress)
7706 pDstIfProgress->pfnProgress(pDstIfProgress->Core.pvUser, 100);
7707 }
7708
7709 LogFlowFunc(("returns %Rrc\n", rc));
7710 return rc;
7711}
7712
7713/**
7714 * Copies an image from one HDD container to another.
7715 * The copy is opened in the target HDD container.
7716 * It is possible to convert between different image formats, because the
7717 * backend for the destination may be different from the source.
7718 * If both the source and destination reference the same HDD container,
7719 * then the image is moved (by copying/deleting or renaming) to the new location.
7720 * The source container is unchanged if the move operation fails, otherwise
7721 * the image at the new location is opened in the same way as the old one was.
7722 *
7723 * @returns VBox status code.
7724 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7725 * @param pDiskFrom Pointer to source HDD container.
7726 * @param nImage Image number, counts from 0. 0 is always base image of container.
7727 * @param pDiskTo Pointer to destination HDD container.
7728 * @param pszBackend Name of the image file backend to use.
7729 * @param pszFilename New name of the image (may be NULL if pDiskFrom == pDiskTo).
7730 * @param fMoveByRename If true, attempt to perform a move by renaming (if successful the new size is ignored).
7731 * @param cbSize New image size (0 means leave unchanged).
7732 * @param uImageFlags Flags specifying special destination image features.
7733 * @param pDstUuid New UUID of the destination image. If NULL, a new UUID is created.
7734 * This parameter is used if and only if a true copy is created.
7735 * In all rename/move cases the UUIDs are copied over.
7736 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
7737 * Only used if the destination image is created.
7738 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7739 * @param pDstVDIfsImage Pointer to the per-image VD interface list, for the
7740 * destination image.
7741 * @param pDstVDIfsOperation Pointer to the per-image VD interface list,
7742 * for the destination image.
7743 */
7744VBOXDDU_DECL(int) VDCopy(PVDISK pDiskFrom, unsigned nImage, PVDISK pDiskTo,
7745 const char *pszBackend, const char *pszFilename,
7746 bool fMoveByRename, uint64_t cbSize,
7747 unsigned uImageFlags, PCRTUUID pDstUuid,
7748 unsigned uOpenFlags, PVDINTERFACE pVDIfsOperation,
7749 PVDINTERFACE pDstVDIfsImage,
7750 PVDINTERFACE pDstVDIfsOperation)
7751{
7752 return VDCopyEx(pDiskFrom, nImage, pDiskTo, pszBackend, pszFilename, fMoveByRename,
7753 cbSize, VD_IMAGE_CONTENT_UNKNOWN, VD_IMAGE_CONTENT_UNKNOWN,
7754 uImageFlags, pDstUuid, uOpenFlags, pVDIfsOperation,
7755 pDstVDIfsImage, pDstVDIfsOperation);
7756}
7757
7758/**
7759 * Optimizes the storage consumption of an image. Typically the unused blocks
7760 * have to be wiped with zeroes to achieve a substantial reduced storage use.
7761 * Another optimization done is reordering the image blocks, which can provide
7762 * a significant performance boost, as reads and writes tend to use less random
7763 * file offsets.
7764 *
7765 * @return VBox status code.
7766 * @return VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
7767 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7768 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7769 * the code for this isn't implemented yet.
7770 * @param pDisk Pointer to HDD container.
7771 * @param nImage Image number, counts from 0. 0 is always base image of container.
7772 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7773 */
7774VBOXDDU_DECL(int) VDCompact(PVDISK pDisk, unsigned nImage,
7775 PVDINTERFACE pVDIfsOperation)
7776{
7777 int rc = VINF_SUCCESS;
7778 int rc2;
7779 bool fLockRead = false, fLockWrite = false;
7780 void *pvBuf = NULL;
7781 void *pvTmp = NULL;
7782
7783 LogFlowFunc(("pDisk=%#p nImage=%u pVDIfsOperation=%#p\n",
7784 pDisk, nImage, pVDIfsOperation));
7785
7786 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7787
7788 do {
7789 /* Check arguments. */
7790 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7791 rc = VERR_INVALID_PARAMETER);
7792 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE,
7793 ("u32Signature=%08x\n", pDisk->u32Signature));
7794
7795 rc2 = vdThreadStartRead(pDisk);
7796 AssertRC(rc2);
7797 fLockRead = true;
7798
7799 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
7800 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
7801
7802 /* If there is no compact callback for not file based backends then
7803 * the backend doesn't need compaction. No need to make much fuss about
7804 * this. For file based ones signal this as not yet supported. */
7805 if (!pImage->Backend->pfnCompact)
7806 {
7807 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7808 rc = VERR_NOT_SUPPORTED;
7809 else
7810 rc = VINF_SUCCESS;
7811 break;
7812 }
7813
7814 /* Insert interface for reading parent state into per-operation list,
7815 * if there is a parent image. */
7816 VDINTERFACEPARENTSTATE VDIfParent;
7817 VDPARENTSTATEDESC ParentUser;
7818 if (pImage->pPrev)
7819 {
7820 VDIfParent.pfnParentRead = vdParentRead;
7821 ParentUser.pDisk = pDisk;
7822 ParentUser.pImage = pImage->pPrev;
7823 rc = VDInterfaceAdd(&VDIfParent.Core, "VDCompact_ParentState", VDINTERFACETYPE_PARENTSTATE,
7824 &ParentUser, sizeof(VDINTERFACEPARENTSTATE), &pVDIfsOperation);
7825 AssertRC(rc);
7826 }
7827
7828 rc2 = vdThreadFinishRead(pDisk);
7829 AssertRC(rc2);
7830 fLockRead = false;
7831
7832 rc2 = vdThreadStartWrite(pDisk);
7833 AssertRC(rc2);
7834 fLockWrite = true;
7835
7836 rc = pImage->Backend->pfnCompact(pImage->pBackendData,
7837 0, 99,
7838 pDisk->pVDIfsDisk,
7839 pImage->pVDIfsImage,
7840 pVDIfsOperation);
7841 } while (0);
7842
7843 if (RT_UNLIKELY(fLockWrite))
7844 {
7845 rc2 = vdThreadFinishWrite(pDisk);
7846 AssertRC(rc2);
7847 }
7848 else if (RT_UNLIKELY(fLockRead))
7849 {
7850 rc2 = vdThreadFinishRead(pDisk);
7851 AssertRC(rc2);
7852 }
7853
7854 if (pvBuf)
7855 RTMemTmpFree(pvBuf);
7856 if (pvTmp)
7857 RTMemTmpFree(pvTmp);
7858
7859 if (RT_SUCCESS(rc))
7860 {
7861 if (pIfProgress && pIfProgress->pfnProgress)
7862 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7863 }
7864
7865 LogFlowFunc(("returns %Rrc\n", rc));
7866 return rc;
7867}
7868
7869/**
7870 * Resizes the given disk image to the given size.
7871 *
7872 * @return VBox status
7873 * @return VERR_VD_IMAGE_READ_ONLY if image is not writable.
7874 * @return VERR_NOT_SUPPORTED if this kind of image can be compacted, but
7875 *
7876 * @param pDisk Pointer to the HDD container.
7877 * @param cbSize New size of the image.
7878 * @param pPCHSGeometry Pointer to the new physical disk geometry <= (16383,16,63). Not NULL.
7879 * @param pLCHSGeometry Pointer to the new logical disk geometry <= (x,255,63). Not NULL.
7880 * @param pVDIfsOperation Pointer to the per-operation VD interface list.
7881 */
7882VBOXDDU_DECL(int) VDResize(PVDISK pDisk, uint64_t cbSize,
7883 PCVDGEOMETRY pPCHSGeometry,
7884 PCVDGEOMETRY pLCHSGeometry,
7885 PVDINTERFACE pVDIfsOperation)
7886{
7887 /** @todo r=klaus resizing was designed to be part of VDCopy, so having a separate function is not desirable. */
7888 int rc = VINF_SUCCESS;
7889 int rc2;
7890 bool fLockRead = false, fLockWrite = false;
7891
7892 LogFlowFunc(("pDisk=%#p cbSize=%llu pVDIfsOperation=%#p\n",
7893 pDisk, cbSize, pVDIfsOperation));
7894
7895 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
7896
7897 do {
7898 /* Check arguments. */
7899 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
7900 rc = VERR_INVALID_PARAMETER);
7901 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE,
7902 ("u32Signature=%08x\n", pDisk->u32Signature));
7903
7904 rc2 = vdThreadStartRead(pDisk);
7905 AssertRC(rc2);
7906 fLockRead = true;
7907
7908 /* Must have at least one image in the chain, will resize last. */
7909 AssertMsgBreakStmt(pDisk->cImages >= 1, ("cImages=%u\n", pDisk->cImages),
7910 rc = VERR_NOT_SUPPORTED);
7911
7912 PVDIMAGE pImage = pDisk->pLast;
7913
7914 /* If there is no compact callback for not file based backends then
7915 * the backend doesn't need compaction. No need to make much fuss about
7916 * this. For file based ones signal this as not yet supported. */
7917 if (!pImage->Backend->pfnResize)
7918 {
7919 if (pImage->Backend->uBackendCaps & VD_CAP_FILE)
7920 rc = VERR_NOT_SUPPORTED;
7921 else
7922 rc = VINF_SUCCESS;
7923 break;
7924 }
7925
7926 rc2 = vdThreadFinishRead(pDisk);
7927 AssertRC(rc2);
7928 fLockRead = false;
7929
7930 rc2 = vdThreadStartWrite(pDisk);
7931 AssertRC(rc2);
7932 fLockWrite = true;
7933
7934 VDGEOMETRY PCHSGeometryOld;
7935 VDGEOMETRY LCHSGeometryOld;
7936 PCVDGEOMETRY pPCHSGeometryNew;
7937 PCVDGEOMETRY pLCHSGeometryNew;
7938
7939 if (pPCHSGeometry->cCylinders == 0)
7940 {
7941 /* Auto-detect marker, calculate new value ourself. */
7942 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData, &PCHSGeometryOld);
7943 if (RT_SUCCESS(rc) && (PCHSGeometryOld.cCylinders != 0))
7944 PCHSGeometryOld.cCylinders = RT_MIN(cbSize / 512 / PCHSGeometryOld.cHeads / PCHSGeometryOld.cSectors, 16383);
7945 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7946 rc = VINF_SUCCESS;
7947
7948 pPCHSGeometryNew = &PCHSGeometryOld;
7949 }
7950 else
7951 pPCHSGeometryNew = pPCHSGeometry;
7952
7953 if (pLCHSGeometry->cCylinders == 0)
7954 {
7955 /* Auto-detect marker, calculate new value ourself. */
7956 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData, &LCHSGeometryOld);
7957 if (RT_SUCCESS(rc) && (LCHSGeometryOld.cCylinders != 0))
7958 LCHSGeometryOld.cCylinders = cbSize / 512 / LCHSGeometryOld.cHeads / LCHSGeometryOld.cSectors;
7959 else if (rc == VERR_VD_GEOMETRY_NOT_SET)
7960 rc = VINF_SUCCESS;
7961
7962 pLCHSGeometryNew = &LCHSGeometryOld;
7963 }
7964 else
7965 pLCHSGeometryNew = pLCHSGeometry;
7966
7967 if (RT_SUCCESS(rc))
7968 rc = pImage->Backend->pfnResize(pImage->pBackendData,
7969 cbSize,
7970 pPCHSGeometryNew,
7971 pLCHSGeometryNew,
7972 0, 99,
7973 pDisk->pVDIfsDisk,
7974 pImage->pVDIfsImage,
7975 pVDIfsOperation);
7976 } while (0);
7977
7978 if (RT_UNLIKELY(fLockWrite))
7979 {
7980 rc2 = vdThreadFinishWrite(pDisk);
7981 AssertRC(rc2);
7982 }
7983 else if (RT_UNLIKELY(fLockRead))
7984 {
7985 rc2 = vdThreadFinishRead(pDisk);
7986 AssertRC(rc2);
7987 }
7988
7989 if (RT_SUCCESS(rc))
7990 {
7991 if (pIfProgress && pIfProgress->pfnProgress)
7992 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
7993
7994 pDisk->cbSize = cbSize;
7995 }
7996
7997 LogFlowFunc(("returns %Rrc\n", rc));
7998 return rc;
7999}
8000
8001VBOXDDU_DECL(int) VDPrepareWithFilters(PVDISK pDisk, PVDINTERFACE pVDIfsOperation)
8002{
8003 int rc = VINF_SUCCESS;
8004 int rc2;
8005 bool fLockRead = false, fLockWrite = false;
8006
8007 LogFlowFunc(("pDisk=%#p pVDIfsOperation=%#p\n", pDisk, pVDIfsOperation));
8008
8009 PVDINTERFACEPROGRESS pIfProgress = VDIfProgressGet(pVDIfsOperation);
8010
8011 do {
8012 /* Check arguments. */
8013 AssertMsgBreakStmt(VALID_PTR(pDisk), ("pDisk=%#p\n", pDisk),
8014 rc = VERR_INVALID_PARAMETER);
8015 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE,
8016 ("u32Signature=%08x\n", pDisk->u32Signature));
8017
8018 rc2 = vdThreadStartRead(pDisk);
8019 AssertRC(rc2);
8020 fLockRead = true;
8021
8022 /* Must have at least one image in the chain. */
8023 AssertMsgBreakStmt(pDisk->cImages >= 1, ("cImages=%u\n", pDisk->cImages),
8024 rc = VERR_VD_NOT_OPENED);
8025
8026 unsigned uOpenFlags = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
8027 AssertMsgBreakStmt(!(uOpenFlags & VD_OPEN_FLAGS_READONLY),
8028 ("Last image should be read write"),
8029 rc = VERR_VD_IMAGE_READ_ONLY);
8030
8031 rc2 = vdThreadFinishRead(pDisk);
8032 AssertRC(rc2);
8033 fLockRead = false;
8034
8035 rc2 = vdThreadStartWrite(pDisk);
8036 AssertRC(rc2);
8037 fLockWrite = true;
8038
8039 /*
8040 * Open all images in the chain in read write mode first to avoid running
8041 * into an error in the middle of the process.
8042 */
8043 PVDIMAGE pImage = pDisk->pBase;
8044
8045 while (pImage)
8046 {
8047 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8048 if (uOpenFlags & VD_OPEN_FLAGS_READONLY)
8049 {
8050 /*
8051 * Clear skip consistency checks because the image is made writable now and
8052 * skipping consistency checks is only possible for readonly images.
8053 */
8054 uOpenFlags &= ~(VD_OPEN_FLAGS_READONLY | VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS);
8055 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
8056 if (RT_FAILURE(rc))
8057 break;
8058 }
8059 pImage = pImage->pNext;
8060 }
8061
8062 if (RT_SUCCESS(rc))
8063 {
8064 unsigned cImgCur = 0;
8065 unsigned uPercentStart = 0;
8066 unsigned uPercentSpan = 100 / pDisk->cImages - 1;
8067
8068 /* Allocate tmp buffer. */
8069 void *pvBuf = RTMemTmpAlloc(VD_MERGE_BUFFER_SIZE);
8070 if (!pvBuf)
8071 {
8072 rc = VERR_NO_MEMORY;
8073 break;
8074 }
8075
8076 pImage = pDisk->pBase;
8077 pDisk->fLocked = true;
8078
8079 while ( pImage
8080 && RT_SUCCESS(rc))
8081 {
8082 /* Get size of image. */
8083 uint64_t cbSize = vdImageGetSize(pImage);
8084 uint64_t cbSizeFile = pImage->Backend->pfnGetFileSize(pImage->pBackendData);
8085 uint64_t cbFileWritten = 0;
8086 uint64_t uOffset = 0;
8087 uint64_t cbRemaining = cbSize;
8088
8089 do
8090 {
8091 size_t cbThisRead = RT_MIN(VD_MERGE_BUFFER_SIZE, cbRemaining);
8092 RTSGSEG SegmentBuf;
8093 RTSGBUF SgBuf;
8094 VDIOCTX IoCtx;
8095
8096 SegmentBuf.pvSeg = pvBuf;
8097 SegmentBuf.cbSeg = VD_MERGE_BUFFER_SIZE;
8098 RTSgBufInit(&SgBuf, &SegmentBuf, 1);
8099 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_READ, 0, 0, NULL,
8100 &SgBuf, NULL, NULL, VDIOCTX_FLAGS_SYNC);
8101
8102 rc = pImage->Backend->pfnRead(pImage->pBackendData, uOffset,
8103 cbThisRead, &IoCtx, &cbThisRead);
8104 if (rc != VERR_VD_BLOCK_FREE)
8105 {
8106 if (RT_FAILURE(rc))
8107 break;
8108
8109 /* Apply filter chains. */
8110 rc = vdFilterChainApplyRead(pDisk, uOffset, cbThisRead, &IoCtx);
8111 if (RT_FAILURE(rc))
8112 break;
8113
8114 rc = vdFilterChainApplyWrite(pDisk, uOffset, cbThisRead, &IoCtx);
8115 if (RT_FAILURE(rc))
8116 break;
8117
8118 RTSgBufReset(&SgBuf);
8119 size_t cbThisWrite = 0;
8120 size_t cbPreRead = 0;
8121 size_t cbPostRead = 0;
8122 rc = pImage->Backend->pfnWrite(pImage->pBackendData, uOffset,
8123 cbThisRead, &IoCtx, &cbThisWrite,
8124 &cbPreRead, &cbPostRead, 0);
8125 if (RT_FAILURE(rc))
8126 break;
8127 Assert(cbThisWrite == cbThisRead);
8128 cbFileWritten += cbThisWrite;
8129 }
8130 else
8131 rc = VINF_SUCCESS;
8132
8133 uOffset += cbThisRead;
8134 cbRemaining -= cbThisRead;
8135
8136 if (pIfProgress && pIfProgress->pfnProgress)
8137 {
8138 rc2 = pIfProgress->pfnProgress(pIfProgress->Core.pvUser,
8139 uPercentStart + cbFileWritten * uPercentSpan / cbSizeFile);
8140 AssertRC(rc2); /* Cancelling this operation without leaving an inconsistent state is not possible. */
8141 }
8142 } while (uOffset < cbSize);
8143
8144 pImage = pImage->pNext;
8145 cImgCur++;
8146 uPercentStart += uPercentSpan;
8147 }
8148
8149 pDisk->fLocked = false;
8150 if (pvBuf)
8151 RTMemTmpFree(pvBuf);
8152 }
8153
8154 /* Change images except last one back to readonly. */
8155 pImage = pDisk->pBase;
8156 while ( pImage != pDisk->pLast
8157 && pImage)
8158 {
8159 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8160 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
8161 rc2 = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
8162 if (RT_FAILURE(rc2))
8163 {
8164 if (RT_SUCCESS(rc))
8165 rc = rc2;
8166 break;
8167 }
8168 pImage = pImage->pNext;
8169 }
8170 } while (0);
8171
8172 if (RT_UNLIKELY(fLockWrite))
8173 {
8174 rc2 = vdThreadFinishWrite(pDisk);
8175 AssertRC(rc2);
8176 }
8177 else if (RT_UNLIKELY(fLockRead))
8178 {
8179 rc2 = vdThreadFinishRead(pDisk);
8180 AssertRC(rc2);
8181 }
8182
8183 if ( RT_SUCCESS(rc)
8184 && pIfProgress
8185 && pIfProgress->pfnProgress)
8186 pIfProgress->pfnProgress(pIfProgress->Core.pvUser, 100);
8187
8188 LogFlowFunc(("returns %Rrc\n", rc));
8189 return rc;
8190}
8191
8192/**
8193 * Closes the last opened image file in HDD container.
8194 * If previous image file was opened in read-only mode (the normal case) and
8195 * the last opened image is in read-write mode then the previous image will be
8196 * reopened in read/write mode.
8197 *
8198 * @returns VBox status code.
8199 * @returns VERR_VD_NOT_OPENED if no image is opened in HDD container.
8200 * @param pDisk Pointer to HDD container.
8201 * @param fDelete If true, delete the image from the host disk.
8202 */
8203VBOXDDU_DECL(int) VDClose(PVDISK pDisk, bool fDelete)
8204{
8205 int rc = VINF_SUCCESS;
8206 int rc2;
8207 bool fLockWrite = false;
8208
8209 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8210 do
8211 {
8212 /* sanity check */
8213 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8214 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8215
8216 /* Not worth splitting this up into a read lock phase and write
8217 * lock phase, as closing an image is a relatively fast operation
8218 * dominated by the part which needs the write lock. */
8219 rc2 = vdThreadStartWrite(pDisk);
8220 AssertRC(rc2);
8221 fLockWrite = true;
8222
8223 PVDIMAGE pImage = pDisk->pLast;
8224 if (!pImage)
8225 {
8226 rc = VERR_VD_NOT_OPENED;
8227 break;
8228 }
8229
8230 /* Destroy the current discard state first which might still have pending blocks. */
8231 rc = vdDiscardStateDestroy(pDisk);
8232 if (RT_FAILURE(rc))
8233 break;
8234
8235 unsigned uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8236 /* Remove image from list of opened images. */
8237 vdRemoveImageFromList(pDisk, pImage);
8238 /* Close (and optionally delete) image. */
8239 rc = pImage->Backend->pfnClose(pImage->pBackendData, fDelete);
8240 /* Free remaining resources related to the image. */
8241 RTStrFree(pImage->pszFilename);
8242 RTMemFree(pImage);
8243
8244 pImage = pDisk->pLast;
8245 if (!pImage)
8246 break;
8247
8248 /* If disk was previously in read/write mode, make sure it will stay
8249 * like this (if possible) after closing this image. Set the open flags
8250 * accordingly. */
8251 if (!(uOpenFlags & VD_OPEN_FLAGS_READONLY))
8252 {
8253 uOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
8254 uOpenFlags &= ~ VD_OPEN_FLAGS_READONLY;
8255 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData, uOpenFlags);
8256 }
8257
8258 /* Cache disk information. */
8259 pDisk->cbSize = vdImageGetSize(pImage);
8260
8261 /* Cache PCHS geometry. */
8262 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8263 &pDisk->PCHSGeometry);
8264 if (RT_FAILURE(rc2))
8265 {
8266 pDisk->PCHSGeometry.cCylinders = 0;
8267 pDisk->PCHSGeometry.cHeads = 0;
8268 pDisk->PCHSGeometry.cSectors = 0;
8269 }
8270 else
8271 {
8272 /* Make sure the PCHS geometry is properly clipped. */
8273 pDisk->PCHSGeometry.cCylinders = RT_MIN(pDisk->PCHSGeometry.cCylinders, 16383);
8274 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 16);
8275 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
8276 }
8277
8278 /* Cache LCHS geometry. */
8279 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
8280 &pDisk->LCHSGeometry);
8281 if (RT_FAILURE(rc2))
8282 {
8283 pDisk->LCHSGeometry.cCylinders = 0;
8284 pDisk->LCHSGeometry.cHeads = 0;
8285 pDisk->LCHSGeometry.cSectors = 0;
8286 }
8287 else
8288 {
8289 /* Make sure the LCHS geometry is properly clipped. */
8290 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
8291 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
8292 }
8293 } while (0);
8294
8295 if (RT_UNLIKELY(fLockWrite))
8296 {
8297 rc2 = vdThreadFinishWrite(pDisk);
8298 AssertRC(rc2);
8299 }
8300
8301 LogFlowFunc(("returns %Rrc\n", rc));
8302 return rc;
8303}
8304
8305/**
8306 * Closes the currently opened cache image file in HDD container.
8307 *
8308 * @return VBox status code.
8309 * @return VERR_VD_NOT_OPENED if no cache is opened in HDD container.
8310 * @param pDisk Pointer to HDD container.
8311 * @param fDelete If true, delete the image from the host disk.
8312 */
8313VBOXDDU_DECL(int) VDCacheClose(PVDISK pDisk, bool fDelete)
8314{
8315 int rc = VINF_SUCCESS;
8316 int rc2;
8317 bool fLockWrite = false;
8318 PVDCACHE pCache = NULL;
8319
8320 LogFlowFunc(("pDisk=%#p fDelete=%d\n", pDisk, fDelete));
8321
8322 do
8323 {
8324 /* sanity check */
8325 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8326 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8327
8328 rc2 = vdThreadStartWrite(pDisk);
8329 AssertRC(rc2);
8330 fLockWrite = true;
8331
8332 AssertPtrBreakStmt(pDisk->pCache, rc = VERR_VD_CACHE_NOT_FOUND);
8333
8334 pCache = pDisk->pCache;
8335 pDisk->pCache = NULL;
8336
8337 pCache->Backend->pfnClose(pCache->pBackendData, fDelete);
8338 if (pCache->pszFilename)
8339 RTStrFree(pCache->pszFilename);
8340 RTMemFree(pCache);
8341 } while (0);
8342
8343 if (RT_LIKELY(fLockWrite))
8344 {
8345 rc2 = vdThreadFinishWrite(pDisk);
8346 AssertRC(rc2);
8347 }
8348
8349 LogFlowFunc(("returns %Rrc\n", rc));
8350 return rc;
8351}
8352
8353VBOXDDU_DECL(int) VDFilterRemove(PVDISK pDisk, uint32_t fFlags)
8354{
8355 int rc = VINF_SUCCESS;
8356 int rc2;
8357 bool fLockWrite = false;
8358 PVDFILTER pFilter = NULL;
8359
8360 LogFlowFunc(("pDisk=%#p\n", pDisk));
8361
8362 do
8363 {
8364 /* sanity check */
8365 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8366 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8367
8368 AssertMsgBreakStmt(!(fFlags & ~VD_FILTER_FLAGS_MASK),
8369 ("Invalid flags set (fFlags=%#x)\n", fFlags),
8370 rc = VERR_INVALID_PARAMETER);
8371
8372 rc2 = vdThreadStartWrite(pDisk);
8373 AssertRC(rc2);
8374 fLockWrite = true;
8375
8376 if (fFlags & VD_FILTER_FLAGS_WRITE)
8377 {
8378 AssertBreakStmt(!RTListIsEmpty(&pDisk->ListFilterChainWrite), rc = VERR_VD_NOT_OPENED);
8379 pFilter = RTListGetLast(&pDisk->ListFilterChainWrite, VDFILTER, ListNodeChainWrite);
8380 AssertPtr(pFilter);
8381 RTListNodeRemove(&pFilter->ListNodeChainWrite);
8382 vdFilterRelease(pFilter);
8383 }
8384
8385 if (fFlags & VD_FILTER_FLAGS_READ)
8386 {
8387 AssertBreakStmt(!RTListIsEmpty(&pDisk->ListFilterChainRead), rc = VERR_VD_NOT_OPENED);
8388 pFilter = RTListGetLast(&pDisk->ListFilterChainRead, VDFILTER, ListNodeChainRead);
8389 AssertPtr(pFilter);
8390 RTListNodeRemove(&pFilter->ListNodeChainRead);
8391 vdFilterRelease(pFilter);
8392 }
8393 } while (0);
8394
8395 if (RT_LIKELY(fLockWrite))
8396 {
8397 rc2 = vdThreadFinishWrite(pDisk);
8398 AssertRC(rc2);
8399 }
8400
8401 LogFlowFunc(("returns %Rrc\n", rc));
8402 return rc;
8403}
8404
8405/**
8406 * Closes all opened image files in HDD container.
8407 *
8408 * @returns VBox status code.
8409 * @param pDisk Pointer to HDD container.
8410 */
8411VBOXDDU_DECL(int) VDCloseAll(PVDISK pDisk)
8412{
8413 int rc = VINF_SUCCESS;
8414 int rc2;
8415 bool fLockWrite = false;
8416
8417 LogFlowFunc(("pDisk=%#p\n", pDisk));
8418 do
8419 {
8420 /* sanity check */
8421 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8422 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8423
8424 /* Lock the entire operation. */
8425 rc2 = vdThreadStartWrite(pDisk);
8426 AssertRC(rc2);
8427 fLockWrite = true;
8428
8429 PVDCACHE pCache = pDisk->pCache;
8430 if (pCache)
8431 {
8432 rc2 = pCache->Backend->pfnClose(pCache->pBackendData, false);
8433 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8434 rc = rc2;
8435
8436 if (pCache->pszFilename)
8437 RTStrFree(pCache->pszFilename);
8438 RTMemFree(pCache);
8439 }
8440
8441 PVDIMAGE pImage = pDisk->pLast;
8442 while (VALID_PTR(pImage))
8443 {
8444 PVDIMAGE pPrev = pImage->pPrev;
8445 /* Remove image from list of opened images. */
8446 vdRemoveImageFromList(pDisk, pImage);
8447 /* Close image. */
8448 rc2 = pImage->Backend->pfnClose(pImage->pBackendData, false);
8449 if (RT_FAILURE(rc2) && RT_SUCCESS(rc))
8450 rc = rc2;
8451 /* Free remaining resources related to the image. */
8452 RTStrFree(pImage->pszFilename);
8453 RTMemFree(pImage);
8454 pImage = pPrev;
8455 }
8456 Assert(!VALID_PTR(pDisk->pLast));
8457 } while (0);
8458
8459 if (RT_UNLIKELY(fLockWrite))
8460 {
8461 rc2 = vdThreadFinishWrite(pDisk);
8462 AssertRC(rc2);
8463 }
8464
8465 LogFlowFunc(("returns %Rrc\n", rc));
8466 return rc;
8467}
8468
8469/**
8470 * Removes all filters of the given HDD container.
8471 *
8472 * @return VBox status code.
8473 * @param pDisk Pointer to HDD container.
8474 */
8475VBOXDDU_DECL(int) VDFilterRemoveAll(PVDISK pDisk)
8476{
8477 int rc = VINF_SUCCESS;
8478 int rc2;
8479 bool fLockWrite = false;
8480
8481 LogFlowFunc(("pDisk=%#p\n", pDisk));
8482 do
8483 {
8484 /* sanity check */
8485 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8486 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8487
8488 /* Lock the entire operation. */
8489 rc2 = vdThreadStartWrite(pDisk);
8490 AssertRC(rc2);
8491 fLockWrite = true;
8492
8493 PVDFILTER pFilter, pFilterNext;
8494 RTListForEachSafe(&pDisk->ListFilterChainWrite, pFilter, pFilterNext, VDFILTER, ListNodeChainWrite)
8495 {
8496 RTListNodeRemove(&pFilter->ListNodeChainWrite);
8497 vdFilterRelease(pFilter);
8498 }
8499
8500 RTListForEachSafe(&pDisk->ListFilterChainRead, pFilter, pFilterNext, VDFILTER, ListNodeChainRead)
8501 {
8502 RTListNodeRemove(&pFilter->ListNodeChainRead);
8503 vdFilterRelease(pFilter);
8504 }
8505 Assert(RTListIsEmpty(&pDisk->ListFilterChainRead));
8506 Assert(RTListIsEmpty(&pDisk->ListFilterChainWrite));
8507 } while (0);
8508
8509 if (RT_UNLIKELY(fLockWrite))
8510 {
8511 rc2 = vdThreadFinishWrite(pDisk);
8512 AssertRC(rc2);
8513 }
8514
8515 LogFlowFunc(("returns %Rrc\n", rc));
8516 return rc;
8517}
8518
8519/**
8520 * Read data from virtual HDD.
8521 *
8522 * @returns VBox status code.
8523 * @retval VERR_VD_NOT_OPENED if no image is opened in HDD container.
8524 * @param pDisk Pointer to HDD container.
8525 * @param uOffset Offset of first reading byte from start of disk.
8526 * @param pvBuf Pointer to buffer for reading data.
8527 * @param cbRead Number of bytes to read.
8528 */
8529VBOXDDU_DECL(int) VDRead(PVDISK pDisk, uint64_t uOffset, void *pvBuf,
8530 size_t cbRead)
8531{
8532 int rc = VINF_SUCCESS;
8533 int rc2;
8534 bool fLockRead = false;
8535
8536 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbRead=%zu\n",
8537 pDisk, uOffset, pvBuf, cbRead));
8538 do
8539 {
8540 /* sanity check */
8541 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8542 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8543
8544 /* Check arguments. */
8545 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8546 ("pvBuf=%#p\n", pvBuf),
8547 rc = VERR_INVALID_PARAMETER);
8548 AssertMsgBreakStmt(cbRead,
8549 ("cbRead=%zu\n", cbRead),
8550 rc = VERR_INVALID_PARAMETER);
8551
8552 rc2 = vdThreadStartRead(pDisk);
8553 AssertRC(rc2);
8554 fLockRead = true;
8555
8556 PVDIMAGE pImage = pDisk->pLast;
8557 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8558
8559 if (uOffset + cbRead > pDisk->cbSize)
8560 {
8561 /* Floppy images might be smaller than the standard expected by
8562 the floppy controller code. So, we won't fail here. */
8563 AssertMsgBreakStmt(pDisk->enmType == VDTYPE_FLOPPY,
8564 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
8565 uOffset, cbRead, pDisk->cbSize),
8566 rc = VERR_EOF);
8567 memset(pvBuf, 0xf6, cbRead); /* f6h = format.com filler byte */
8568 if (uOffset >= pDisk->cbSize)
8569 break;
8570 cbRead = pDisk->cbSize - uOffset;
8571 }
8572
8573 rc = vdReadHelper(pDisk, pImage, uOffset, pvBuf, cbRead,
8574 true /* fUpdateCache */);
8575 } while (0);
8576
8577 if (RT_UNLIKELY(fLockRead))
8578 {
8579 rc2 = vdThreadFinishRead(pDisk);
8580 AssertRC(rc2);
8581 }
8582
8583 LogFlowFunc(("returns %Rrc\n", rc));
8584 return rc;
8585}
8586
8587/**
8588 * Write data to virtual HDD.
8589 *
8590 * @returns VBox status code.
8591 * @retval VERR_VD_NOT_OPENED if no image is opened in HDD container.
8592 * @param pDisk Pointer to HDD container.
8593 * @param uOffset Offset of the first byte being
8594 * written from start of disk.
8595 * @param pvBuf Pointer to buffer for writing data.
8596 * @param cbWrite Number of bytes to write.
8597 */
8598VBOXDDU_DECL(int) VDWrite(PVDISK pDisk, uint64_t uOffset, const void *pvBuf,
8599 size_t cbWrite)
8600{
8601 int rc = VINF_SUCCESS;
8602 int rc2;
8603 bool fLockWrite = false;
8604
8605 LogFlowFunc(("pDisk=%#p uOffset=%llu pvBuf=%p cbWrite=%zu\n",
8606 pDisk, uOffset, pvBuf, cbWrite));
8607 do
8608 {
8609 /* sanity check */
8610 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8611 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8612
8613 /* Check arguments. */
8614 AssertMsgBreakStmt(VALID_PTR(pvBuf),
8615 ("pvBuf=%#p\n", pvBuf),
8616 rc = VERR_INVALID_PARAMETER);
8617 AssertMsgBreakStmt(cbWrite,
8618 ("cbWrite=%zu\n", cbWrite),
8619 rc = VERR_INVALID_PARAMETER);
8620
8621 rc2 = vdThreadStartWrite(pDisk);
8622 AssertRC(rc2);
8623 fLockWrite = true;
8624
8625 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
8626 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
8627 uOffset, cbWrite, pDisk->cbSize),
8628 rc = VERR_INVALID_PARAMETER);
8629
8630 PVDIMAGE pImage = pDisk->pLast;
8631 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8632
8633 vdSetModifiedFlag(pDisk);
8634 rc = vdWriteHelper(pDisk, pImage, uOffset, pvBuf, cbWrite,
8635 VDIOCTX_FLAGS_READ_UPDATE_CACHE);
8636 if (RT_FAILURE(rc))
8637 break;
8638
8639 /* If there is a merge (in the direction towards a parent) running
8640 * concurrently then we have to also "relay" the write to this parent,
8641 * as the merge position might be already past the position where
8642 * this write is going. The "context" of the write can come from the
8643 * natural chain, since merging either already did or will take care
8644 * of the "other" content which is might be needed to fill the block
8645 * to a full allocation size. The cache doesn't need to be touched
8646 * as this write is covered by the previous one. */
8647 if (RT_UNLIKELY(pDisk->pImageRelay))
8648 rc = vdWriteHelper(pDisk, pDisk->pImageRelay, uOffset,
8649 pvBuf, cbWrite, VDIOCTX_FLAGS_DEFAULT);
8650 } while (0);
8651
8652 if (RT_UNLIKELY(fLockWrite))
8653 {
8654 rc2 = vdThreadFinishWrite(pDisk);
8655 AssertRC(rc2);
8656 }
8657
8658 LogFlowFunc(("returns %Rrc\n", rc));
8659 return rc;
8660}
8661
8662/**
8663 * Make sure the on disk representation of a virtual HDD is up to date.
8664 *
8665 * @returns VBox status code.
8666 * @retval VERR_VD_NOT_OPENED if no image is opened in HDD container.
8667 * @param pDisk Pointer to HDD container.
8668 */
8669VBOXDDU_DECL(int) VDFlush(PVDISK pDisk)
8670{
8671 int rc = VINF_SUCCESS;
8672 int rc2;
8673 bool fLockWrite = false;
8674
8675 LogFlowFunc(("pDisk=%#p\n", pDisk));
8676 do
8677 {
8678 /* sanity check */
8679 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8680 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8681
8682 rc2 = vdThreadStartWrite(pDisk);
8683 AssertRC(rc2);
8684 fLockWrite = true;
8685
8686 PVDIMAGE pImage = pDisk->pLast;
8687 AssertPtrBreakStmt(pImage, rc = VERR_VD_NOT_OPENED);
8688
8689 VDIOCTX IoCtx;
8690 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
8691
8692 rc = RTSemEventCreate(&hEventComplete);
8693 if (RT_FAILURE(rc))
8694 break;
8695
8696 vdIoCtxInit(&IoCtx, pDisk, VDIOCTXTXDIR_FLUSH, 0, 0, pImage, NULL,
8697 NULL, vdFlushHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
8698
8699 IoCtx.Type.Root.pfnComplete = vdIoCtxSyncComplete;
8700 IoCtx.Type.Root.pvUser1 = pDisk;
8701 IoCtx.Type.Root.pvUser2 = hEventComplete;
8702 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
8703
8704 RTSemEventDestroy(hEventComplete);
8705 } while (0);
8706
8707 if (RT_UNLIKELY(fLockWrite))
8708 {
8709 rc2 = vdThreadFinishWrite(pDisk);
8710 AssertRC(rc2);
8711 }
8712
8713 LogFlowFunc(("returns %Rrc\n", rc));
8714 return rc;
8715}
8716
8717/**
8718 * Get number of opened images in HDD container.
8719 *
8720 * @returns Number of opened images for HDD container. 0 if no images have been opened.
8721 * @param pDisk Pointer to HDD container.
8722 */
8723VBOXDDU_DECL(unsigned) VDGetCount(PVDISK pDisk)
8724{
8725 unsigned cImages;
8726 int rc2;
8727 bool fLockRead = false;
8728
8729 LogFlowFunc(("pDisk=%#p\n", pDisk));
8730 do
8731 {
8732 /* sanity check */
8733 AssertPtrBreakStmt(pDisk, cImages = 0);
8734 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8735
8736 rc2 = vdThreadStartRead(pDisk);
8737 AssertRC(rc2);
8738 fLockRead = true;
8739
8740 cImages = pDisk->cImages;
8741 } while (0);
8742
8743 if (RT_UNLIKELY(fLockRead))
8744 {
8745 rc2 = vdThreadFinishRead(pDisk);
8746 AssertRC(rc2);
8747 }
8748
8749 LogFlowFunc(("returns %u\n", cImages));
8750 return cImages;
8751}
8752
8753/**
8754 * Get read/write mode of HDD container.
8755 *
8756 * @returns Virtual disk ReadOnly status.
8757 * @returns true if no image is opened in HDD container.
8758 * @param pDisk Pointer to HDD container.
8759 */
8760VBOXDDU_DECL(bool) VDIsReadOnly(PVDISK pDisk)
8761{
8762 bool fReadOnly;
8763 int rc2;
8764 bool fLockRead = false;
8765
8766 LogFlowFunc(("pDisk=%#p\n", pDisk));
8767 do
8768 {
8769 /* sanity check */
8770 AssertPtrBreakStmt(pDisk, fReadOnly = false);
8771 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8772
8773 rc2 = vdThreadStartRead(pDisk);
8774 AssertRC(rc2);
8775 fLockRead = true;
8776
8777 PVDIMAGE pImage = pDisk->pLast;
8778 AssertPtrBreakStmt(pImage, fReadOnly = true);
8779
8780 unsigned uOpenFlags;
8781 uOpenFlags = pDisk->pLast->Backend->pfnGetOpenFlags(pDisk->pLast->pBackendData);
8782 fReadOnly = !!(uOpenFlags & VD_OPEN_FLAGS_READONLY);
8783 } while (0);
8784
8785 if (RT_UNLIKELY(fLockRead))
8786 {
8787 rc2 = vdThreadFinishRead(pDisk);
8788 AssertRC(rc2);
8789 }
8790
8791 LogFlowFunc(("returns %d\n", fReadOnly));
8792 return fReadOnly;
8793}
8794
8795/**
8796 * Get sector size of an image in HDD container.
8797 *
8798 * @return Virtual disk sector size in bytes.
8799 * @return 0 if image with specified number was not opened.
8800 * @param pDisk Pointer to HDD container.
8801 * @param nImage Image number, counts from 0. 0 is always base image of container.
8802 */
8803VBOXDDU_DECL(uint32_t) VDGetSectorSize(PVDISK pDisk, unsigned nImage)
8804{
8805 uint64_t cbSector;
8806 int rc2;
8807 bool fLockRead = false;
8808
8809 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8810 do
8811 {
8812 /* sanity check */
8813 AssertPtrBreakStmt(pDisk, cbSector = 0);
8814 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8815
8816 rc2 = vdThreadStartRead(pDisk);
8817 AssertRC(rc2);
8818 fLockRead = true;
8819
8820 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8821 AssertPtrBreakStmt(pImage, cbSector = 0);
8822
8823 PCVDREGIONLIST pRegionList = NULL;
8824 int rc = pImage->Backend->pfnQueryRegions(pImage->pBackendData, &pRegionList);
8825 if (RT_SUCCESS(rc))
8826 {
8827 AssertBreakStmt(pRegionList->cRegions == 1, cbSector = 0);
8828 cbSector = pRegionList->aRegions[0].cbBlock;
8829
8830 AssertPtr(pImage->Backend->pfnRegionListRelease);
8831 pImage->Backend->pfnRegionListRelease(pImage->pBackendData, pRegionList);
8832 }
8833 else
8834 cbSector = 0;
8835 } while (0);
8836
8837 if (RT_UNLIKELY(fLockRead))
8838 {
8839 rc2 = vdThreadFinishRead(pDisk);
8840 AssertRC(rc2);
8841 }
8842
8843 LogFlowFunc(("returns %u\n", cbSector));
8844 return cbSector;
8845}
8846
8847/**
8848 * Get total capacity of an image in HDD container.
8849 *
8850 * @returns Virtual disk size in bytes.
8851 * @returns 0 if no image with specified number was not opened.
8852 * @param pDisk Pointer to HDD container.
8853 * @param nImage Image number, counts from 0. 0 is always base image of container.
8854 */
8855VBOXDDU_DECL(uint64_t) VDGetSize(PVDISK pDisk, unsigned nImage)
8856{
8857 uint64_t cbSize;
8858 int rc2;
8859 bool fLockRead = false;
8860
8861 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8862 do
8863 {
8864 /* sanity check */
8865 AssertPtrBreakStmt(pDisk, cbSize = 0);
8866 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8867
8868 rc2 = vdThreadStartRead(pDisk);
8869 AssertRC(rc2);
8870 fLockRead = true;
8871
8872 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8873 AssertPtrBreakStmt(pImage, cbSize = 0);
8874
8875 cbSize = vdImageGetSize(pImage);
8876 } while (0);
8877
8878 if (RT_UNLIKELY(fLockRead))
8879 {
8880 rc2 = vdThreadFinishRead(pDisk);
8881 AssertRC(rc2);
8882 }
8883
8884 LogFlowFunc(("returns %llu\n", cbSize));
8885 return cbSize;
8886}
8887
8888/**
8889 * Get total file size of an image in HDD container.
8890 *
8891 * @returns Virtual disk size in bytes.
8892 * @returns 0 if no image is opened in HDD container.
8893 * @param pDisk Pointer to HDD container.
8894 * @param nImage Image number, counts from 0. 0 is always base image of container.
8895 */
8896VBOXDDU_DECL(uint64_t) VDGetFileSize(PVDISK pDisk, unsigned nImage)
8897{
8898 uint64_t cbSize;
8899 int rc2;
8900 bool fLockRead = false;
8901
8902 LogFlowFunc(("pDisk=%#p nImage=%u\n", pDisk, nImage));
8903 do
8904 {
8905 /* sanity check */
8906 AssertPtrBreakStmt(pDisk, cbSize = 0);
8907 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8908
8909 rc2 = vdThreadStartRead(pDisk);
8910 AssertRC(rc2);
8911 fLockRead = true;
8912
8913 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8914 AssertPtrBreakStmt(pImage, cbSize = 0);
8915 cbSize = pImage->Backend->pfnGetFileSize(pImage->pBackendData);
8916 } while (0);
8917
8918 if (RT_UNLIKELY(fLockRead))
8919 {
8920 rc2 = vdThreadFinishRead(pDisk);
8921 AssertRC(rc2);
8922 }
8923
8924 LogFlowFunc(("returns %llu\n", cbSize));
8925 return cbSize;
8926}
8927
8928/**
8929 * Get virtual disk PCHS geometry stored in HDD container.
8930 *
8931 * @returns VBox status code.
8932 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8933 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8934 * @param pDisk Pointer to HDD container.
8935 * @param nImage Image number, counts from 0. 0 is always base image of container.
8936 * @param pPCHSGeometry Where to store PCHS geometry. Not NULL.
8937 */
8938VBOXDDU_DECL(int) VDGetPCHSGeometry(PVDISK pDisk, unsigned nImage,
8939 PVDGEOMETRY pPCHSGeometry)
8940{
8941 int rc = VINF_SUCCESS;
8942 int rc2;
8943 bool fLockRead = false;
8944
8945 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p\n",
8946 pDisk, nImage, pPCHSGeometry));
8947 do
8948 {
8949 /* sanity check */
8950 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
8951 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
8952
8953 /* Check arguments. */
8954 AssertMsgBreakStmt(VALID_PTR(pPCHSGeometry),
8955 ("pPCHSGeometry=%#p\n", pPCHSGeometry),
8956 rc = VERR_INVALID_PARAMETER);
8957
8958 rc2 = vdThreadStartRead(pDisk);
8959 AssertRC(rc2);
8960 fLockRead = true;
8961
8962 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
8963 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
8964
8965 if (pImage == pDisk->pLast)
8966 {
8967 /* Use cached information if possible. */
8968 if (pDisk->PCHSGeometry.cCylinders != 0)
8969 *pPCHSGeometry = pDisk->PCHSGeometry;
8970 else
8971 rc = VERR_VD_GEOMETRY_NOT_SET;
8972 }
8973 else
8974 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
8975 pPCHSGeometry);
8976 } while (0);
8977
8978 if (RT_UNLIKELY(fLockRead))
8979 {
8980 rc2 = vdThreadFinishRead(pDisk);
8981 AssertRC(rc2);
8982 }
8983
8984 LogFlowFunc(("%Rrc (PCHS=%u/%u/%u)\n", rc,
8985 pDisk->PCHSGeometry.cCylinders, pDisk->PCHSGeometry.cHeads,
8986 pDisk->PCHSGeometry.cSectors));
8987 return rc;
8988}
8989
8990/**
8991 * Store virtual disk PCHS geometry in HDD container.
8992 *
8993 * Note that in case of unrecoverable error all images in HDD container will be closed.
8994 *
8995 * @returns VBox status code.
8996 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
8997 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
8998 * @param pDisk Pointer to HDD container.
8999 * @param nImage Image number, counts from 0. 0 is always base image of container.
9000 * @param pPCHSGeometry Where to load PCHS geometry from. Not NULL.
9001 */
9002VBOXDDU_DECL(int) VDSetPCHSGeometry(PVDISK pDisk, unsigned nImage,
9003 PCVDGEOMETRY pPCHSGeometry)
9004{
9005 int rc = VINF_SUCCESS;
9006 int rc2;
9007 bool fLockWrite = false;
9008
9009 LogFlowFunc(("pDisk=%#p nImage=%u pPCHSGeometry=%#p PCHS=%u/%u/%u\n",
9010 pDisk, nImage, pPCHSGeometry, pPCHSGeometry->cCylinders,
9011 pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
9012 do
9013 {
9014 /* sanity check */
9015 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9016 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9017
9018 /* Check arguments. */
9019 AssertMsgBreakStmt( VALID_PTR(pPCHSGeometry)
9020 && pPCHSGeometry->cHeads <= 16
9021 && pPCHSGeometry->cSectors <= 63,
9022 ("pPCHSGeometry=%#p PCHS=%u/%u/%u\n", pPCHSGeometry,
9023 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads,
9024 pPCHSGeometry->cSectors),
9025 rc = VERR_INVALID_PARAMETER);
9026
9027 rc2 = vdThreadStartWrite(pDisk);
9028 AssertRC(rc2);
9029 fLockWrite = true;
9030
9031 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9032 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9033
9034 if (pImage == pDisk->pLast)
9035 {
9036 if ( pPCHSGeometry->cCylinders != pDisk->PCHSGeometry.cCylinders
9037 || pPCHSGeometry->cHeads != pDisk->PCHSGeometry.cHeads
9038 || pPCHSGeometry->cSectors != pDisk->PCHSGeometry.cSectors)
9039 {
9040 /* Only update geometry if it is changed. Avoids similar checks
9041 * in every backend. Most of the time the new geometry is set
9042 * to the previous values, so no need to go through the hassle
9043 * of updating an image which could be opened in read-only mode
9044 * right now. */
9045 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
9046 pPCHSGeometry);
9047
9048 /* Cache new geometry values in any case. */
9049 rc2 = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
9050 &pDisk->PCHSGeometry);
9051 if (RT_FAILURE(rc2))
9052 {
9053 pDisk->PCHSGeometry.cCylinders = 0;
9054 pDisk->PCHSGeometry.cHeads = 0;
9055 pDisk->PCHSGeometry.cSectors = 0;
9056 }
9057 else
9058 {
9059 /* Make sure the CHS geometry is properly clipped. */
9060 pDisk->PCHSGeometry.cHeads = RT_MIN(pDisk->PCHSGeometry.cHeads, 255);
9061 pDisk->PCHSGeometry.cSectors = RT_MIN(pDisk->PCHSGeometry.cSectors, 63);
9062 }
9063 }
9064 }
9065 else
9066 {
9067 VDGEOMETRY PCHS;
9068 rc = pImage->Backend->pfnGetPCHSGeometry(pImage->pBackendData,
9069 &PCHS);
9070 if ( RT_FAILURE(rc)
9071 || pPCHSGeometry->cCylinders != PCHS.cCylinders
9072 || pPCHSGeometry->cHeads != PCHS.cHeads
9073 || pPCHSGeometry->cSectors != PCHS.cSectors)
9074 {
9075 /* Only update geometry if it is changed. Avoids similar checks
9076 * in every backend. Most of the time the new geometry is set
9077 * to the previous values, so no need to go through the hassle
9078 * of updating an image which could be opened in read-only mode
9079 * right now. */
9080 rc = pImage->Backend->pfnSetPCHSGeometry(pImage->pBackendData,
9081 pPCHSGeometry);
9082 }
9083 }
9084 } while (0);
9085
9086 if (RT_UNLIKELY(fLockWrite))
9087 {
9088 rc2 = vdThreadFinishWrite(pDisk);
9089 AssertRC(rc2);
9090 }
9091
9092 LogFlowFunc(("returns %Rrc\n", rc));
9093 return rc;
9094}
9095
9096/**
9097 * Get virtual disk LCHS geometry stored in HDD container.
9098 *
9099 * @returns VBox status code.
9100 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9101 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9102 * @param pDisk Pointer to HDD container.
9103 * @param nImage Image number, counts from 0. 0 is always base image of container.
9104 * @param pLCHSGeometry Where to store LCHS geometry. Not NULL.
9105 */
9106VBOXDDU_DECL(int) VDGetLCHSGeometry(PVDISK pDisk, unsigned nImage,
9107 PVDGEOMETRY pLCHSGeometry)
9108{
9109 int rc = VINF_SUCCESS;
9110 int rc2;
9111 bool fLockRead = false;
9112
9113 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p\n",
9114 pDisk, nImage, pLCHSGeometry));
9115 do
9116 {
9117 /* sanity check */
9118 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9119 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9120
9121 /* Check arguments. */
9122 AssertMsgBreakStmt(VALID_PTR(pLCHSGeometry),
9123 ("pLCHSGeometry=%#p\n", pLCHSGeometry),
9124 rc = VERR_INVALID_PARAMETER);
9125
9126 rc2 = vdThreadStartRead(pDisk);
9127 AssertRC(rc2);
9128 fLockRead = true;
9129
9130 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9131 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9132
9133 if (pImage == pDisk->pLast)
9134 {
9135 /* Use cached information if possible. */
9136 if (pDisk->LCHSGeometry.cCylinders != 0)
9137 *pLCHSGeometry = pDisk->LCHSGeometry;
9138 else
9139 rc = VERR_VD_GEOMETRY_NOT_SET;
9140 }
9141 else
9142 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9143 pLCHSGeometry);
9144 } while (0);
9145
9146 if (RT_UNLIKELY(fLockRead))
9147 {
9148 rc2 = vdThreadFinishRead(pDisk);
9149 AssertRC(rc2);
9150 }
9151
9152 LogFlowFunc((": %Rrc (LCHS=%u/%u/%u)\n", rc,
9153 pDisk->LCHSGeometry.cCylinders, pDisk->LCHSGeometry.cHeads,
9154 pDisk->LCHSGeometry.cSectors));
9155 return rc;
9156}
9157
9158/**
9159 * Store virtual disk LCHS geometry in HDD container.
9160 *
9161 * Note that in case of unrecoverable error all images in HDD container will be closed.
9162 *
9163 * @returns VBox status code.
9164 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9165 * @returns VERR_VD_GEOMETRY_NOT_SET if no geometry present in the HDD container.
9166 * @param pDisk Pointer to HDD container.
9167 * @param nImage Image number, counts from 0. 0 is always base image of container.
9168 * @param pLCHSGeometry Where to load LCHS geometry from. Not NULL.
9169 */
9170VBOXDDU_DECL(int) VDSetLCHSGeometry(PVDISK pDisk, unsigned nImage,
9171 PCVDGEOMETRY pLCHSGeometry)
9172{
9173 int rc = VINF_SUCCESS;
9174 int rc2;
9175 bool fLockWrite = false;
9176
9177 LogFlowFunc(("pDisk=%#p nImage=%u pLCHSGeometry=%#p LCHS=%u/%u/%u\n",
9178 pDisk, nImage, pLCHSGeometry, pLCHSGeometry->cCylinders,
9179 pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
9180 do
9181 {
9182 /* sanity check */
9183 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9184 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9185
9186 /* Check arguments. */
9187 AssertMsgBreakStmt( VALID_PTR(pLCHSGeometry)
9188 && pLCHSGeometry->cHeads <= 255
9189 && pLCHSGeometry->cSectors <= 63,
9190 ("pLCHSGeometry=%#p LCHS=%u/%u/%u\n", pLCHSGeometry,
9191 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads,
9192 pLCHSGeometry->cSectors),
9193 rc = VERR_INVALID_PARAMETER);
9194
9195 rc2 = vdThreadStartWrite(pDisk);
9196 AssertRC(rc2);
9197 fLockWrite = true;
9198
9199 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9200 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9201
9202 if (pImage == pDisk->pLast)
9203 {
9204 if ( pLCHSGeometry->cCylinders != pDisk->LCHSGeometry.cCylinders
9205 || pLCHSGeometry->cHeads != pDisk->LCHSGeometry.cHeads
9206 || pLCHSGeometry->cSectors != pDisk->LCHSGeometry.cSectors)
9207 {
9208 /* Only update geometry if it is changed. Avoids similar checks
9209 * in every backend. Most of the time the new geometry is set
9210 * to the previous values, so no need to go through the hassle
9211 * of updating an image which could be opened in read-only mode
9212 * right now. */
9213 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9214 pLCHSGeometry);
9215
9216 /* Cache new geometry values in any case. */
9217 rc2 = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9218 &pDisk->LCHSGeometry);
9219 if (RT_FAILURE(rc2))
9220 {
9221 pDisk->LCHSGeometry.cCylinders = 0;
9222 pDisk->LCHSGeometry.cHeads = 0;
9223 pDisk->LCHSGeometry.cSectors = 0;
9224 }
9225 else
9226 {
9227 /* Make sure the CHS geometry is properly clipped. */
9228 pDisk->LCHSGeometry.cHeads = RT_MIN(pDisk->LCHSGeometry.cHeads, 255);
9229 pDisk->LCHSGeometry.cSectors = RT_MIN(pDisk->LCHSGeometry.cSectors, 63);
9230 }
9231 }
9232 }
9233 else
9234 {
9235 VDGEOMETRY LCHS;
9236 rc = pImage->Backend->pfnGetLCHSGeometry(pImage->pBackendData,
9237 &LCHS);
9238 if ( RT_FAILURE(rc)
9239 || pLCHSGeometry->cCylinders != LCHS.cCylinders
9240 || pLCHSGeometry->cHeads != LCHS.cHeads
9241 || pLCHSGeometry->cSectors != LCHS.cSectors)
9242 {
9243 /* Only update geometry if it is changed. Avoids similar checks
9244 * in every backend. Most of the time the new geometry is set
9245 * to the previous values, so no need to go through the hassle
9246 * of updating an image which could be opened in read-only mode
9247 * right now. */
9248 rc = pImage->Backend->pfnSetLCHSGeometry(pImage->pBackendData,
9249 pLCHSGeometry);
9250 }
9251 }
9252 } while (0);
9253
9254 if (RT_UNLIKELY(fLockWrite))
9255 {
9256 rc2 = vdThreadFinishWrite(pDisk);
9257 AssertRC(rc2);
9258 }
9259
9260 LogFlowFunc(("returns %Rrc\n", rc));
9261 return rc;
9262}
9263
9264/**
9265 * Queries the available regions of an image in the given VD container.
9266 *
9267 * @return VBox status code.
9268 * @retval VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9269 * @retval VERR_NOT_SUPPORTED if the image backend doesn't support region lists.
9270 * @param pDisk Pointer to HDD container.
9271 * @param nImage Image number, counts from 0. 0 is always base image of container.
9272 * @param fFlags Combination of VD_REGION_LIST_F_* flags.
9273 * @param ppRegionList Where to store the pointer to the region list on success, must be freed
9274 * with VDRegionListFree().
9275 */
9276VBOXDDU_DECL(int) VDQueryRegions(PVDISK pDisk, unsigned nImage, uint32_t fFlags,
9277 PPVDREGIONLIST ppRegionList)
9278{
9279 int rc = VINF_SUCCESS;
9280 int rc2;
9281 bool fLockRead = false;
9282
9283 LogFlowFunc(("pDisk=%#p nImage=%u fFlags=%#x ppRegionList=%#p\n",
9284 pDisk, nImage, fFlags, ppRegionList));
9285 do
9286 {
9287 /* sanity check */
9288 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9289 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9290
9291 /* Check arguments. */
9292 AssertMsgBreakStmt(VALID_PTR(ppRegionList),
9293 ("ppRegionList=%#p\n", ppRegionList),
9294 rc = VERR_INVALID_PARAMETER);
9295
9296 rc2 = vdThreadStartRead(pDisk);
9297 AssertRC(rc2);
9298 fLockRead = true;
9299
9300 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9301 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9302
9303 PCVDREGIONLIST pRegionList = NULL;
9304 rc = pImage->Backend->pfnQueryRegions(pImage->pBackendData, &pRegionList);
9305 if (RT_SUCCESS(rc))
9306 {
9307 rc = vdRegionListConv(pRegionList, fFlags, ppRegionList);
9308
9309 AssertPtr(pImage->Backend->pfnRegionListRelease);
9310 pImage->Backend->pfnRegionListRelease(pImage->pBackendData, pRegionList);
9311 }
9312 } while (0);
9313
9314 if (RT_UNLIKELY(fLockRead))
9315 {
9316 rc2 = vdThreadFinishRead(pDisk);
9317 AssertRC(rc2);
9318 }
9319
9320 LogFlowFunc((": %Rrc\n", rc));
9321 return rc;
9322}
9323
9324/**
9325 * Frees a region list previously queried with VDQueryRegions().
9326 *
9327 * @return nothing.
9328 * @param pRegionList The region list to free.
9329 */
9330VBOXDDU_DECL(void) VDRegionListFree(PVDREGIONLIST pRegionList)
9331{
9332 RTMemFree(pRegionList);
9333}
9334
9335/**
9336 * Get version of image in HDD container.
9337 *
9338 * @returns VBox status code.
9339 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9340 * @param pDisk Pointer to HDD container.
9341 * @param nImage Image number, counts from 0. 0 is always base image of container.
9342 * @param puVersion Where to store the image version.
9343 */
9344VBOXDDU_DECL(int) VDGetVersion(PVDISK pDisk, unsigned nImage,
9345 unsigned *puVersion)
9346{
9347 int rc = VINF_SUCCESS;
9348 int rc2;
9349 bool fLockRead = false;
9350
9351 LogFlowFunc(("pDisk=%#p nImage=%u puVersion=%#p\n",
9352 pDisk, nImage, puVersion));
9353 do
9354 {
9355 /* sanity check */
9356 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9357 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9358
9359 /* Check arguments. */
9360 AssertMsgBreakStmt(VALID_PTR(puVersion),
9361 ("puVersion=%#p\n", puVersion),
9362 rc = VERR_INVALID_PARAMETER);
9363
9364 rc2 = vdThreadStartRead(pDisk);
9365 AssertRC(rc2);
9366 fLockRead = true;
9367
9368 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9369 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9370
9371 *puVersion = pImage->Backend->pfnGetVersion(pImage->pBackendData);
9372 } while (0);
9373
9374 if (RT_UNLIKELY(fLockRead))
9375 {
9376 rc2 = vdThreadFinishRead(pDisk);
9377 AssertRC(rc2);
9378 }
9379
9380 LogFlowFunc(("returns %Rrc uVersion=%#x\n", rc, *puVersion));
9381 return rc;
9382}
9383
9384/**
9385 * List the capabilities of image backend in HDD container.
9386 *
9387 * @returns VBox status code.
9388 * @retval VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9389 * @param pDisk Pointer to the HDD container.
9390 * @param nImage Image number, counts from 0. 0 is always base image of container.
9391 * @param pBackendInfo Where to store the backend information.
9392 */
9393VBOXDDU_DECL(int) VDBackendInfoSingle(PVDISK pDisk, unsigned nImage,
9394 PVDBACKENDINFO pBackendInfo)
9395{
9396 int rc = VINF_SUCCESS;
9397 int rc2;
9398 bool fLockRead = false;
9399
9400 LogFlowFunc(("pDisk=%#p nImage=%u pBackendInfo=%#p\n",
9401 pDisk, nImage, pBackendInfo));
9402 do
9403 {
9404 /* sanity check */
9405 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9406 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9407
9408 /* Check arguments. */
9409 AssertMsgBreakStmt(VALID_PTR(pBackendInfo),
9410 ("pBackendInfo=%#p\n", pBackendInfo),
9411 rc = VERR_INVALID_PARAMETER);
9412
9413 rc2 = vdThreadStartRead(pDisk);
9414 AssertRC(rc2);
9415 fLockRead = true;
9416
9417 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9418 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9419
9420 pBackendInfo->pszBackend = pImage->Backend->pszBackendName;
9421 pBackendInfo->uBackendCaps = pImage->Backend->uBackendCaps;
9422 pBackendInfo->paFileExtensions = pImage->Backend->paFileExtensions;
9423 pBackendInfo->paConfigInfo = pImage->Backend->paConfigInfo;
9424 } while (0);
9425
9426 if (RT_UNLIKELY(fLockRead))
9427 {
9428 rc2 = vdThreadFinishRead(pDisk);
9429 AssertRC(rc2);
9430 }
9431
9432 LogFlowFunc(("returns %Rrc\n", rc));
9433 return rc;
9434}
9435
9436/**
9437 * Get flags of image in HDD container.
9438 *
9439 * @returns VBox status code.
9440 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9441 * @param pDisk Pointer to HDD container.
9442 * @param nImage Image number, counts from 0. 0 is always base image of container.
9443 * @param puImageFlags Where to store the image flags.
9444 */
9445VBOXDDU_DECL(int) VDGetImageFlags(PVDISK pDisk, unsigned nImage,
9446 unsigned *puImageFlags)
9447{
9448 int rc = VINF_SUCCESS;
9449 int rc2;
9450 bool fLockRead = false;
9451
9452 LogFlowFunc(("pDisk=%#p nImage=%u puImageFlags=%#p\n",
9453 pDisk, nImage, puImageFlags));
9454 do
9455 {
9456 /* sanity check */
9457 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9458 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9459
9460 /* Check arguments. */
9461 AssertMsgBreakStmt(VALID_PTR(puImageFlags),
9462 ("puImageFlags=%#p\n", puImageFlags),
9463 rc = VERR_INVALID_PARAMETER);
9464
9465 rc2 = vdThreadStartRead(pDisk);
9466 AssertRC(rc2);
9467 fLockRead = true;
9468
9469 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9470 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9471
9472 *puImageFlags = pImage->uImageFlags;
9473 } while (0);
9474
9475 if (RT_UNLIKELY(fLockRead))
9476 {
9477 rc2 = vdThreadFinishRead(pDisk);
9478 AssertRC(rc2);
9479 }
9480
9481 LogFlowFunc(("returns %Rrc uImageFlags=%#x\n", rc, *puImageFlags));
9482 return rc;
9483}
9484
9485/**
9486 * Get open flags of image in HDD container.
9487 *
9488 * @returns VBox status code.
9489 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9490 * @param pDisk Pointer to HDD container.
9491 * @param nImage Image number, counts from 0. 0 is always base image of container.
9492 * @param puOpenFlags Where to store the image open flags.
9493 */
9494VBOXDDU_DECL(int) VDGetOpenFlags(PVDISK pDisk, unsigned nImage,
9495 unsigned *puOpenFlags)
9496{
9497 int rc = VINF_SUCCESS;
9498 int rc2;
9499 bool fLockRead = false;
9500
9501 LogFlowFunc(("pDisk=%#p nImage=%u puOpenFlags=%#p\n",
9502 pDisk, nImage, puOpenFlags));
9503 do
9504 {
9505 /* sanity check */
9506 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9507 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9508
9509 /* Check arguments. */
9510 AssertMsgBreakStmt(VALID_PTR(puOpenFlags),
9511 ("puOpenFlags=%#p\n", puOpenFlags),
9512 rc = VERR_INVALID_PARAMETER);
9513
9514 rc2 = vdThreadStartRead(pDisk);
9515 AssertRC(rc2);
9516 fLockRead = true;
9517
9518 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9519 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9520
9521 *puOpenFlags = pImage->Backend->pfnGetOpenFlags(pImage->pBackendData);
9522 } while (0);
9523
9524 if (RT_UNLIKELY(fLockRead))
9525 {
9526 rc2 = vdThreadFinishRead(pDisk);
9527 AssertRC(rc2);
9528 }
9529
9530 LogFlowFunc(("returns %Rrc uOpenFlags=%#x\n", rc, *puOpenFlags));
9531 return rc;
9532}
9533
9534/**
9535 * Set open flags of image in HDD container.
9536 * This operation may cause file locking changes and/or files being reopened.
9537 * Note that in case of unrecoverable error all images in HDD container will be closed.
9538 *
9539 * @returns VBox status code.
9540 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9541 * @param pDisk Pointer to HDD container.
9542 * @param nImage Image number, counts from 0. 0 is always base image of container.
9543 * @param uOpenFlags Image file open mode, see VD_OPEN_FLAGS_* constants.
9544 */
9545VBOXDDU_DECL(int) VDSetOpenFlags(PVDISK pDisk, unsigned nImage,
9546 unsigned uOpenFlags)
9547{
9548 int rc;
9549 int rc2;
9550 bool fLockWrite = false;
9551
9552 LogFlowFunc(("pDisk=%#p uOpenFlags=%#u\n", pDisk, uOpenFlags));
9553 do
9554 {
9555 /* sanity check */
9556 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9557 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9558
9559 /* Check arguments. */
9560 AssertMsgBreakStmt((uOpenFlags & ~VD_OPEN_FLAGS_MASK) == 0,
9561 ("uOpenFlags=%#x\n", uOpenFlags),
9562 rc = VERR_INVALID_PARAMETER);
9563
9564 rc2 = vdThreadStartWrite(pDisk);
9565 AssertRC(rc2);
9566 fLockWrite = true;
9567
9568 /* Destroy any discard state because the image might be changed to readonly mode. */
9569 rc = vdDiscardStateDestroy(pDisk);
9570 if (RT_FAILURE(rc))
9571 break;
9572
9573 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9574 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9575
9576 rc = pImage->Backend->pfnSetOpenFlags(pImage->pBackendData,
9577 uOpenFlags & ~(VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS));
9578 if (RT_SUCCESS(rc))
9579 pImage->uOpenFlags = uOpenFlags & (VD_OPEN_FLAGS_HONOR_SAME | VD_OPEN_FLAGS_DISCARD | VD_OPEN_FLAGS_IGNORE_FLUSH | VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS);
9580 } while (0);
9581
9582 if (RT_UNLIKELY(fLockWrite))
9583 {
9584 rc2 = vdThreadFinishWrite(pDisk);
9585 AssertRC(rc2);
9586 }
9587
9588 LogFlowFunc(("returns %Rrc\n", rc));
9589 return rc;
9590}
9591
9592/**
9593 * Get base filename of image in HDD container. Some image formats use
9594 * other filenames as well, so don't use this for anything but informational
9595 * purposes.
9596 *
9597 * @returns VBox status code.
9598 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9599 * @returns VERR_BUFFER_OVERFLOW if pszFilename buffer too small to hold filename.
9600 * @param pDisk Pointer to HDD container.
9601 * @param nImage Image number, counts from 0. 0 is always base image of container.
9602 * @param pszFilename Where to store the image file name.
9603 * @param cbFilename Size of buffer pszFilename points to.
9604 */
9605VBOXDDU_DECL(int) VDGetFilename(PVDISK pDisk, unsigned nImage,
9606 char *pszFilename, unsigned cbFilename)
9607{
9608 int rc;
9609 int rc2;
9610 bool fLockRead = false;
9611
9612 LogFlowFunc(("pDisk=%#p nImage=%u pszFilename=%#p cbFilename=%u\n",
9613 pDisk, nImage, pszFilename, cbFilename));
9614 do
9615 {
9616 /* sanity check */
9617 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9618 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9619
9620 /* Check arguments. */
9621 AssertMsgBreakStmt(VALID_PTR(pszFilename) && *pszFilename,
9622 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
9623 rc = VERR_INVALID_PARAMETER);
9624 AssertMsgBreakStmt(cbFilename,
9625 ("cbFilename=%u\n", cbFilename),
9626 rc = VERR_INVALID_PARAMETER);
9627
9628 rc2 = vdThreadStartRead(pDisk);
9629 AssertRC(rc2);
9630 fLockRead = true;
9631
9632 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9633 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9634
9635 size_t cb = strlen(pImage->pszFilename);
9636 if (cb <= cbFilename)
9637 {
9638 strcpy(pszFilename, pImage->pszFilename);
9639 rc = VINF_SUCCESS;
9640 }
9641 else
9642 {
9643 strncpy(pszFilename, pImage->pszFilename, cbFilename - 1);
9644 pszFilename[cbFilename - 1] = '\0';
9645 rc = VERR_BUFFER_OVERFLOW;
9646 }
9647 } while (0);
9648
9649 if (RT_UNLIKELY(fLockRead))
9650 {
9651 rc2 = vdThreadFinishRead(pDisk);
9652 AssertRC(rc2);
9653 }
9654
9655 LogFlowFunc(("returns %Rrc, pszFilename=\"%s\"\n", rc, pszFilename));
9656 return rc;
9657}
9658
9659/**
9660 * Get the comment line of image in HDD container.
9661 *
9662 * @returns VBox status code.
9663 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9664 * @returns VERR_BUFFER_OVERFLOW if pszComment buffer too small to hold comment text.
9665 * @param pDisk Pointer to HDD container.
9666 * @param nImage Image number, counts from 0. 0 is always base image of container.
9667 * @param pszComment Where to store the comment string of image. NULL is ok.
9668 * @param cbComment The size of pszComment buffer. 0 is ok.
9669 */
9670VBOXDDU_DECL(int) VDGetComment(PVDISK pDisk, unsigned nImage,
9671 char *pszComment, unsigned cbComment)
9672{
9673 int rc;
9674 int rc2;
9675 bool fLockRead = false;
9676
9677 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p cbComment=%u\n",
9678 pDisk, nImage, pszComment, cbComment));
9679 do
9680 {
9681 /* sanity check */
9682 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9683 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9684
9685 /* Check arguments. */
9686 AssertMsgBreakStmt(VALID_PTR(pszComment),
9687 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9688 rc = VERR_INVALID_PARAMETER);
9689 AssertMsgBreakStmt(cbComment,
9690 ("cbComment=%u\n", cbComment),
9691 rc = VERR_INVALID_PARAMETER);
9692
9693 rc2 = vdThreadStartRead(pDisk);
9694 AssertRC(rc2);
9695 fLockRead = true;
9696
9697 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9698 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9699
9700 rc = pImage->Backend->pfnGetComment(pImage->pBackendData, pszComment,
9701 cbComment);
9702 } while (0);
9703
9704 if (RT_UNLIKELY(fLockRead))
9705 {
9706 rc2 = vdThreadFinishRead(pDisk);
9707 AssertRC(rc2);
9708 }
9709
9710 LogFlowFunc(("returns %Rrc, pszComment=\"%s\"\n", rc, pszComment));
9711 return rc;
9712}
9713
9714/**
9715 * Changes the comment line of image in HDD container.
9716 *
9717 * @returns VBox status code.
9718 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9719 * @param pDisk Pointer to HDD container.
9720 * @param nImage Image number, counts from 0. 0 is always base image of container.
9721 * @param pszComment New comment string (UTF-8). NULL is allowed to reset the comment.
9722 */
9723VBOXDDU_DECL(int) VDSetComment(PVDISK pDisk, unsigned nImage,
9724 const char *pszComment)
9725{
9726 int rc;
9727 int rc2;
9728 bool fLockWrite = false;
9729
9730 LogFlowFunc(("pDisk=%#p nImage=%u pszComment=%#p \"%s\"\n",
9731 pDisk, nImage, pszComment, pszComment));
9732 do
9733 {
9734 /* sanity check */
9735 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9736 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9737
9738 /* Check arguments. */
9739 AssertMsgBreakStmt(VALID_PTR(pszComment) || pszComment == NULL,
9740 ("pszComment=%#p \"%s\"\n", pszComment, pszComment),
9741 rc = VERR_INVALID_PARAMETER);
9742
9743 rc2 = vdThreadStartWrite(pDisk);
9744 AssertRC(rc2);
9745 fLockWrite = true;
9746
9747 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9748 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9749
9750 rc = pImage->Backend->pfnSetComment(pImage->pBackendData, pszComment);
9751 } while (0);
9752
9753 if (RT_UNLIKELY(fLockWrite))
9754 {
9755 rc2 = vdThreadFinishWrite(pDisk);
9756 AssertRC(rc2);
9757 }
9758
9759 LogFlowFunc(("returns %Rrc\n", rc));
9760 return rc;
9761}
9762
9763
9764/**
9765 * Get UUID of image in HDD container.
9766 *
9767 * @returns VBox status code.
9768 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9769 * @param pDisk Pointer to HDD container.
9770 * @param nImage Image number, counts from 0. 0 is always base image of container.
9771 * @param pUuid Where to store the image creation UUID.
9772 */
9773VBOXDDU_DECL(int) VDGetUuid(PVDISK pDisk, unsigned nImage, PRTUUID pUuid)
9774{
9775 int rc;
9776 int rc2;
9777 bool fLockRead = false;
9778
9779 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9780 do
9781 {
9782 /* sanity check */
9783 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9784 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9785
9786 /* Check arguments. */
9787 AssertMsgBreakStmt(VALID_PTR(pUuid),
9788 ("pUuid=%#p\n", pUuid),
9789 rc = VERR_INVALID_PARAMETER);
9790
9791 rc2 = vdThreadStartRead(pDisk);
9792 AssertRC(rc2);
9793 fLockRead = true;
9794
9795 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9796 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9797
9798 rc = pImage->Backend->pfnGetUuid(pImage->pBackendData, pUuid);
9799 } while (0);
9800
9801 if (RT_UNLIKELY(fLockRead))
9802 {
9803 rc2 = vdThreadFinishRead(pDisk);
9804 AssertRC(rc2);
9805 }
9806
9807 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9808 return rc;
9809}
9810
9811/**
9812 * Set the image's UUID. Should not be used by normal applications.
9813 *
9814 * @returns VBox status code.
9815 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9816 * @param pDisk Pointer to HDD container.
9817 * @param nImage Image number, counts from 0. 0 is always base image of container.
9818 * @param pUuid New UUID of the image. If NULL, a new UUID is created.
9819 */
9820VBOXDDU_DECL(int) VDSetUuid(PVDISK pDisk, unsigned nImage, PCRTUUID pUuid)
9821{
9822 int rc;
9823 int rc2;
9824 bool fLockWrite = false;
9825
9826 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9827 pDisk, nImage, pUuid, pUuid));
9828 do
9829 {
9830 /* sanity check */
9831 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9832 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9833
9834 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9835 ("pUuid=%#p\n", pUuid),
9836 rc = VERR_INVALID_PARAMETER);
9837
9838 rc2 = vdThreadStartWrite(pDisk);
9839 AssertRC(rc2);
9840 fLockWrite = true;
9841
9842 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9843 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9844
9845 RTUUID Uuid;
9846 if (!pUuid)
9847 {
9848 RTUuidCreate(&Uuid);
9849 pUuid = &Uuid;
9850 }
9851 rc = pImage->Backend->pfnSetUuid(pImage->pBackendData, pUuid);
9852 } while (0);
9853
9854 if (RT_UNLIKELY(fLockWrite))
9855 {
9856 rc2 = vdThreadFinishWrite(pDisk);
9857 AssertRC(rc2);
9858 }
9859
9860 LogFlowFunc(("returns %Rrc\n", rc));
9861 return rc;
9862}
9863
9864/**
9865 * Get last modification UUID of image in HDD container.
9866 *
9867 * @returns VBox status code.
9868 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9869 * @param pDisk Pointer to HDD container.
9870 * @param nImage Image number, counts from 0. 0 is always base image of container.
9871 * @param pUuid Where to store the image modification UUID.
9872 */
9873VBOXDDU_DECL(int) VDGetModificationUuid(PVDISK pDisk, unsigned nImage, PRTUUID pUuid)
9874{
9875 int rc = VINF_SUCCESS;
9876 int rc2;
9877 bool fLockRead = false;
9878
9879 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9880 do
9881 {
9882 /* sanity check */
9883 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9884 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9885
9886 /* Check arguments. */
9887 AssertMsgBreakStmt(VALID_PTR(pUuid),
9888 ("pUuid=%#p\n", pUuid),
9889 rc = VERR_INVALID_PARAMETER);
9890
9891 rc2 = vdThreadStartRead(pDisk);
9892 AssertRC(rc2);
9893 fLockRead = true;
9894
9895 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9896 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9897
9898 rc = pImage->Backend->pfnGetModificationUuid(pImage->pBackendData,
9899 pUuid);
9900 } while (0);
9901
9902 if (RT_UNLIKELY(fLockRead))
9903 {
9904 rc2 = vdThreadFinishRead(pDisk);
9905 AssertRC(rc2);
9906 }
9907
9908 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
9909 return rc;
9910}
9911
9912/**
9913 * Set the image's last modification UUID. Should not be used by normal applications.
9914 *
9915 * @returns VBox status code.
9916 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9917 * @param pDisk Pointer to HDD container.
9918 * @param nImage Image number, counts from 0. 0 is always base image of container.
9919 * @param pUuid New modification UUID of the image. If NULL, a new UUID is created.
9920 */
9921VBOXDDU_DECL(int) VDSetModificationUuid(PVDISK pDisk, unsigned nImage, PCRTUUID pUuid)
9922{
9923 int rc;
9924 int rc2;
9925 bool fLockWrite = false;
9926
9927 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
9928 pDisk, nImage, pUuid, pUuid));
9929 do
9930 {
9931 /* sanity check */
9932 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9933 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9934
9935 /* Check arguments. */
9936 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
9937 ("pUuid=%#p\n", pUuid),
9938 rc = VERR_INVALID_PARAMETER);
9939
9940 rc2 = vdThreadStartWrite(pDisk);
9941 AssertRC(rc2);
9942 fLockWrite = true;
9943
9944 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
9945 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
9946
9947 RTUUID Uuid;
9948 if (!pUuid)
9949 {
9950 RTUuidCreate(&Uuid);
9951 pUuid = &Uuid;
9952 }
9953 rc = pImage->Backend->pfnSetModificationUuid(pImage->pBackendData,
9954 pUuid);
9955 } while (0);
9956
9957 if (RT_UNLIKELY(fLockWrite))
9958 {
9959 rc2 = vdThreadFinishWrite(pDisk);
9960 AssertRC(rc2);
9961 }
9962
9963 LogFlowFunc(("returns %Rrc\n", rc));
9964 return rc;
9965}
9966
9967/**
9968 * Get parent UUID of image in HDD container.
9969 *
9970 * @returns VBox status code.
9971 * @returns VERR_VD_IMAGE_NOT_FOUND if image with specified number was not opened.
9972 * @param pDisk Pointer to HDD container.
9973 * @param nImage Image number, counts from 0. 0 is always base image of container.
9974 * @param pUuid Where to store the parent image UUID.
9975 */
9976VBOXDDU_DECL(int) VDGetParentUuid(PVDISK pDisk, unsigned nImage,
9977 PRTUUID pUuid)
9978{
9979 int rc = VINF_SUCCESS;
9980 int rc2;
9981 bool fLockRead = false;
9982
9983 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p\n", pDisk, nImage, pUuid));
9984 do
9985 {
9986 /* sanity check */
9987 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
9988 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
9989
9990 /* Check arguments. */
9991 AssertMsgBreakStmt(VALID_PTR(pUuid),
9992 ("pUuid=%#p\n", pUuid),
9993 rc = VERR_INVALID_PARAMETER);
9994
9995 rc2 = vdThreadStartRead(pDisk);
9996 AssertRC(rc2);
9997 fLockRead = true;
9998
9999 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
10000 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
10001
10002 rc = pImage->Backend->pfnGetParentUuid(pImage->pBackendData, pUuid);
10003 } while (0);
10004
10005 if (RT_UNLIKELY(fLockRead))
10006 {
10007 rc2 = vdThreadFinishRead(pDisk);
10008 AssertRC(rc2);
10009 }
10010
10011 LogFlowFunc(("returns %Rrc, Uuid={%RTuuid}\n", rc, pUuid));
10012 return rc;
10013}
10014
10015/**
10016 * Set the image's parent UUID. Should not be used by normal applications.
10017 *
10018 * @returns VBox status code.
10019 * @param pDisk Pointer to HDD container.
10020 * @param nImage Image number, counts from 0. 0 is always base image of container.
10021 * @param pUuid New parent UUID of the image. If NULL, a new UUID is created.
10022 */
10023VBOXDDU_DECL(int) VDSetParentUuid(PVDISK pDisk, unsigned nImage,
10024 PCRTUUID pUuid)
10025{
10026 int rc;
10027 int rc2;
10028 bool fLockWrite = false;
10029
10030 LogFlowFunc(("pDisk=%#p nImage=%u pUuid=%#p {%RTuuid}\n",
10031 pDisk, nImage, pUuid, pUuid));
10032 do
10033 {
10034 /* sanity check */
10035 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10036 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10037
10038 /* Check arguments. */
10039 AssertMsgBreakStmt(VALID_PTR(pUuid) || pUuid == NULL,
10040 ("pUuid=%#p\n", pUuid),
10041 rc = VERR_INVALID_PARAMETER);
10042
10043 rc2 = vdThreadStartWrite(pDisk);
10044 AssertRC(rc2);
10045 fLockWrite = true;
10046
10047 PVDIMAGE pImage = vdGetImageByNumber(pDisk, nImage);
10048 AssertPtrBreakStmt(pImage, rc = VERR_VD_IMAGE_NOT_FOUND);
10049
10050 RTUUID Uuid;
10051 if (!pUuid)
10052 {
10053 RTUuidCreate(&Uuid);
10054 pUuid = &Uuid;
10055 }
10056 rc = pImage->Backend->pfnSetParentUuid(pImage->pBackendData, pUuid);
10057 } while (0);
10058
10059 if (RT_UNLIKELY(fLockWrite))
10060 {
10061 rc2 = vdThreadFinishWrite(pDisk);
10062 AssertRC(rc2);
10063 }
10064
10065 LogFlowFunc(("returns %Rrc\n", rc));
10066 return rc;
10067}
10068
10069
10070/**
10071 * Debug helper - dumps all opened images in HDD container into the log file.
10072 *
10073 * @param pDisk Pointer to HDD container.
10074 */
10075VBOXDDU_DECL(void) VDDumpImages(PVDISK pDisk)
10076{
10077 int rc2;
10078 bool fLockRead = false;
10079
10080 do
10081 {
10082 /* sanity check */
10083 AssertPtrBreak(pDisk);
10084 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10085
10086 if (!pDisk->pInterfaceError || !VALID_PTR(pDisk->pInterfaceError->pfnMessage))
10087 pDisk->pInterfaceError->pfnMessage = vdLogMessage;
10088
10089 rc2 = vdThreadStartRead(pDisk);
10090 AssertRC(rc2);
10091 fLockRead = true;
10092
10093 vdMessageWrapper(pDisk, "--- Dumping VD Disk, Images=%u\n", pDisk->cImages);
10094 for (PVDIMAGE pImage = pDisk->pBase; pImage; pImage = pImage->pNext)
10095 {
10096 vdMessageWrapper(pDisk, "Dumping VD image \"%s\" (Backend=%s)\n",
10097 pImage->pszFilename, pImage->Backend->pszBackendName);
10098 pImage->Backend->pfnDump(pImage->pBackendData);
10099 }
10100 } while (0);
10101
10102 if (RT_UNLIKELY(fLockRead))
10103 {
10104 rc2 = vdThreadFinishRead(pDisk);
10105 AssertRC(rc2);
10106 }
10107}
10108
10109
10110VBOXDDU_DECL(int) VDDiscardRanges(PVDISK pDisk, PCRTRANGE paRanges, unsigned cRanges)
10111{
10112 int rc;
10113 int rc2;
10114 bool fLockWrite = false;
10115
10116 LogFlowFunc(("pDisk=%#p paRanges=%#p cRanges=%u\n",
10117 pDisk, paRanges, cRanges));
10118 do
10119 {
10120 /* sanity check */
10121 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10122 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10123
10124 /* Check arguments. */
10125 AssertMsgBreakStmt(cRanges,
10126 ("cRanges=%u\n", cRanges),
10127 rc = VERR_INVALID_PARAMETER);
10128 AssertMsgBreakStmt(VALID_PTR(paRanges),
10129 ("paRanges=%#p\n", paRanges),
10130 rc = VERR_INVALID_PARAMETER);
10131
10132 rc2 = vdThreadStartWrite(pDisk);
10133 AssertRC(rc2);
10134 fLockWrite = true;
10135
10136 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10137
10138 AssertMsgBreakStmt(pDisk->pLast->uOpenFlags & VD_OPEN_FLAGS_DISCARD,
10139 ("Discarding not supported\n"),
10140 rc = VERR_NOT_SUPPORTED);
10141
10142 VDIOCTX IoCtx;
10143 RTSEMEVENT hEventComplete = NIL_RTSEMEVENT;
10144
10145 rc = RTSemEventCreate(&hEventComplete);
10146 if (RT_FAILURE(rc))
10147 break;
10148
10149 vdIoCtxDiscardInit(&IoCtx, pDisk, paRanges, cRanges,
10150 vdIoCtxSyncComplete, pDisk, hEventComplete, NULL,
10151 vdDiscardHelperAsync, VDIOCTX_FLAGS_SYNC | VDIOCTX_FLAGS_DONT_FREE);
10152 rc = vdIoCtxProcessSync(&IoCtx, hEventComplete);
10153
10154 RTSemEventDestroy(hEventComplete);
10155 } while (0);
10156
10157 if (RT_UNLIKELY(fLockWrite))
10158 {
10159 rc2 = vdThreadFinishWrite(pDisk);
10160 AssertRC(rc2);
10161 }
10162
10163 LogFlowFunc(("returns %Rrc\n", rc));
10164 return rc;
10165}
10166
10167
10168VBOXDDU_DECL(int) VDAsyncRead(PVDISK pDisk, uint64_t uOffset, size_t cbRead,
10169 PCRTSGBUF pcSgBuf,
10170 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10171 void *pvUser1, void *pvUser2)
10172{
10173 int rc = VERR_VD_BLOCK_FREE;
10174 int rc2;
10175 bool fLockRead = false;
10176 PVDIOCTX pIoCtx = NULL;
10177
10178 LogFlowFunc(("pDisk=%#p uOffset=%llu pcSgBuf=%#p cbRead=%zu pvUser1=%#p pvUser2=%#p\n",
10179 pDisk, uOffset, pcSgBuf, cbRead, pvUser1, pvUser2));
10180
10181 do
10182 {
10183 /* sanity check */
10184 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10185 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10186
10187 /* Check arguments. */
10188 AssertMsgBreakStmt(cbRead,
10189 ("cbRead=%zu\n", cbRead),
10190 rc = VERR_INVALID_PARAMETER);
10191 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
10192 ("pcSgBuf=%#p\n", pcSgBuf),
10193 rc = VERR_INVALID_PARAMETER);
10194
10195 rc2 = vdThreadStartRead(pDisk);
10196 AssertRC(rc2);
10197 fLockRead = true;
10198
10199 AssertMsgBreakStmt(uOffset + cbRead <= pDisk->cbSize,
10200 ("uOffset=%llu cbRead=%zu pDisk->cbSize=%llu\n",
10201 uOffset, cbRead, pDisk->cbSize),
10202 rc = VERR_INVALID_PARAMETER);
10203 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10204
10205 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_READ, uOffset,
10206 cbRead, pDisk->pLast, pcSgBuf,
10207 pfnComplete, pvUser1, pvUser2,
10208 NULL, vdReadHelperAsync,
10209 VDIOCTX_FLAGS_ZERO_FREE_BLOCKS);
10210 if (!pIoCtx)
10211 {
10212 rc = VERR_NO_MEMORY;
10213 break;
10214 }
10215
10216 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10217 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10218 {
10219 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10220 vdIoCtxFree(pDisk, pIoCtx);
10221 else
10222 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10223 }
10224 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10225 vdIoCtxFree(pDisk, pIoCtx);
10226
10227 } while (0);
10228
10229 if (RT_UNLIKELY(fLockRead) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10230 {
10231 rc2 = vdThreadFinishRead(pDisk);
10232 AssertRC(rc2);
10233 }
10234
10235 LogFlowFunc(("returns %Rrc\n", rc));
10236 return rc;
10237}
10238
10239
10240VBOXDDU_DECL(int) VDAsyncWrite(PVDISK pDisk, uint64_t uOffset, size_t cbWrite,
10241 PCRTSGBUF pcSgBuf,
10242 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10243 void *pvUser1, void *pvUser2)
10244{
10245 int rc;
10246 int rc2;
10247 bool fLockWrite = false;
10248 PVDIOCTX pIoCtx = NULL;
10249
10250 LogFlowFunc(("pDisk=%#p uOffset=%llu cSgBuf=%#p cbWrite=%zu pvUser1=%#p pvUser2=%#p\n",
10251 pDisk, uOffset, pcSgBuf, cbWrite, pvUser1, pvUser2));
10252 do
10253 {
10254 /* sanity check */
10255 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10256 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10257
10258 /* Check arguments. */
10259 AssertMsgBreakStmt(cbWrite,
10260 ("cbWrite=%zu\n", cbWrite),
10261 rc = VERR_INVALID_PARAMETER);
10262 AssertMsgBreakStmt(VALID_PTR(pcSgBuf),
10263 ("pcSgBuf=%#p\n", pcSgBuf),
10264 rc = VERR_INVALID_PARAMETER);
10265
10266 rc2 = vdThreadStartWrite(pDisk);
10267 AssertRC(rc2);
10268 fLockWrite = true;
10269
10270 AssertMsgBreakStmt(uOffset + cbWrite <= pDisk->cbSize,
10271 ("uOffset=%llu cbWrite=%zu pDisk->cbSize=%llu\n",
10272 uOffset, cbWrite, pDisk->cbSize),
10273 rc = VERR_INVALID_PARAMETER);
10274 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10275
10276 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_WRITE, uOffset,
10277 cbWrite, pDisk->pLast, pcSgBuf,
10278 pfnComplete, pvUser1, pvUser2,
10279 NULL, vdWriteHelperAsync,
10280 VDIOCTX_FLAGS_DEFAULT);
10281 if (!pIoCtx)
10282 {
10283 rc = VERR_NO_MEMORY;
10284 break;
10285 }
10286
10287 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10288 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10289 {
10290 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10291 vdIoCtxFree(pDisk, pIoCtx);
10292 else
10293 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10294 }
10295 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10296 vdIoCtxFree(pDisk, pIoCtx);
10297 } while (0);
10298
10299 if (RT_UNLIKELY(fLockWrite) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10300 {
10301 rc2 = vdThreadFinishWrite(pDisk);
10302 AssertRC(rc2);
10303 }
10304
10305 LogFlowFunc(("returns %Rrc\n", rc));
10306 return rc;
10307}
10308
10309
10310VBOXDDU_DECL(int) VDAsyncFlush(PVDISK pDisk, PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10311 void *pvUser1, void *pvUser2)
10312{
10313 int rc;
10314 int rc2;
10315 bool fLockWrite = false;
10316 PVDIOCTX pIoCtx = NULL;
10317
10318 LogFlowFunc(("pDisk=%#p\n", pDisk));
10319
10320 do
10321 {
10322 /* sanity check */
10323 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10324 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10325
10326 rc2 = vdThreadStartWrite(pDisk);
10327 AssertRC(rc2);
10328 fLockWrite = true;
10329
10330 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10331
10332 pIoCtx = vdIoCtxRootAlloc(pDisk, VDIOCTXTXDIR_FLUSH, 0,
10333 0, pDisk->pLast, NULL,
10334 pfnComplete, pvUser1, pvUser2,
10335 NULL, vdFlushHelperAsync,
10336 VDIOCTX_FLAGS_DEFAULT);
10337 if (!pIoCtx)
10338 {
10339 rc = VERR_NO_MEMORY;
10340 break;
10341 }
10342
10343 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10344 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10345 {
10346 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10347 vdIoCtxFree(pDisk, pIoCtx);
10348 else
10349 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10350 }
10351 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10352 vdIoCtxFree(pDisk, pIoCtx);
10353 } while (0);
10354
10355 if (RT_UNLIKELY(fLockWrite) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10356 {
10357 rc2 = vdThreadFinishWrite(pDisk);
10358 AssertRC(rc2);
10359 }
10360
10361 LogFlowFunc(("returns %Rrc\n", rc));
10362 return rc;
10363}
10364
10365VBOXDDU_DECL(int) VDAsyncDiscardRanges(PVDISK pDisk, PCRTRANGE paRanges, unsigned cRanges,
10366 PFNVDASYNCTRANSFERCOMPLETE pfnComplete,
10367 void *pvUser1, void *pvUser2)
10368{
10369 int rc;
10370 int rc2;
10371 bool fLockWrite = false;
10372 PVDIOCTX pIoCtx = NULL;
10373
10374 LogFlowFunc(("pDisk=%#p\n", pDisk));
10375
10376 do
10377 {
10378 /* sanity check */
10379 AssertPtrBreakStmt(pDisk, rc = VERR_INVALID_PARAMETER);
10380 AssertMsg(pDisk->u32Signature == VDISK_SIGNATURE, ("u32Signature=%08x\n", pDisk->u32Signature));
10381
10382 rc2 = vdThreadStartWrite(pDisk);
10383 AssertRC(rc2);
10384 fLockWrite = true;
10385
10386 AssertPtrBreakStmt(pDisk->pLast, rc = VERR_VD_NOT_OPENED);
10387
10388 pIoCtx = vdIoCtxDiscardAlloc(pDisk, paRanges, cRanges,
10389 pfnComplete, pvUser1, pvUser2, NULL,
10390 vdDiscardHelperAsync,
10391 VDIOCTX_FLAGS_DEFAULT);
10392 if (!pIoCtx)
10393 {
10394 rc = VERR_NO_MEMORY;
10395 break;
10396 }
10397
10398 rc = vdIoCtxProcessTryLockDefer(pIoCtx);
10399 if (rc == VINF_VD_ASYNC_IO_FINISHED)
10400 {
10401 if (ASMAtomicCmpXchgBool(&pIoCtx->fComplete, true, false))
10402 vdIoCtxFree(pDisk, pIoCtx);
10403 else
10404 rc = VERR_VD_ASYNC_IO_IN_PROGRESS; /* Let the other handler complete the request. */
10405 }
10406 else if (rc != VERR_VD_ASYNC_IO_IN_PROGRESS) /* Another error */
10407 vdIoCtxFree(pDisk, pIoCtx);
10408 } while (0);
10409
10410 if (RT_UNLIKELY(fLockWrite) && (rc != VERR_VD_ASYNC_IO_IN_PROGRESS))
10411 {
10412 rc2 = vdThreadFinishWrite(pDisk);
10413 AssertRC(rc2);
10414 }
10415
10416 LogFlowFunc(("returns %Rrc\n", rc));
10417 return rc;
10418}
10419
10420VBOXDDU_DECL(int) VDRepair(PVDINTERFACE pVDIfsDisk, PVDINTERFACE pVDIfsImage,
10421 const char *pszFilename, const char *pszBackend,
10422 uint32_t fFlags)
10423{
10424 int rc = VERR_NOT_SUPPORTED;
10425 PCVDIMAGEBACKEND pBackend = NULL;
10426 VDINTERFACEIOINT VDIfIoInt;
10427 VDINTERFACEIO VDIfIoFallback;
10428 PVDINTERFACEIO pInterfaceIo;
10429
10430 LogFlowFunc(("pszFilename=\"%s\"\n", pszFilename));
10431 /* Check arguments. */
10432 AssertMsgReturn(VALID_PTR(pszFilename) && *pszFilename,
10433 ("pszFilename=%#p \"%s\"\n", pszFilename, pszFilename),
10434 VERR_INVALID_PARAMETER);
10435 AssertMsgReturn(VALID_PTR(pszBackend),
10436 ("pszBackend=%#p\n", pszBackend),
10437 VERR_INVALID_PARAMETER);
10438 AssertMsgReturn((fFlags & ~VD_REPAIR_FLAGS_MASK) == 0,
10439 ("fFlags=%#x\n", fFlags),
10440 VERR_INVALID_PARAMETER);
10441
10442 pInterfaceIo = VDIfIoGet(pVDIfsImage);
10443 if (!pInterfaceIo)
10444 {
10445 /*
10446 * Caller doesn't provide an I/O interface, create our own using the
10447 * native file API.
10448 */
10449 vdIfIoFallbackCallbacksSetup(&VDIfIoFallback);
10450 pInterfaceIo = &VDIfIoFallback;
10451 }
10452
10453 /* Set up the internal I/O interface. */
10454 AssertReturn(!VDIfIoIntGet(pVDIfsImage), VERR_INVALID_PARAMETER);
10455 VDIfIoInt.pfnOpen = vdIOIntOpenLimited;
10456 VDIfIoInt.pfnClose = vdIOIntCloseLimited;
10457 VDIfIoInt.pfnDelete = vdIOIntDeleteLimited;
10458 VDIfIoInt.pfnMove = vdIOIntMoveLimited;
10459 VDIfIoInt.pfnGetFreeSpace = vdIOIntGetFreeSpaceLimited;
10460 VDIfIoInt.pfnGetModificationTime = vdIOIntGetModificationTimeLimited;
10461 VDIfIoInt.pfnGetSize = vdIOIntGetSizeLimited;
10462 VDIfIoInt.pfnSetSize = vdIOIntSetSizeLimited;
10463 VDIfIoInt.pfnReadUser = vdIOIntReadUserLimited;
10464 VDIfIoInt.pfnWriteUser = vdIOIntWriteUserLimited;
10465 VDIfIoInt.pfnReadMeta = vdIOIntReadMetaLimited;
10466 VDIfIoInt.pfnWriteMeta = vdIOIntWriteMetaLimited;
10467 VDIfIoInt.pfnFlush = vdIOIntFlushLimited;
10468 rc = VDInterfaceAdd(&VDIfIoInt.Core, "VD_IOINT", VDINTERFACETYPE_IOINT,
10469 pInterfaceIo, sizeof(VDINTERFACEIOINT), &pVDIfsImage);
10470 AssertRC(rc);
10471
10472 rc = vdFindImageBackend(pszBackend, &pBackend);
10473 if (RT_SUCCESS(rc))
10474 {
10475 if (pBackend->pfnRepair)
10476 rc = pBackend->pfnRepair(pszFilename, pVDIfsDisk, pVDIfsImage, fFlags);
10477 else
10478 rc = VERR_VD_IMAGE_REPAIR_NOT_SUPPORTED;
10479 }
10480
10481 LogFlowFunc(("returns %Rrc\n", rc));
10482 return rc;
10483}
10484
10485
10486/*
10487 * generic plugin functions
10488 */
10489
10490/**
10491 * @interface_method_impl{VDIMAGEBACKEND,pfnComposeLocation}
10492 */
10493DECLCALLBACK(int) genericFileComposeLocation(PVDINTERFACE pConfig, char **pszLocation)
10494{
10495 RT_NOREF1(pConfig);
10496 *pszLocation = NULL;
10497 return VINF_SUCCESS;
10498}
10499
10500/**
10501 * @interface_method_impl{VDIMAGEBACKEND,pfnComposeName}
10502 */
10503DECLCALLBACK(int) genericFileComposeName(PVDINTERFACE pConfig, char **pszName)
10504{
10505 RT_NOREF1(pConfig);
10506 *pszName = NULL;
10507 return VINF_SUCCESS;
10508}
10509
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette