VirtualBox

source: vbox/trunk/src/VBox/Devices/Storage/DrvVD.cpp@ 64623

Last change on this file since 64623 was 64407, checked in by vboxsync, 8 years ago

Devices/Storage: Add callback to query the actual transfer size of an I/O request if PDMIMEDIAEX is used, useful to calculate the amount of data transferred for requests where the transfer size can be different from the guest buffer size (e.g. SCSI)

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 195.3 KB
Line 
1/* $Id: DrvVD.cpp 64407 2016-10-25 11:53:00Z vboxsync $ */
2/** @file
3 * DrvVD - Generic VBox disk media driver.
4 */
5
6/*
7 * Copyright (C) 2006-2016 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_DRV_VD
23#include <VBox/vd.h>
24#include <VBox/vmm/pdmdrv.h>
25#include <VBox/vmm/pdmstorageifs.h>
26#include <VBox/vmm/pdmasynccompletion.h>
27#include <VBox/vmm/pdmblkcache.h>
28#include <VBox/vmm/ssm.h>
29#include <iprt/asm.h>
30#include <iprt/alloc.h>
31#include <iprt/assert.h>
32#include <iprt/uuid.h>
33#include <iprt/file.h>
34#include <iprt/string.h>
35#include <iprt/tcp.h>
36#include <iprt/semaphore.h>
37#include <iprt/sg.h>
38#include <iprt/poll.h>
39#include <iprt/pipe.h>
40#include <iprt/system.h>
41#include <iprt/memsafer.h>
42#include <iprt/memcache.h>
43#include <iprt/list.h>
44
45#ifdef VBOX_WITH_INIP
46/* All lwip header files are not C++ safe. So hack around this. */
47RT_C_DECLS_BEGIN
48#include <lwip/opt.h>
49#include <lwip/inet.h>
50#include <lwip/tcp.h>
51#include <lwip/sockets.h>
52# if LWIP_IPV6
53# include <lwip/inet6.h>
54# endif
55RT_C_DECLS_END
56#endif /* VBOX_WITH_INIP */
57
58#include "HBDMgmt.h"
59#include "IOBufMgmt.h"
60
61#include "VBoxDD.h"
62
63#ifdef VBOX_WITH_INIP
64/* Small hack to get at lwIP initialized status */
65extern bool DevINIPConfigured(void);
66#endif /* VBOX_WITH_INIP */
67
68
69/** @def VBOX_PERIODIC_FLUSH
70 * Enable support for periodically flushing the VDI to disk. This may prove
71 * useful for those nasty problems with the ultra-slow host filesystems.
72 * If this is enabled, it can be configured via the CFGM key
73 * "VBoxInternal/Devices/piix3ide/0/LUN#<x>/Config/FlushInterval". @verbatim<x>@endverbatim
74 * must be replaced with the correct LUN number of the disk that should
75 * do the periodic flushes. The value of the key is the number of bytes
76 * written between flushes. A value of 0 (the default) denotes no flushes. */
77#define VBOX_PERIODIC_FLUSH
78
79/** @def VBOX_IGNORE_FLUSH
80 * Enable support for ignoring VDI flush requests. This can be useful for
81 * filesystems that show bad guest IDE write performance (especially with
82 * Windows guests). NOTE that this does not disable the flushes caused by
83 * the periodic flush cache feature above.
84 * If this feature is enabled, it can be configured via the CFGM key
85 * "VBoxInternal/Devices/piix3ide/0/LUN#<x>/Config/IgnoreFlush". @verbatim<x>@endverbatim
86 * must be replaced with the correct LUN number of the disk that should
87 * ignore flush requests. The value of the key is a boolean. The default
88 * is to ignore flushes, i.e. true. */
89#define VBOX_IGNORE_FLUSH
90
91
92/*********************************************************************************************************************************
93* Defined types, constants and macros *
94*********************************************************************************************************************************/
95
96/** Converts a pointer to VBOXDISK::IMedia to a PVBOXDISK. */
97#define PDMIMEDIA_2_VBOXDISK(pInterface) \
98 ( (PVBOXDISK)((uintptr_t)pInterface - RT_OFFSETOF(VBOXDISK, IMedia)) )
99
100/** Saved state version of an I/O request .*/
101#define DRVVD_IOREQ_SAVED_STATE_VERSION UINT32_C(1)
102/** Maximum number of request errors in the release log before muting. */
103#define DRVVD_MAX_LOG_REL_ERRORS 100
104
105/** Forward declaration for the dis kcontainer. */
106typedef struct VBOXDISK *PVBOXDISK;
107
108/**
109 * VBox disk container, image information, private part.
110 */
111
112typedef struct VBOXIMAGE
113{
114 /** Pointer to next image. */
115 struct VBOXIMAGE *pNext;
116 /** Pointer to list of VD interfaces. Per-image. */
117 PVDINTERFACE pVDIfsImage;
118 /** Configuration information interface. */
119 VDINTERFACECONFIG VDIfConfig;
120 /** TCP network stack interface. */
121 VDINTERFACETCPNET VDIfTcpNet;
122 /** I/O interface. */
123 VDINTERFACEIO VDIfIo;
124} VBOXIMAGE, *PVBOXIMAGE;
125
126/**
127 * Storage backend data.
128 */
129typedef struct DRVVDSTORAGEBACKEND
130{
131 /** PDM async completion end point. */
132 PPDMASYNCCOMPLETIONENDPOINT pEndpoint;
133 /** The template. */
134 PPDMASYNCCOMPLETIONTEMPLATE pTemplate;
135 /** Event semaphore for synchronous operations. */
136 RTSEMEVENT EventSem;
137 /** Flag whether a synchronous operation is currently pending. */
138 volatile bool fSyncIoPending;
139 /** Return code of the last completed request. */
140 int rcReqLast;
141 /** Callback routine */
142 PFNVDCOMPLETED pfnCompleted;
143} DRVVDSTORAGEBACKEND, *PDRVVDSTORAGEBACKEND;
144
145/**
146 * VD I/O request state.
147 */
148typedef enum VDIOREQSTATE
149{
150 /** Invalid. */
151 VDIOREQSTATE_INVALID = 0,
152 /** The request is not in use and resides on the free list. */
153 VDIOREQSTATE_FREE,
154 /** The request was just allocated and is not active. */
155 VDIOREQSTATE_ALLOCATED,
156 /** The request was allocated and is in use. */
157 VDIOREQSTATE_ACTIVE,
158 /** The request was suspended and is not actively processed. */
159 VDIOREQSTATE_SUSPENDED,
160 /** The request is in the last step of completion and syncs memory. */
161 VDIOREQSTATE_COMPLETING,
162 /** The request completed. */
163 VDIOREQSTATE_COMPLETED,
164 /** The request was aborted but wasn't returned as complete from the storage
165 * layer below us. */
166 VDIOREQSTATE_CANCELED,
167 /** 32bit hack. */
168 VDIOREQSTATE_32BIT_HACK = 0x7fffffff
169} VDIOREQSTATE;
170
171/**
172 * VD I/O Request.
173 */
174typedef struct PDMMEDIAEXIOREQINT
175{
176 /** List node for the list of allocated requests. */
177 RTLISTNODE NdAllocatedList;
178 /** List for requests waiting for I/O memory or on the redo list. */
179 RTLISTNODE NdLstWait;
180 /** I/O request type. */
181 PDMMEDIAEXIOREQTYPE enmType;
182 /** Request state. */
183 volatile VDIOREQSTATE enmState;
184 /** I/O request ID. */
185 PDMMEDIAEXIOREQID uIoReqId;
186 /** Pointer to the disk container. */
187 PVBOXDISK pDisk;
188 /** Flags. */
189 uint32_t fFlags;
190 /** Timestamp when the request was submitted. */
191 uint64_t tsSubmit;
192 /** Type dependent data. */
193 union
194 {
195 /** Read/Write request sepcific data. */
196 struct
197 {
198 /** Start offset of the request. */
199 uint64_t offStart;
200 /** Size of the request. */
201 size_t cbReq;
202 /** Size left for this request. */
203 size_t cbReqLeft;
204 /** Size of the allocated I/O buffer. */
205 size_t cbIoBuf;
206 /** I/O buffer descriptor. */
207 IOBUFDESC IoBuf;
208 } ReadWrite;
209 /** Discard specific data. */
210 struct
211 {
212 /** Pointer to array of ranges to discard. */
213 PRTRANGE paRanges;
214 /** Number of ranges to discard. */
215 unsigned cRanges;
216 } Discard;
217 };
218 /** Allocator specific memory - variable size. */
219 uint8_t abAlloc[1];
220} PDMMEDIAEXIOREQINT;
221/** Pointer to a VD I/O request. */
222typedef PDMMEDIAEXIOREQINT *PPDMMEDIAEXIOREQINT;
223
224/**
225 * Structure for holding a list of allocated requests.
226 */
227typedef struct VDLSTIOREQALLOC
228{
229 /** Mutex protecting the table of allocated requests. */
230 RTSEMFASTMUTEX hMtxLstIoReqAlloc;
231 /** List anchor. */
232 RTLISTANCHOR LstIoReqAlloc;
233} VDLSTIOREQALLOC;
234typedef VDLSTIOREQALLOC *PVDLSTIOREQALLOC;
235
236/** Number of bins for allocated requests. */
237#define DRVVD_VDIOREQ_ALLOC_BINS 8
238
239/**
240 * VBox disk container media main structure, private part.
241 *
242 * @implements PDMIMEDIA
243 * @implements PDMIMEDIAEX
244 * @implements PDMIMOUNT
245 * @implements VDINTERFACEERROR
246 * @implements VDINTERFACETCPNET
247 * @implements VDINTERFACEASYNCIO
248 * @implements VDINTERFACECONFIG
249 */
250typedef struct VBOXDISK
251{
252 /** The VBox disk container. */
253 PVBOXHDD pDisk;
254 /** The media interface. */
255 PDMIMEDIA IMedia;
256 /** Media port. */
257 PPDMIMEDIAPORT pDrvMediaPort;
258 /** Pointer to the driver instance. */
259 PPDMDRVINS pDrvIns;
260 /** Flag whether suspend has changed image open mode to read only. */
261 bool fTempReadOnly;
262 /** Flag whether to use the runtime (true) or startup error facility. */
263 bool fErrorUseRuntime;
264 /** Pointer to list of VD interfaces. Per-disk. */
265 PVDINTERFACE pVDIfsDisk;
266 /** Error interface. */
267 VDINTERFACEERROR VDIfError;
268 /** Thread synchronization interface. */
269 VDINTERFACETHREADSYNC VDIfThreadSync;
270
271 /** Flag whether opened disk supports async I/O operations. */
272 bool fAsyncIOSupported;
273 /** Pointer to the list of data we need to keep per image. */
274 PVBOXIMAGE pImages;
275 /** Flag whether the media should allow concurrent open for writing. */
276 bool fShareable;
277 /** Flag whether a merge operation has been set up. */
278 bool fMergePending;
279 /** Synchronization to prevent destruction before merge finishes. */
280 RTSEMFASTMUTEX MergeCompleteMutex;
281 /** Synchronization between merge and other image accesses. */
282 RTSEMRW MergeLock;
283 /** Source image index for merging. */
284 unsigned uMergeSource;
285 /** Target image index for merging. */
286 unsigned uMergeTarget;
287
288 /** Flag whether boot acceleration is enabled. */
289 bool fBootAccelEnabled;
290 /** Flag whether boot acceleration is currently active. */
291 bool fBootAccelActive;
292 /** Size of the disk, used for read truncation. */
293 uint64_t cbDisk;
294 /** Size of the configured buffer. */
295 size_t cbBootAccelBuffer;
296 /** Start offset for which the buffer holds data. */
297 uint64_t offDisk;
298 /** Number of valid bytes in the buffer. */
299 size_t cbDataValid;
300 /** The disk buffer. */
301 uint8_t *pbData;
302 /** Bandwidth group the disk is assigned to. */
303 char *pszBwGroup;
304 /** Flag whether async I/O using the host cache is enabled. */
305 bool fAsyncIoWithHostCache;
306
307 /** I/O interface for a cache image. */
308 VDINTERFACEIO VDIfIoCache;
309 /** Interface list for the cache image. */
310 PVDINTERFACE pVDIfsCache;
311
312 /** The block cache handle if configured. */
313 PPDMBLKCACHE pBlkCache;
314 /** Host block device manager. */
315 HBDMGR hHbdMgr;
316
317 /** Drive type. */
318 PDMMEDIATYPE enmType;
319 /** Locked indicator. */
320 bool fLocked;
321 /** Mountable indicator. */
322 bool fMountable;
323 /** Visible to the BIOS. */
324 bool fBiosVisible;
325 /** Flag whether this medium should be presented as non rotational. */
326 bool fNonRotational;
327#ifdef VBOX_PERIODIC_FLUSH
328 /** HACK: Configuration value for number of bytes written after which to flush. */
329 uint32_t cbFlushInterval;
330 /** HACK: Current count for the number of bytes written since the last flush. */
331 uint32_t cbDataWritten;
332#endif /* VBOX_PERIODIC_FLUSH */
333#ifdef VBOX_IGNORE_FLUSH
334 /** HACK: Disable flushes for this drive. */
335 bool fIgnoreFlush;
336 /** Disable async flushes for this drive. */
337 bool fIgnoreFlushAsync;
338#endif /* VBOX_IGNORE_FLUSH */
339 /** Our mountable interface. */
340 PDMIMOUNT IMount;
341 /** Pointer to the mount notify interface above us. */
342 PPDMIMOUNTNOTIFY pDrvMountNotify;
343 /** Uuid of the drive. */
344 RTUUID Uuid;
345 /** BIOS PCHS Geometry. */
346 PDMMEDIAGEOMETRY PCHSGeometry;
347 /** BIOS LCHS Geometry. */
348 PDMMEDIAGEOMETRY LCHSGeometry;
349
350 /** Cryptographic support
351 * @{ */
352 /** Pointer to the CFGM node containing the config of the crypto filter
353 * if enable. */
354 PCFGMNODE pCfgCrypto;
355 /** Config interface for the encryption filter. */
356 VDINTERFACECONFIG VDIfCfg;
357 /** Crypto interface for the encryption filter. */
358 VDINTERFACECRYPTO VDIfCrypto;
359 /** The secret key interface used to retrieve keys. */
360 PPDMISECKEY pIfSecKey;
361 /** The secret key helper interface used to notify about missing keys. */
362 PPDMISECKEYHLP pIfSecKeyHlp;
363 /** @} */
364
365 /** @name IMEDIAEX interface support specific members.
366 * @{ */
367 /** Pointer to the IMEDIAEXPORT interface above us. */
368 PPDMIMEDIAEXPORT pDrvMediaExPort;
369 /** Our extended media interface. */
370 PDMIMEDIAEX IMediaEx;
371 /** Memory cache for the I/O requests. */
372 RTMEMCACHE hIoReqCache;
373 /** I/O buffer manager. */
374 IOBUFMGR hIoBufMgr;
375 /** Active request counter. */
376 volatile uint32_t cIoReqsActive;
377 /** Bins for allocated requests. */
378 VDLSTIOREQALLOC aIoReqAllocBins[DRVVD_VDIOREQ_ALLOC_BINS];
379 /** List of requests for I/O memory to be available - VDIOREQ::NdLstWait. */
380 RTLISTANCHOR LstIoReqIoBufWait;
381 /** Critical section protecting the list of requests waiting for I/O memory. */
382 RTCRITSECT CritSectIoReqsIoBufWait;
383 /** Number of requests waiting for a I/O buffer. */
384 volatile uint32_t cIoReqsWaiting;
385 /** Flag whether we have to resubmit requests on resume because the
386 * VM was suspended due to a recoverable I/O error.
387 */
388 volatile bool fRedo;
389 /** List of requests we have to redo. */
390 RTLISTANCHOR LstIoReqRedo;
391 /** Criticial section protecting the list of waiting requests. */
392 RTCRITSECT CritSectIoReqRedo;
393 /** Number of errors logged so far. */
394 unsigned cErrors;
395 /** @} */
396} VBOXDISK;
397
398
399/*********************************************************************************************************************************
400* Internal Functions *
401*********************************************************************************************************************************/
402
403static DECLCALLBACK(void) drvvdMediaExIoReqComplete(void *pvUser1, void *pvUser2, int rcReq);
404static void drvvdPowerOffOrDestructOrUnmount(PPDMDRVINS pDrvIns);
405DECLINLINE(void) drvvdMediaExIoReqBufFree(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq);
406static int drvvdMediaExIoReqCompleteWorker(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify);
407static int drvvdMediaExIoReqReadWriteProcess(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fUpNotify);
408
409/**
410 * Internal: allocate new image descriptor and put it in the list
411 */
412static PVBOXIMAGE drvvdNewImage(PVBOXDISK pThis)
413{
414 AssertPtr(pThis);
415 PVBOXIMAGE pImage = (PVBOXIMAGE)RTMemAllocZ(sizeof(VBOXIMAGE));
416 if (pImage)
417 {
418 pImage->pVDIfsImage = NULL;
419 PVBOXIMAGE *pp = &pThis->pImages;
420 while (*pp != NULL)
421 pp = &(*pp)->pNext;
422 *pp = pImage;
423 pImage->pNext = NULL;
424 }
425
426 return pImage;
427}
428
429/**
430 * Internal: free the list of images descriptors.
431 */
432static void drvvdFreeImages(PVBOXDISK pThis)
433{
434 while (pThis->pImages != NULL)
435 {
436 PVBOXIMAGE p = pThis->pImages;
437 pThis->pImages = pThis->pImages->pNext;
438 RTMemFree(p);
439 }
440}
441
442
443/**
444 * Make the image temporarily read-only.
445 *
446 * @returns VBox status code.
447 * @param pThis The driver instance data.
448 */
449static int drvvdSetReadonly(PVBOXDISK pThis)
450{
451 int rc = VINF_SUCCESS;
452 if ( pThis->pDisk
453 && !VDIsReadOnly(pThis->pDisk))
454 {
455 unsigned uOpenFlags;
456 rc = VDGetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, &uOpenFlags);
457 AssertRC(rc);
458 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
459 rc = VDSetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, uOpenFlags);
460 AssertRC(rc);
461 pThis->fTempReadOnly = true;
462 }
463 return rc;
464}
465
466
467/**
468 * Undo the temporary read-only status of the image.
469 *
470 * @returns VBox status code.
471 * @param pThis The driver instance data.
472 */
473static int drvvdSetWritable(PVBOXDISK pThis)
474{
475 int rc = VINF_SUCCESS;
476 if (pThis->fTempReadOnly)
477 {
478 unsigned uOpenFlags;
479 rc = VDGetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, &uOpenFlags);
480 AssertRC(rc);
481 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
482 rc = VDSetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, uOpenFlags);
483 if (RT_SUCCESS(rc))
484 pThis->fTempReadOnly = false;
485 else
486 AssertRC(rc);
487 }
488 return rc;
489}
490
491
492/*********************************************************************************************************************************
493* Error reporting callback *
494*********************************************************************************************************************************/
495
496static DECLCALLBACK(void) drvvdErrorCallback(void *pvUser, int rc, RT_SRC_POS_DECL,
497 const char *pszFormat, va_list va)
498{
499 PPDMDRVINS pDrvIns = (PPDMDRVINS)pvUser;
500 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
501 if (pThis->fErrorUseRuntime)
502 /* We must not pass VMSETRTERR_FLAGS_FATAL as it could lead to a
503 * deadlock: We are probably executed in a thread context != EMT
504 * and the EM thread would wait until every thread is suspended
505 * but we would wait for the EM thread ... */
506
507 PDMDrvHlpVMSetRuntimeErrorV(pDrvIns, /* fFlags=*/ 0, "DrvVD", pszFormat, va);
508 else
509 PDMDrvHlpVMSetErrorV(pDrvIns, rc, RT_SRC_POS_ARGS, pszFormat, va);
510}
511
512
513/*********************************************************************************************************************************
514* VD Async I/O interface implementation *
515*********************************************************************************************************************************/
516
517#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
518
519static DECLCALLBACK(void) drvvdAsyncTaskCompleted(PPDMDRVINS pDrvIns, void *pvTemplateUser, void *pvUser, int rcReq)
520{
521 RT_NOREF(pDrvIns);
522 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pvTemplateUser;
523
524 LogFlowFunc(("pDrvIns=%#p pvTemplateUser=%#p pvUser=%#p rcReq=%d\n",
525 pDrvIns, pvTemplateUser, pvUser, rcReq));
526
527 if (pStorageBackend->fSyncIoPending)
528 {
529 Assert(!pvUser);
530 pStorageBackend->rcReqLast = rcReq;
531 ASMAtomicWriteBool(&pStorageBackend->fSyncIoPending, false);
532 RTSemEventSignal(pStorageBackend->EventSem);
533 }
534 else
535 {
536 int rc;
537
538 AssertPtr(pvUser);
539
540 AssertPtr(pStorageBackend->pfnCompleted);
541 rc = pStorageBackend->pfnCompleted(pvUser, rcReq);
542 AssertRC(rc);
543 }
544}
545
546static DECLCALLBACK(int) drvvdAsyncIOOpen(void *pvUser, const char *pszLocation,
547 uint32_t fOpen,
548 PFNVDCOMPLETED pfnCompleted,
549 void **ppStorage)
550{
551 PVBOXDISK pThis = (PVBOXDISK)pvUser;
552 PDRVVDSTORAGEBACKEND pStorageBackend = NULL;
553 int rc = VINF_SUCCESS;
554
555 /*
556 * Check whether the backend wants to open a block device and try to prepare it
557 * if we didn't claim it yet.
558 *
559 * We only create a block device manager on demand to not waste any resources.
560 */
561 if (HBDMgrIsBlockDevice(pszLocation))
562 {
563 if (pThis->hHbdMgr == NIL_HBDMGR)
564 rc = HBDMgrCreate(&pThis->hHbdMgr);
565
566 if ( RT_SUCCESS(rc)
567 && !HBDMgrIsBlockDeviceClaimed(pThis->hHbdMgr, pszLocation))
568 rc = HBDMgrClaimBlockDevice(pThis->hHbdMgr, pszLocation);
569
570 if (RT_FAILURE(rc))
571 return rc;
572 }
573
574 pStorageBackend = (PDRVVDSTORAGEBACKEND)RTMemAllocZ(sizeof(DRVVDSTORAGEBACKEND));
575 if (pStorageBackend)
576 {
577 pStorageBackend->fSyncIoPending = false;
578 pStorageBackend->rcReqLast = VINF_SUCCESS;
579 pStorageBackend->pfnCompleted = pfnCompleted;
580
581 rc = RTSemEventCreate(&pStorageBackend->EventSem);
582 if (RT_SUCCESS(rc))
583 {
584 rc = PDMDrvHlpAsyncCompletionTemplateCreate(pThis->pDrvIns, &pStorageBackend->pTemplate,
585 drvvdAsyncTaskCompleted, pStorageBackend, "AsyncTaskCompleted");
586 if (RT_SUCCESS(rc))
587 {
588 uint32_t fFlags = (fOpen & RTFILE_O_ACCESS_MASK) == RTFILE_O_READ
589 ? PDMACEP_FILE_FLAGS_READ_ONLY
590 : 0;
591 if (pThis->fShareable)
592 {
593 Assert((fOpen & RTFILE_O_DENY_MASK) == RTFILE_O_DENY_NONE);
594
595 fFlags |= PDMACEP_FILE_FLAGS_DONT_LOCK;
596 }
597 if (pThis->fAsyncIoWithHostCache)
598 fFlags |= PDMACEP_FILE_FLAGS_HOST_CACHE_ENABLED;
599
600 rc = PDMR3AsyncCompletionEpCreateForFile(&pStorageBackend->pEndpoint,
601 pszLocation, fFlags,
602 pStorageBackend->pTemplate);
603
604 if (RT_SUCCESS(rc))
605 {
606 if (pThis->pszBwGroup)
607 rc = PDMR3AsyncCompletionEpSetBwMgr(pStorageBackend->pEndpoint, pThis->pszBwGroup);
608
609 if (RT_SUCCESS(rc))
610 {
611 LogFlow(("drvvdAsyncIOOpen: Successfully opened '%s'; fOpen=%#x pStorage=%p\n",
612 pszLocation, fOpen, pStorageBackend));
613 *ppStorage = pStorageBackend;
614 return VINF_SUCCESS;
615 }
616
617 PDMR3AsyncCompletionEpClose(pStorageBackend->pEndpoint);
618 }
619
620 PDMR3AsyncCompletionTemplateDestroy(pStorageBackend->pTemplate);
621 }
622 RTSemEventDestroy(pStorageBackend->EventSem);
623 }
624 RTMemFree(pStorageBackend);
625 }
626 else
627 rc = VERR_NO_MEMORY;
628
629 return rc;
630}
631
632static DECLCALLBACK(int) drvvdAsyncIOClose(void *pvUser, void *pStorage)
633{
634 RT_NOREF(pvUser);
635 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
636
637 /*
638 * We don't unclaim any block devices on purpose here because they
639 * might get reopened shortly (switching to readonly during suspend)
640 *
641 * Block devices will get unclaimed during destruction of the driver.
642 */
643
644 PDMR3AsyncCompletionEpClose(pStorageBackend->pEndpoint);
645 PDMR3AsyncCompletionTemplateDestroy(pStorageBackend->pTemplate);
646 RTSemEventDestroy(pStorageBackend->EventSem);
647 RTMemFree(pStorageBackend);
648 return VINF_SUCCESS;;
649}
650
651static DECLCALLBACK(int) drvvdAsyncIOReadSync(void *pvUser, void *pStorage, uint64_t uOffset,
652 void *pvBuf, size_t cbRead, size_t *pcbRead)
653{
654 RT_NOREF(pvUser);
655 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
656 RTSGSEG DataSeg;
657 PPDMASYNCCOMPLETIONTASK pTask;
658
659 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
660 Assert(!fOld); NOREF(fOld);
661 DataSeg.cbSeg = cbRead;
662 DataSeg.pvSeg = pvBuf;
663
664 int rc = PDMR3AsyncCompletionEpRead(pStorageBackend->pEndpoint, uOffset, &DataSeg, 1, cbRead, NULL, &pTask);
665 if (RT_FAILURE(rc))
666 return rc;
667
668 if (rc == VINF_AIO_TASK_PENDING)
669 {
670 /* Wait */
671 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
672 AssertRC(rc);
673 }
674 else
675 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
676
677 if (pcbRead)
678 *pcbRead = cbRead;
679
680 return pStorageBackend->rcReqLast;
681}
682
683static DECLCALLBACK(int) drvvdAsyncIOWriteSync(void *pvUser, void *pStorage, uint64_t uOffset,
684 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
685{
686 RT_NOREF(pvUser);
687 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
688 RTSGSEG DataSeg;
689 PPDMASYNCCOMPLETIONTASK pTask;
690
691 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
692 Assert(!fOld); NOREF(fOld);
693 DataSeg.cbSeg = cbWrite;
694 DataSeg.pvSeg = (void *)pvBuf;
695
696 int rc = PDMR3AsyncCompletionEpWrite(pStorageBackend->pEndpoint, uOffset, &DataSeg, 1, cbWrite, NULL, &pTask);
697 if (RT_FAILURE(rc))
698 return rc;
699
700 if (rc == VINF_AIO_TASK_PENDING)
701 {
702 /* Wait */
703 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
704 AssertRC(rc);
705 }
706 else
707 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
708
709 if (pcbWritten)
710 *pcbWritten = cbWrite;
711
712 return pStorageBackend->rcReqLast;
713}
714
715static DECLCALLBACK(int) drvvdAsyncIOFlushSync(void *pvUser, void *pStorage)
716{
717 RT_NOREF(pvUser);
718 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
719 PPDMASYNCCOMPLETIONTASK pTask;
720
721 LogFlowFunc(("pvUser=%#p pStorage=%#p\n", pvUser, pStorage));
722
723 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
724 Assert(!fOld); NOREF(fOld);
725
726 int rc = PDMR3AsyncCompletionEpFlush(pStorageBackend->pEndpoint, NULL, &pTask);
727 if (RT_FAILURE(rc))
728 return rc;
729
730 if (rc == VINF_AIO_TASK_PENDING)
731 {
732 /* Wait */
733 LogFlowFunc(("Waiting for flush to complete\n"));
734 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
735 AssertRC(rc);
736 }
737 else
738 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
739
740 return pStorageBackend->rcReqLast;
741}
742
743static DECLCALLBACK(int) drvvdAsyncIOReadAsync(void *pvUser, void *pStorage, uint64_t uOffset,
744 PCRTSGSEG paSegments, size_t cSegments,
745 size_t cbRead, void *pvCompletion,
746 void **ppTask)
747{
748 RT_NOREF(pvUser);
749 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
750
751 int rc = PDMR3AsyncCompletionEpRead(pStorageBackend->pEndpoint, uOffset, paSegments, (unsigned)cSegments, cbRead,
752 pvCompletion, (PPPDMASYNCCOMPLETIONTASK)ppTask);
753 if (rc == VINF_AIO_TASK_PENDING)
754 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
755
756 return rc;
757}
758
759static DECLCALLBACK(int) drvvdAsyncIOWriteAsync(void *pvUser, void *pStorage, uint64_t uOffset,
760 PCRTSGSEG paSegments, size_t cSegments,
761 size_t cbWrite, void *pvCompletion,
762 void **ppTask)
763{
764 RT_NOREF(pvUser);
765 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
766
767 int rc = PDMR3AsyncCompletionEpWrite(pStorageBackend->pEndpoint, uOffset, paSegments, (unsigned)cSegments, cbWrite,
768 pvCompletion, (PPPDMASYNCCOMPLETIONTASK)ppTask);
769 if (rc == VINF_AIO_TASK_PENDING)
770 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
771
772 return rc;
773}
774
775static DECLCALLBACK(int) drvvdAsyncIOFlushAsync(void *pvUser, void *pStorage,
776 void *pvCompletion, void **ppTask)
777{
778 RT_NOREF(pvUser);
779 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
780
781 int rc = PDMR3AsyncCompletionEpFlush(pStorageBackend->pEndpoint, pvCompletion,
782 (PPPDMASYNCCOMPLETIONTASK)ppTask);
783 if (rc == VINF_AIO_TASK_PENDING)
784 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
785
786 return rc;
787}
788
789static DECLCALLBACK(int) drvvdAsyncIOGetSize(void *pvUser, void *pStorage, uint64_t *pcbSize)
790{
791 RT_NOREF(pvUser);
792 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
793
794 return PDMR3AsyncCompletionEpGetSize(pStorageBackend->pEndpoint, pcbSize);
795}
796
797static DECLCALLBACK(int) drvvdAsyncIOSetSize(void *pvUser, void *pStorage, uint64_t cbSize)
798{
799 RT_NOREF(pvUser);
800 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
801
802 return PDMR3AsyncCompletionEpSetSize(pStorageBackend->pEndpoint, cbSize);
803}
804
805static DECLCALLBACK(int) drvvdAsyncIOSetAllocationSize(void *pvUser, void *pvStorage, uint64_t cbSize, uint32_t fFlags)
806{
807 RT_NOREF(pvUser, pvStorage, cbSize, fFlags);
808 return VERR_NOT_SUPPORTED;
809}
810
811#endif /* VBOX_WITH_PDM_ASYNC_COMPLETION */
812
813
814/*********************************************************************************************************************************
815* VD Thread Synchronization interface implementation *
816*********************************************************************************************************************************/
817
818static DECLCALLBACK(int) drvvdThreadStartRead(void *pvUser)
819{
820 PVBOXDISK pThis = (PVBOXDISK)pvUser;
821
822 return RTSemRWRequestRead(pThis->MergeLock, RT_INDEFINITE_WAIT);
823}
824
825static DECLCALLBACK(int) drvvdThreadFinishRead(void *pvUser)
826{
827 PVBOXDISK pThis = (PVBOXDISK)pvUser;
828
829 return RTSemRWReleaseRead(pThis->MergeLock);
830}
831
832static DECLCALLBACK(int) drvvdThreadStartWrite(void *pvUser)
833{
834 PVBOXDISK pThis = (PVBOXDISK)pvUser;
835
836 return RTSemRWRequestWrite(pThis->MergeLock, RT_INDEFINITE_WAIT);
837}
838
839static DECLCALLBACK(int) drvvdThreadFinishWrite(void *pvUser)
840{
841 PVBOXDISK pThis = (PVBOXDISK)pvUser;
842
843 return RTSemRWReleaseWrite(pThis->MergeLock);
844}
845
846
847/*********************************************************************************************************************************
848* VD Configuration interface implementation *
849*********************************************************************************************************************************/
850
851static DECLCALLBACK(bool) drvvdCfgAreKeysValid(void *pvUser, const char *pszzValid)
852{
853 return CFGMR3AreValuesValid((PCFGMNODE)pvUser, pszzValid);
854}
855
856static DECLCALLBACK(int) drvvdCfgQuerySize(void *pvUser, const char *pszName, size_t *pcb)
857{
858 return CFGMR3QuerySize((PCFGMNODE)pvUser, pszName, pcb);
859}
860
861static DECLCALLBACK(int) drvvdCfgQuery(void *pvUser, const char *pszName, char *pszString, size_t cchString)
862{
863 return CFGMR3QueryString((PCFGMNODE)pvUser, pszName, pszString, cchString);
864}
865
866static DECLCALLBACK(int) drvvdCfgQueryBytes(void *pvUser, const char *pszName, void *ppvData, size_t cbData)
867{
868 return CFGMR3QueryBytes((PCFGMNODE)pvUser, pszName, ppvData, cbData);
869}
870
871
872/*******************************************************************************
873* VD Crypto interface implementation for the encryption support *
874*******************************************************************************/
875
876static DECLCALLBACK(int) drvvdCryptoKeyRetain(void *pvUser, const char *pszId, const uint8_t **ppbKey, size_t *pcbKey)
877{
878 PVBOXDISK pThis = (PVBOXDISK)pvUser;
879 int rc = VINF_SUCCESS;
880
881 AssertPtr(pThis->pIfSecKey);
882 if (pThis->pIfSecKey)
883 rc = pThis->pIfSecKey->pfnKeyRetain(pThis->pIfSecKey, pszId, ppbKey, pcbKey);
884 else
885 rc = VERR_NOT_SUPPORTED;
886
887 return rc;
888}
889
890static DECLCALLBACK(int) drvvdCryptoKeyRelease(void *pvUser, const char *pszId)
891{
892 PVBOXDISK pThis = (PVBOXDISK)pvUser;
893 int rc = VINF_SUCCESS;
894
895 AssertPtr(pThis->pIfSecKey);
896 if (pThis->pIfSecKey)
897 rc = pThis->pIfSecKey->pfnKeyRelease(pThis->pIfSecKey, pszId);
898 else
899 rc = VERR_NOT_SUPPORTED;
900
901 return rc;
902}
903
904static DECLCALLBACK(int) drvvdCryptoKeyStorePasswordRetain(void *pvUser, const char *pszId, const char **ppszPassword)
905{
906 PVBOXDISK pThis = (PVBOXDISK)pvUser;
907 int rc = VINF_SUCCESS;
908
909 AssertPtr(pThis->pIfSecKey);
910 if (pThis->pIfSecKey)
911 rc = pThis->pIfSecKey->pfnPasswordRetain(pThis->pIfSecKey, pszId, ppszPassword);
912 else
913 rc = VERR_NOT_SUPPORTED;
914
915 return rc;
916}
917
918static DECLCALLBACK(int) drvvdCryptoKeyStorePasswordRelease(void *pvUser, const char *pszId)
919{
920 PVBOXDISK pThis = (PVBOXDISK)pvUser;
921 int rc = VINF_SUCCESS;
922
923 AssertPtr(pThis->pIfSecKey);
924 if (pThis->pIfSecKey)
925 rc = pThis->pIfSecKey->pfnPasswordRelease(pThis->pIfSecKey, pszId);
926 else
927 rc = VERR_NOT_SUPPORTED;
928
929 return rc;
930}
931
932#ifdef VBOX_WITH_INIP
933
934
935/*********************************************************************************************************************************
936* VD TCP network stack interface implementation - INIP case *
937*********************************************************************************************************************************/
938
939/**
940 * vvl: this structure duplicate meaning of sockaddr,
941 * perhaps it'd be better to get rid of it.
942 */
943typedef union INIPSOCKADDRUNION
944{
945 struct sockaddr Addr;
946 struct sockaddr_in Ipv4;
947#if LWIP_IPV6
948 struct sockaddr_in6 Ipv6;
949#endif
950} INIPSOCKADDRUNION;
951
952typedef struct INIPSOCKET
953{
954 int hSock;
955} INIPSOCKET, *PINIPSOCKET;
956
957static DECLCALLBACK(int) drvvdINIPFlush(VDSOCKET Sock);
958
959/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
960static DECLCALLBACK(int) drvvdINIPSocketCreate(uint32_t fFlags, PVDSOCKET pSock)
961{
962 PINIPSOCKET pSocketInt = NULL;
963
964 /*
965 * The extended select method is not supported because it is impossible to wakeup
966 * the thread.
967 */
968 if (fFlags & VD_INTERFACETCPNET_CONNECT_EXTENDED_SELECT)
969 return VERR_NOT_SUPPORTED;
970
971 pSocketInt = (PINIPSOCKET)RTMemAllocZ(sizeof(INIPSOCKET));
972 if (pSocketInt)
973 {
974 pSocketInt->hSock = INT32_MAX;
975 *pSock = (VDSOCKET)pSocketInt;
976 return VINF_SUCCESS;
977 }
978
979 return VERR_NO_MEMORY;
980}
981
982/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
983static DECLCALLBACK(int) drvvdINIPSocketDestroy(VDSOCKET Sock)
984{
985 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
986
987 RTMemFree(pSocketInt);
988 return VINF_SUCCESS;
989}
990
991/** @interface_method_impl{VDINTERFACETCPNET,pfnClientConnect} */
992static DECLCALLBACK(int) drvvdINIPClientConnect(VDSOCKET Sock, const char *pszAddress, uint32_t uPort,
993 RTMSINTERVAL cMillies)
994{
995 int rc = VINF_SUCCESS;
996 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
997 int iInetFamily = PF_INET;
998 struct in_addr ip;
999#if LWIP_IPV6
1000 ip6_addr_t ip6;
1001 RT_ZERO(ip6);
1002#endif
1003
1004 NOREF(cMillies); /* LwIP doesn't support connect timeout. */
1005 RT_ZERO(ip); /* Shut up MSC. */
1006
1007 /* Check whether lwIP is set up in this VM instance. */
1008 if (!DevINIPConfigured())
1009 {
1010 LogRelFunc(("no IP stack\n"));
1011 return VERR_NET_HOST_UNREACHABLE;
1012 }
1013 /* Resolve hostname. As there is no standard resolver for lwIP yet,
1014 * just accept numeric IP addresses for now. */
1015#if LWIP_IPV6
1016 if (inet6_aton(pszAddress, &ip6))
1017 iInetFamily = PF_INET6;
1018 else /* concatination with if */
1019#endif
1020 if (!lwip_inet_aton(pszAddress, &ip))
1021 {
1022 LogRelFunc(("cannot resolve IP %s\n", pszAddress));
1023 return VERR_NET_HOST_UNREACHABLE;
1024 }
1025 /* Create socket and connect. */
1026 int iSock = lwip_socket(iInetFamily, SOCK_STREAM, 0);
1027 if (iSock != -1)
1028 {
1029 struct sockaddr *pSockAddr = NULL;
1030 struct sockaddr_in InAddr = {0};
1031#if LWIP_IPV6
1032 struct sockaddr_in6 In6Addr = {0};
1033#endif
1034 if (iInetFamily == PF_INET)
1035 {
1036 InAddr.sin_family = AF_INET;
1037 InAddr.sin_port = htons(uPort);
1038 InAddr.sin_addr = ip;
1039 InAddr.sin_len = sizeof(InAddr);
1040 pSockAddr = (struct sockaddr *)&InAddr;
1041 }
1042#if LWIP_IPV6
1043 else
1044 {
1045 In6Addr.sin6_family = AF_INET6;
1046 In6Addr.sin6_port = htons(uPort);
1047 memcpy(&In6Addr.sin6_addr, &ip6, sizeof(ip6));
1048 In6Addr.sin6_len = sizeof(In6Addr);
1049 pSockAddr = (struct sockaddr *)&In6Addr;
1050 }
1051#endif
1052 if ( pSockAddr
1053 && !lwip_connect(iSock, pSockAddr, pSockAddr->sa_len))
1054 {
1055 pSocketInt->hSock = iSock;
1056 return VINF_SUCCESS;
1057 }
1058 rc = VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1059 lwip_close(iSock);
1060 }
1061 else
1062 rc = VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1063 return rc;
1064}
1065
1066/** @interface_method_impl{VDINTERFACETCPNET,pfnClientClose} */
1067static DECLCALLBACK(int) drvvdINIPClientClose(VDSOCKET Sock)
1068{
1069 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1070
1071 lwip_close(pSocketInt->hSock);
1072 pSocketInt->hSock = INT32_MAX;
1073 return VINF_SUCCESS; /** @todo real solution needed */
1074}
1075
1076/** @interface_method_impl{VDINTERFACETCPNET,pfnIsClientConnected} */
1077static DECLCALLBACK(bool) drvvdINIPIsClientConnected(VDSOCKET Sock)
1078{
1079 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1080
1081 return pSocketInt->hSock != INT32_MAX;
1082}
1083
1084/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOne} */
1085static DECLCALLBACK(int) drvvdINIPSelectOne(VDSOCKET Sock, RTMSINTERVAL cMillies)
1086{
1087 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1088 fd_set fdsetR;
1089 FD_ZERO(&fdsetR);
1090 FD_SET((uintptr_t)pSocketInt->hSock, &fdsetR);
1091 fd_set fdsetE = fdsetR;
1092
1093 int rc;
1094 if (cMillies == RT_INDEFINITE_WAIT)
1095 rc = lwip_select(pSocketInt->hSock + 1, &fdsetR, NULL, &fdsetE, NULL);
1096 else
1097 {
1098 struct timeval timeout;
1099 timeout.tv_sec = cMillies / 1000;
1100 timeout.tv_usec = (cMillies % 1000) * 1000;
1101 rc = lwip_select(pSocketInt->hSock + 1, &fdsetR, NULL, &fdsetE, &timeout);
1102 }
1103 if (rc > 0)
1104 return VINF_SUCCESS;
1105 if (rc == 0)
1106 return VERR_TIMEOUT;
1107 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1108}
1109
1110/** @interface_method_impl{VDINTERFACETCPNET,pfnRead} */
1111static DECLCALLBACK(int) drvvdINIPRead(VDSOCKET Sock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1112{
1113 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1114
1115 /* Do params checking */
1116 if (!pvBuffer || !cbBuffer)
1117 {
1118 AssertMsgFailed(("Invalid params\n"));
1119 return VERR_INVALID_PARAMETER;
1120 }
1121
1122 /*
1123 * Read loop.
1124 * If pcbRead is NULL we have to fill the entire buffer!
1125 */
1126 size_t cbRead = 0;
1127 size_t cbToRead = cbBuffer;
1128 for (;;)
1129 {
1130 /** @todo this clipping here is just in case (the send function
1131 * needed it, so I added it here, too). Didn't investigate if this
1132 * really has issues. Better be safe than sorry. */
1133 ssize_t cbBytesRead = lwip_recv(pSocketInt->hSock, (char *)pvBuffer + cbRead,
1134 RT_MIN(cbToRead, 32768), 0);
1135 if (cbBytesRead < 0)
1136 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution */
1137 if (cbBytesRead == 0 && errno) /** @todo r=bird: lwip_recv will not touch errno on Windows. This may apply to other hosts as well */
1138 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution */
1139 if (pcbRead)
1140 {
1141 /* return partial data */
1142 *pcbRead = cbBytesRead;
1143 break;
1144 }
1145
1146 /* read more? */
1147 cbRead += cbBytesRead;
1148 if (cbRead == cbBuffer)
1149 break;
1150
1151 /* next */
1152 cbToRead = cbBuffer - cbRead;
1153 }
1154
1155 return VINF_SUCCESS;
1156}
1157
1158/** @interface_method_impl{VDINTERFACETCPNET,pfnWrite} */
1159static DECLCALLBACK(int) drvvdINIPWrite(VDSOCKET Sock, const void *pvBuffer, size_t cbBuffer)
1160{
1161 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1162
1163 do
1164 {
1165 /** @todo lwip send only supports up to 65535 bytes in a single
1166 * send (stupid limitation buried in the code), so make sure we
1167 * don't get any wraparounds. This should be moved to DevINIP
1168 * stack interface once that's implemented. */
1169 ssize_t cbWritten = lwip_send(pSocketInt->hSock, (void *)pvBuffer,
1170 RT_MIN(cbBuffer, 32768), 0);
1171 if (cbWritten < 0)
1172 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1173 AssertMsg(cbBuffer >= (size_t)cbWritten, ("Wrote more than we requested!!! cbWritten=%d cbBuffer=%d\n",
1174 cbWritten, cbBuffer));
1175 cbBuffer -= cbWritten;
1176 pvBuffer = (const char *)pvBuffer + cbWritten;
1177 } while (cbBuffer);
1178
1179 return VINF_SUCCESS;
1180}
1181
1182/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWrite} */
1183static DECLCALLBACK(int) drvvdINIPSgWrite(VDSOCKET Sock, PCRTSGBUF pSgBuf)
1184{
1185 int rc = VINF_SUCCESS;
1186
1187 /* This is an extremely crude emulation, however it's good enough
1188 * for our iSCSI code. INIP has no sendmsg(). */
1189 for (unsigned i = 0; i < pSgBuf->cSegs; i++)
1190 {
1191 rc = drvvdINIPWrite(Sock, pSgBuf->paSegs[i].pvSeg,
1192 pSgBuf->paSegs[i].cbSeg);
1193 if (RT_FAILURE(rc))
1194 break;
1195 }
1196 if (RT_SUCCESS(rc))
1197 drvvdINIPFlush(Sock);
1198
1199 return rc;
1200}
1201
1202/** @interface_method_impl{VDINTERFACETCPNET,pfnFlush} */
1203static DECLCALLBACK(int) drvvdINIPFlush(VDSOCKET Sock)
1204{
1205 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1206
1207 int fFlag = 1;
1208 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1209 (const char *)&fFlag, sizeof(fFlag));
1210 fFlag = 0;
1211 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1212 (const char *)&fFlag, sizeof(fFlag));
1213 return VINF_SUCCESS;
1214}
1215
1216/** @interface_method_impl{VDINTERFACETCPNET,pfnSetSendCoalescing} */
1217static DECLCALLBACK(int) drvvdINIPSetSendCoalescing(VDSOCKET Sock, bool fEnable)
1218{
1219 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1220
1221 int fFlag = fEnable ? 0 : 1;
1222 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1223 (const char *)&fFlag, sizeof(fFlag));
1224 return VINF_SUCCESS;
1225}
1226
1227/** @interface_method_impl{VDINTERFACETCPNET,pfnGetLocalAddress} */
1228static DECLCALLBACK(int) drvvdINIPGetLocalAddress(VDSOCKET Sock, PRTNETADDR pAddr)
1229{
1230 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1231 INIPSOCKADDRUNION u;
1232 socklen_t cbAddr = sizeof(u);
1233 RT_ZERO(u);
1234 if (!lwip_getsockname(pSocketInt->hSock, &u.Addr, &cbAddr))
1235 {
1236 /*
1237 * Convert the address.
1238 */
1239 if ( cbAddr == sizeof(struct sockaddr_in)
1240 && u.Addr.sa_family == AF_INET)
1241 {
1242 RT_ZERO(*pAddr);
1243 pAddr->enmType = RTNETADDRTYPE_IPV4;
1244 pAddr->uPort = RT_N2H_U16(u.Ipv4.sin_port);
1245 pAddr->uAddr.IPv4.u = u.Ipv4.sin_addr.s_addr;
1246 }
1247#if LWIP_IPV6
1248 else if ( cbAddr == sizeof(struct sockaddr_in6)
1249 && u.Addr.sa_family == AF_INET6)
1250 {
1251 RT_ZERO(*pAddr);
1252 pAddr->enmType = RTNETADDRTYPE_IPV6;
1253 pAddr->uPort = RT_N2H_U16(u.Ipv6.sin6_port);
1254 memcpy(&pAddr->uAddr.IPv6, &u.Ipv6.sin6_addr, sizeof(RTNETADDRIPV6));
1255 }
1256#endif
1257 else
1258 return VERR_NET_ADDRESS_FAMILY_NOT_SUPPORTED;
1259 return VINF_SUCCESS;
1260 }
1261 return VERR_NET_OPERATION_NOT_SUPPORTED;
1262}
1263
1264/** @interface_method_impl{VDINTERFACETCPNET,pfnGetPeerAddress} */
1265static DECLCALLBACK(int) drvvdINIPGetPeerAddress(VDSOCKET Sock, PRTNETADDR pAddr)
1266{
1267 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1268 INIPSOCKADDRUNION u;
1269 socklen_t cbAddr = sizeof(u);
1270 RT_ZERO(u);
1271 if (!lwip_getpeername(pSocketInt->hSock, &u.Addr, &cbAddr))
1272 {
1273 /*
1274 * Convert the address.
1275 */
1276 if ( cbAddr == sizeof(struct sockaddr_in)
1277 && u.Addr.sa_family == AF_INET)
1278 {
1279 RT_ZERO(*pAddr);
1280 pAddr->enmType = RTNETADDRTYPE_IPV4;
1281 pAddr->uPort = RT_N2H_U16(u.Ipv4.sin_port);
1282 pAddr->uAddr.IPv4.u = u.Ipv4.sin_addr.s_addr;
1283 }
1284#if LWIP_IPV6
1285 else if ( cbAddr == sizeof(struct sockaddr_in6)
1286 && u.Addr.sa_family == AF_INET6)
1287 {
1288 RT_ZERO(*pAddr);
1289 pAddr->enmType = RTNETADDRTYPE_IPV6;
1290 pAddr->uPort = RT_N2H_U16(u.Ipv6.sin6_port);
1291 memcpy(&pAddr->uAddr.IPv6, &u.Ipv6.sin6_addr, sizeof(RTNETADDRIPV6));
1292 }
1293#endif
1294 else
1295 return VERR_NET_ADDRESS_FAMILY_NOT_SUPPORTED;
1296 return VINF_SUCCESS;
1297 }
1298 return VERR_NET_OPERATION_NOT_SUPPORTED;
1299}
1300
1301/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOneEx} */
1302static DECLCALLBACK(int) drvvdINIPSelectOneEx(VDSOCKET Sock, uint32_t fEvents, uint32_t *pfEvents, RTMSINTERVAL cMillies)
1303{
1304 RT_NOREF(Sock, fEvents, pfEvents, cMillies);
1305 AssertMsgFailed(("Not supported!\n"));
1306 return VERR_NOT_SUPPORTED;
1307}
1308
1309/** @interface_method_impl{VDINTERFACETCPNET,pfnPoke} */
1310static DECLCALLBACK(int) drvvdINIPPoke(VDSOCKET Sock)
1311{
1312 RT_NOREF(Sock);
1313 AssertMsgFailed(("Not supported!\n"));
1314 return VERR_NOT_SUPPORTED;
1315}
1316
1317#endif /* VBOX_WITH_INIP */
1318
1319
1320/*********************************************************************************************************************************
1321* VD TCP network stack interface implementation - Host TCP case *
1322*********************************************************************************************************************************/
1323
1324/**
1325 * Socket data.
1326 */
1327typedef struct VDSOCKETINT
1328{
1329 /** IPRT socket handle. */
1330 RTSOCKET hSocket;
1331 /** Pollset with the wakeup pipe and socket. */
1332 RTPOLLSET hPollSet;
1333 /** Pipe endpoint - read (in the pollset). */
1334 RTPIPE hPipeR;
1335 /** Pipe endpoint - write. */
1336 RTPIPE hPipeW;
1337 /** Flag whether the thread was woken up. */
1338 volatile bool fWokenUp;
1339 /** Flag whether the thread is waiting in the select call. */
1340 volatile bool fWaiting;
1341 /** Old event mask. */
1342 uint32_t fEventsOld;
1343} VDSOCKETINT, *PVDSOCKETINT;
1344
1345/** Pollset id of the socket. */
1346#define VDSOCKET_POLL_ID_SOCKET 0
1347/** Pollset id of the pipe. */
1348#define VDSOCKET_POLL_ID_PIPE 1
1349
1350/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
1351static DECLCALLBACK(int) drvvdTcpSocketCreate(uint32_t fFlags, PVDSOCKET phVdSock)
1352{
1353 int rc = VINF_SUCCESS;
1354 int rc2 = VINF_SUCCESS;
1355 PVDSOCKETINT pSockInt = NULL;
1356
1357 pSockInt = (PVDSOCKETINT)RTMemAllocZ(sizeof(VDSOCKETINT));
1358 if (!pSockInt)
1359 return VERR_NO_MEMORY;
1360
1361 pSockInt->hSocket = NIL_RTSOCKET;
1362 pSockInt->hPollSet = NIL_RTPOLLSET;
1363 pSockInt->hPipeR = NIL_RTPIPE;
1364 pSockInt->hPipeW = NIL_RTPIPE;
1365 pSockInt->fWokenUp = false;
1366 pSockInt->fWaiting = false;
1367
1368 if (fFlags & VD_INTERFACETCPNET_CONNECT_EXTENDED_SELECT)
1369 {
1370 /* Init pipe and pollset. */
1371 rc = RTPipeCreate(&pSockInt->hPipeR, &pSockInt->hPipeW, 0);
1372 if (RT_SUCCESS(rc))
1373 {
1374 rc = RTPollSetCreate(&pSockInt->hPollSet);
1375 if (RT_SUCCESS(rc))
1376 {
1377 rc = RTPollSetAddPipe(pSockInt->hPollSet, pSockInt->hPipeR,
1378 RTPOLL_EVT_READ, VDSOCKET_POLL_ID_PIPE);
1379 if (RT_SUCCESS(rc))
1380 {
1381 *phVdSock = pSockInt;
1382 return VINF_SUCCESS;
1383 }
1384
1385 RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_PIPE);
1386 rc2 = RTPollSetDestroy(pSockInt->hPollSet);
1387 AssertRC(rc2);
1388 }
1389
1390 rc2 = RTPipeClose(pSockInt->hPipeR);
1391 AssertRC(rc2);
1392 rc2 = RTPipeClose(pSockInt->hPipeW);
1393 AssertRC(rc2);
1394 }
1395 }
1396 else
1397 {
1398 *phVdSock = pSockInt;
1399 return VINF_SUCCESS;
1400 }
1401
1402 RTMemFree(pSockInt);
1403
1404 return rc;
1405}
1406
1407/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketDestroy} */
1408static DECLCALLBACK(int) drvvdTcpSocketDestroy(VDSOCKET hVdSock)
1409{
1410 int rc = VINF_SUCCESS;
1411 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1412
1413 /* Destroy the pipe and pollset if necessary. */
1414 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1415 {
1416 if (pSockInt->hSocket != NIL_RTSOCKET)
1417 {
1418 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1419 Assert(RT_SUCCESS(rc) || rc == VERR_POLL_HANDLE_ID_NOT_FOUND);
1420 }
1421 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_PIPE);
1422 AssertRC(rc);
1423 rc = RTPollSetDestroy(pSockInt->hPollSet);
1424 AssertRC(rc);
1425 rc = RTPipeClose(pSockInt->hPipeR);
1426 AssertRC(rc);
1427 rc = RTPipeClose(pSockInt->hPipeW);
1428 AssertRC(rc);
1429 }
1430
1431 if (pSockInt->hSocket != NIL_RTSOCKET)
1432 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1433
1434 RTMemFree(pSockInt);
1435
1436 return rc;
1437}
1438
1439/** @interface_method_impl{VDINTERFACETCPNET,pfnClientConnect} */
1440static DECLCALLBACK(int) drvvdTcpClientConnect(VDSOCKET hVdSock, const char *pszAddress, uint32_t uPort,
1441 RTMSINTERVAL cMillies)
1442{
1443 int rc = VINF_SUCCESS;
1444 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1445
1446 rc = RTTcpClientConnectEx(pszAddress, uPort, &pSockInt->hSocket, cMillies, NULL);
1447 if (RT_SUCCESS(rc))
1448 {
1449 /* Add to the pollset if required. */
1450 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1451 {
1452 pSockInt->fEventsOld = RTPOLL_EVT_READ | RTPOLL_EVT_WRITE | RTPOLL_EVT_ERROR;
1453
1454 rc = RTPollSetAddSocket(pSockInt->hPollSet, pSockInt->hSocket,
1455 pSockInt->fEventsOld, VDSOCKET_POLL_ID_SOCKET);
1456 }
1457
1458 if (RT_SUCCESS(rc))
1459 return VINF_SUCCESS;
1460
1461 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1462 }
1463
1464 return rc;
1465}
1466
1467/** @interface_method_impl{VDINTERFACETCPNET,pfnClientClose} */
1468static DECLCALLBACK(int) drvvdTcpClientClose(VDSOCKET hVdSock)
1469{
1470 int rc = VINF_SUCCESS;
1471 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1472
1473 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1474 {
1475 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1476 AssertRC(rc);
1477 }
1478
1479 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1480 pSockInt->hSocket = NIL_RTSOCKET;
1481
1482 return rc;
1483}
1484
1485/** @interface_method_impl{VDINTERFACETCPNET,pfnIsClientConnected} */
1486static DECLCALLBACK(bool) drvvdTcpIsClientConnected(VDSOCKET hVdSock)
1487{
1488 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1489
1490 return pSockInt->hSocket != NIL_RTSOCKET;
1491}
1492
1493/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOne} */
1494static DECLCALLBACK(int) drvvdTcpSelectOne(VDSOCKET hVdSock, RTMSINTERVAL cMillies)
1495{
1496 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1497
1498 return RTTcpSelectOne(pSockInt->hSocket, cMillies);
1499}
1500
1501/** @interface_method_impl{VDINTERFACETCPNET,pfnRead} */
1502static DECLCALLBACK(int) drvvdTcpRead(VDSOCKET hVdSock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1503{
1504 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1505
1506 return RTTcpRead(pSockInt->hSocket, pvBuffer, cbBuffer, pcbRead);
1507}
1508
1509/** @interface_method_impl{VDINTERFACETCPNET,pfnWrite} */
1510static DECLCALLBACK(int) drvvdTcpWrite(VDSOCKET hVdSock, const void *pvBuffer, size_t cbBuffer)
1511{
1512 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1513
1514 return RTTcpWrite(pSockInt->hSocket, pvBuffer, cbBuffer);
1515}
1516
1517/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWrite} */
1518static DECLCALLBACK(int) drvvdTcpSgWrite(VDSOCKET hVdSock, PCRTSGBUF pSgBuf)
1519{
1520 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1521
1522 return RTTcpSgWrite(pSockInt->hSocket, pSgBuf);
1523}
1524
1525/** @interface_method_impl{VDINTERFACETCPNET,pfnReadNB} */
1526static DECLCALLBACK(int) drvvdTcpReadNB(VDSOCKET hVdSock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1527{
1528 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1529
1530 return RTTcpReadNB(pSockInt->hSocket, pvBuffer, cbBuffer, pcbRead);
1531}
1532
1533/** @interface_method_impl{VDINTERFACETCPNET,pfnWriteNB} */
1534static DECLCALLBACK(int) drvvdTcpWriteNB(VDSOCKET hVdSock, const void *pvBuffer, size_t cbBuffer, size_t *pcbWritten)
1535{
1536 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1537
1538 return RTTcpWriteNB(pSockInt->hSocket, pvBuffer, cbBuffer, pcbWritten);
1539}
1540
1541/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWriteNB} */
1542static DECLCALLBACK(int) drvvdTcpSgWriteNB(VDSOCKET hVdSock, PRTSGBUF pSgBuf, size_t *pcbWritten)
1543{
1544 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1545
1546 return RTTcpSgWriteNB(pSockInt->hSocket, pSgBuf, pcbWritten);
1547}
1548
1549/** @interface_method_impl{VDINTERFACETCPNET,pfnFlush} */
1550static DECLCALLBACK(int) drvvdTcpFlush(VDSOCKET hVdSock)
1551{
1552 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1553
1554 return RTTcpFlush(pSockInt->hSocket);
1555}
1556
1557/** @interface_method_impl{VDINTERFACETCPNET,pfnSetSendCoalescing} */
1558static DECLCALLBACK(int) drvvdTcpSetSendCoalescing(VDSOCKET hVdSock, bool fEnable)
1559{
1560 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1561
1562 return RTTcpSetSendCoalescing(pSockInt->hSocket, fEnable);
1563}
1564
1565/** @interface_method_impl{VDINTERFACETCPNET,pfnGetLocalAddress} */
1566static DECLCALLBACK(int) drvvdTcpGetLocalAddress(VDSOCKET hVdSock, PRTNETADDR pAddr)
1567{
1568 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1569
1570 return RTTcpGetLocalAddress(pSockInt->hSocket, pAddr);
1571}
1572
1573/** @interface_method_impl{VDINTERFACETCPNET,pfnGetPeerAddress} */
1574static DECLCALLBACK(int) drvvdTcpGetPeerAddress(VDSOCKET hVdSock, PRTNETADDR pAddr)
1575{
1576 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1577
1578 return RTTcpGetPeerAddress(pSockInt->hSocket, pAddr);
1579}
1580
1581static DECLCALLBACK(int) drvvdTcpSelectOneExPoll(VDSOCKET hVdSock, uint32_t fEvents,
1582 uint32_t *pfEvents, RTMSINTERVAL cMillies)
1583{
1584 int rc = VINF_SUCCESS;
1585 uint32_t id = 0;
1586 uint32_t fEventsRecv = 0;
1587 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1588
1589 *pfEvents = 0;
1590
1591 if ( pSockInt->fEventsOld != fEvents
1592 && pSockInt->hSocket != NIL_RTSOCKET)
1593 {
1594 uint32_t fPollEvents = 0;
1595
1596 if (fEvents & VD_INTERFACETCPNET_EVT_READ)
1597 fPollEvents |= RTPOLL_EVT_READ;
1598 if (fEvents & VD_INTERFACETCPNET_EVT_WRITE)
1599 fPollEvents |= RTPOLL_EVT_WRITE;
1600 if (fEvents & VD_INTERFACETCPNET_EVT_ERROR)
1601 fPollEvents |= RTPOLL_EVT_ERROR;
1602
1603 rc = RTPollSetEventsChange(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET, fPollEvents);
1604 if (RT_FAILURE(rc))
1605 return rc;
1606
1607 pSockInt->fEventsOld = fEvents;
1608 }
1609
1610 ASMAtomicXchgBool(&pSockInt->fWaiting, true);
1611 if (ASMAtomicXchgBool(&pSockInt->fWokenUp, false))
1612 {
1613 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1614 return VERR_INTERRUPTED;
1615 }
1616
1617 rc = RTPoll(pSockInt->hPollSet, cMillies, &fEventsRecv, &id);
1618 Assert(RT_SUCCESS(rc) || rc == VERR_TIMEOUT);
1619
1620 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1621
1622 if (RT_SUCCESS(rc))
1623 {
1624 if (id == VDSOCKET_POLL_ID_SOCKET)
1625 {
1626 fEventsRecv &= RTPOLL_EVT_VALID_MASK;
1627
1628 if (fEventsRecv & RTPOLL_EVT_READ)
1629 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1630 if (fEventsRecv & RTPOLL_EVT_WRITE)
1631 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1632 if (fEventsRecv & RTPOLL_EVT_ERROR)
1633 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1634 }
1635 else
1636 {
1637 size_t cbRead = 0;
1638 uint8_t abBuf[10];
1639 Assert(id == VDSOCKET_POLL_ID_PIPE);
1640 Assert((fEventsRecv & RTPOLL_EVT_VALID_MASK) == RTPOLL_EVT_READ);
1641
1642 /* We got interrupted, drain the pipe. */
1643 rc = RTPipeRead(pSockInt->hPipeR, abBuf, sizeof(abBuf), &cbRead);
1644 AssertRC(rc);
1645
1646 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1647
1648 rc = VERR_INTERRUPTED;
1649 }
1650 }
1651
1652 return rc;
1653}
1654
1655/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOneEx} */
1656static DECLCALLBACK(int) drvvdTcpSelectOneExNoPoll(VDSOCKET hVdSock, uint32_t fEvents, uint32_t *pfEvents, RTMSINTERVAL cMillies)
1657{
1658 RT_NOREF(cMillies); /** @todo timeouts */
1659 int rc = VINF_SUCCESS;
1660 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1661
1662 *pfEvents = 0;
1663
1664 ASMAtomicXchgBool(&pSockInt->fWaiting, true);
1665 if (ASMAtomicXchgBool(&pSockInt->fWokenUp, false))
1666 {
1667 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1668 return VERR_INTERRUPTED;
1669 }
1670
1671 if ( pSockInt->hSocket == NIL_RTSOCKET
1672 || !fEvents)
1673 {
1674 /*
1675 * Only the pipe is configured or the caller doesn't wait for a socket event,
1676 * wait until there is something to read from the pipe.
1677 */
1678 size_t cbRead = 0;
1679 char ch = 0;
1680 rc = RTPipeReadBlocking(pSockInt->hPipeR, &ch, 1, &cbRead);
1681 if (RT_SUCCESS(rc))
1682 {
1683 Assert(cbRead == 1);
1684 rc = VERR_INTERRUPTED;
1685 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1686 }
1687 }
1688 else
1689 {
1690 uint32_t fSelectEvents = 0;
1691
1692 if (fEvents & VD_INTERFACETCPNET_EVT_READ)
1693 fSelectEvents |= RTSOCKET_EVT_READ;
1694 if (fEvents & VD_INTERFACETCPNET_EVT_WRITE)
1695 fSelectEvents |= RTSOCKET_EVT_WRITE;
1696 if (fEvents & VD_INTERFACETCPNET_EVT_ERROR)
1697 fSelectEvents |= RTSOCKET_EVT_ERROR;
1698
1699 if (fEvents & VD_INTERFACETCPNET_HINT_INTERRUPT)
1700 {
1701 uint32_t fEventsRecv = 0;
1702
1703 /* Make sure the socket is not in the pollset. */
1704 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1705 Assert(RT_SUCCESS(rc) || rc == VERR_POLL_HANDLE_ID_NOT_FOUND);
1706
1707 for (;;)
1708 {
1709 uint32_t id = 0;
1710 rc = RTPoll(pSockInt->hPollSet, 5, &fEvents, &id);
1711 if (rc == VERR_TIMEOUT)
1712 {
1713 /* Check the socket. */
1714 rc = RTTcpSelectOneEx(pSockInt->hSocket, fSelectEvents, &fEventsRecv, 0);
1715 if (RT_SUCCESS(rc))
1716 {
1717 if (fEventsRecv & RTSOCKET_EVT_READ)
1718 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1719 if (fEventsRecv & RTSOCKET_EVT_WRITE)
1720 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1721 if (fEventsRecv & RTSOCKET_EVT_ERROR)
1722 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1723 break; /* Quit */
1724 }
1725 else if (rc != VERR_TIMEOUT)
1726 break;
1727 }
1728 else if (RT_SUCCESS(rc))
1729 {
1730 size_t cbRead = 0;
1731 uint8_t abBuf[10];
1732 Assert(id == VDSOCKET_POLL_ID_PIPE);
1733 Assert((fEventsRecv & RTPOLL_EVT_VALID_MASK) == RTPOLL_EVT_READ);
1734
1735 /* We got interrupted, drain the pipe. */
1736 rc = RTPipeRead(pSockInt->hPipeR, abBuf, sizeof(abBuf), &cbRead);
1737 AssertRC(rc);
1738
1739 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1740
1741 rc = VERR_INTERRUPTED;
1742 break;
1743 }
1744 else
1745 break;
1746 }
1747 }
1748 else /* The caller waits for a socket event. */
1749 {
1750 uint32_t fEventsRecv = 0;
1751
1752 /* Loop until we got woken up or a socket event occurred. */
1753 for (;;)
1754 {
1755 /** @todo find an adaptive wait algorithm based on the
1756 * number of wakeups in the past. */
1757 rc = RTTcpSelectOneEx(pSockInt->hSocket, fSelectEvents, &fEventsRecv, 5);
1758 if (rc == VERR_TIMEOUT)
1759 {
1760 /* Check if there is an event pending. */
1761 size_t cbRead = 0;
1762 char ch = 0;
1763 rc = RTPipeRead(pSockInt->hPipeR, &ch, 1, &cbRead);
1764 if (RT_SUCCESS(rc) && rc != VINF_TRY_AGAIN)
1765 {
1766 Assert(cbRead == 1);
1767 rc = VERR_INTERRUPTED;
1768 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1769 break; /* Quit */
1770 }
1771 else
1772 Assert(rc == VINF_TRY_AGAIN);
1773 }
1774 else if (RT_SUCCESS(rc))
1775 {
1776 if (fEventsRecv & RTSOCKET_EVT_READ)
1777 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1778 if (fEventsRecv & RTSOCKET_EVT_WRITE)
1779 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1780 if (fEventsRecv & RTSOCKET_EVT_ERROR)
1781 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1782 break; /* Quit */
1783 }
1784 else
1785 break;
1786 }
1787 }
1788 }
1789
1790 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1791
1792 return rc;
1793}
1794
1795/** @interface_method_impl{VDINTERFACETCPNET,pfnPoke} */
1796static DECLCALLBACK(int) drvvdTcpPoke(VDSOCKET hVdSock)
1797{
1798 int rc = VINF_SUCCESS;
1799 size_t cbWritten = 0;
1800 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1801
1802 ASMAtomicXchgBool(&pSockInt->fWokenUp, true);
1803
1804 if (ASMAtomicReadBool(&pSockInt->fWaiting))
1805 {
1806 rc = RTPipeWrite(pSockInt->hPipeW, "", 1, &cbWritten);
1807 Assert(RT_SUCCESS(rc) || cbWritten == 0);
1808 }
1809
1810 return VINF_SUCCESS;
1811}
1812
1813/**
1814 * Checks the prerequisites for encrypted I/O.
1815 *
1816 * @returns VBox status code.
1817 * @param pThis The VD driver instance data.
1818 * @param fSetError Flag whether to set a runtime error.
1819 */
1820static int drvvdKeyCheckPrereqs(PVBOXDISK pThis, bool fSetError)
1821{
1822 if ( pThis->pCfgCrypto
1823 && !pThis->pIfSecKey)
1824 {
1825 AssertPtr(pThis->pIfSecKeyHlp);
1826 pThis->pIfSecKeyHlp->pfnKeyMissingNotify(pThis->pIfSecKeyHlp);
1827
1828 if (fSetError)
1829 {
1830 int rc = PDMDrvHlpVMSetRuntimeError(pThis->pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DEKMISSING",
1831 N_("VD: The DEK for this disk is missing"));
1832 AssertRC(rc);
1833 }
1834 return VERR_VD_DEK_MISSING;
1835 }
1836
1837 return VINF_SUCCESS;
1838}
1839
1840
1841/*********************************************************************************************************************************
1842* Media interface methods *
1843*********************************************************************************************************************************/
1844
1845/** @interface_method_impl{PDMIMEDIA,pfnRead} */
1846static DECLCALLBACK(int) drvvdRead(PPDMIMEDIA pInterface,
1847 uint64_t off, void *pvBuf, size_t cbRead)
1848{
1849 int rc = VINF_SUCCESS;
1850
1851 LogFlowFunc(("off=%#llx pvBuf=%p cbRead=%d\n", off, pvBuf, cbRead));
1852 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
1853
1854 /*
1855 * Check the state.
1856 */
1857 if (!pThis->pDisk)
1858 {
1859 AssertMsgFailed(("Invalid state! Not mounted!\n"));
1860 return VERR_PDM_MEDIA_NOT_MOUNTED;
1861 }
1862
1863 rc = drvvdKeyCheckPrereqs(pThis, true /* fSetError */);
1864 if (RT_FAILURE(rc))
1865 return rc;
1866
1867 if (!pThis->fBootAccelActive)
1868 rc = VDRead(pThis->pDisk, off, pvBuf, cbRead);
1869 else
1870 {
1871 /* Can we serve the request from the buffer? */
1872 if ( off >= pThis->offDisk
1873 && off - pThis->offDisk < pThis->cbDataValid)
1874 {
1875 size_t cbToCopy = RT_MIN(cbRead, pThis->offDisk + pThis->cbDataValid - off);
1876
1877 memcpy(pvBuf, pThis->pbData + (off - pThis->offDisk), cbToCopy);
1878 cbRead -= cbToCopy;
1879 off += cbToCopy;
1880 pvBuf = (char *)pvBuf + cbToCopy;
1881 }
1882
1883 if ( cbRead > 0
1884 && cbRead < pThis->cbBootAccelBuffer)
1885 {
1886 /* Increase request to the buffer size and read. */
1887 pThis->cbDataValid = RT_MIN(pThis->cbDisk - off, pThis->cbBootAccelBuffer);
1888 pThis->offDisk = off;
1889 rc = VDRead(pThis->pDisk, off, pThis->pbData, pThis->cbDataValid);
1890 if (RT_FAILURE(rc))
1891 pThis->cbDataValid = 0;
1892 else
1893 memcpy(pvBuf, pThis->pbData, cbRead);
1894 }
1895 else if (cbRead >= pThis->cbBootAccelBuffer)
1896 {
1897 pThis->fBootAccelActive = false; /* Deactiviate */
1898 }
1899 }
1900
1901 if (RT_SUCCESS(rc))
1902 Log2(("%s: off=%#llx pvBuf=%p cbRead=%d\n%.*Rhxd\n", __FUNCTION__,
1903 off, pvBuf, cbRead, cbRead, pvBuf));
1904 LogFlowFunc(("returns %Rrc\n", rc));
1905 return rc;
1906}
1907
1908/** @interface_method_impl{PDMIMEDIA,pfnRead} */
1909static DECLCALLBACK(int) drvvdReadPcBios(PPDMIMEDIA pInterface,
1910 uint64_t off, void *pvBuf, size_t cbRead)
1911{
1912 int rc = VINF_SUCCESS;
1913
1914 LogFlowFunc(("off=%#llx pvBuf=%p cbRead=%d\n", off, pvBuf, cbRead));
1915 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
1916
1917 /*
1918 * Check the state.
1919 */
1920 if (!pThis->pDisk)
1921 {
1922 AssertMsgFailed(("Invalid state! Not mounted!\n"));
1923 return VERR_PDM_MEDIA_NOT_MOUNTED;
1924 }
1925
1926 if ( pThis->pCfgCrypto
1927 && !pThis->pIfSecKey)
1928 return VERR_VD_DEK_MISSING;
1929
1930 if (!pThis->fBootAccelActive)
1931 rc = VDRead(pThis->pDisk, off, pvBuf, cbRead);
1932 else
1933 {
1934 /* Can we serve the request from the buffer? */
1935 if ( off >= pThis->offDisk
1936 && off - pThis->offDisk < pThis->cbDataValid)
1937 {
1938 size_t cbToCopy = RT_MIN(cbRead, pThis->offDisk + pThis->cbDataValid - off);
1939
1940 memcpy(pvBuf, pThis->pbData + (off - pThis->offDisk), cbToCopy);
1941 cbRead -= cbToCopy;
1942 off += cbToCopy;
1943 pvBuf = (char *)pvBuf + cbToCopy;
1944 }
1945
1946 if ( cbRead > 0
1947 && cbRead < pThis->cbBootAccelBuffer)
1948 {
1949 /* Increase request to the buffer size and read. */
1950 pThis->cbDataValid = RT_MIN(pThis->cbDisk - off, pThis->cbBootAccelBuffer);
1951 pThis->offDisk = off;
1952 rc = VDRead(pThis->pDisk, off, pThis->pbData, pThis->cbDataValid);
1953 if (RT_FAILURE(rc))
1954 pThis->cbDataValid = 0;
1955 else
1956 memcpy(pvBuf, pThis->pbData, cbRead);
1957 }
1958 else if (cbRead >= pThis->cbBootAccelBuffer)
1959 {
1960 pThis->fBootAccelActive = false; /* Deactiviate */
1961 }
1962 }
1963
1964 if (RT_SUCCESS(rc))
1965 Log2(("%s: off=%#llx pvBuf=%p cbRead=%d\n%.*Rhxd\n", __FUNCTION__,
1966 off, pvBuf, cbRead, cbRead, pvBuf));
1967 LogFlowFunc(("returns %Rrc\n", rc));
1968 return rc;
1969}
1970
1971
1972/** @interface_method_impl{PDMIMEDIA,pfnWrite} */
1973static DECLCALLBACK(int) drvvdWrite(PPDMIMEDIA pInterface,
1974 uint64_t off, const void *pvBuf,
1975 size_t cbWrite)
1976{
1977 LogFlowFunc(("off=%#llx pvBuf=%p cbWrite=%d\n", off, pvBuf, cbWrite));
1978 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
1979 Log2(("%s: off=%#llx pvBuf=%p cbWrite=%d\n%.*Rhxd\n", __FUNCTION__,
1980 off, pvBuf, cbWrite, cbWrite, pvBuf));
1981
1982 /*
1983 * Check the state.
1984 */
1985 if (!pThis->pDisk)
1986 {
1987 AssertMsgFailed(("Invalid state! Not mounted!\n"));
1988 return VERR_PDM_MEDIA_NOT_MOUNTED;
1989 }
1990
1991 /* Set an FTM checkpoint as this operation changes the state permanently. */
1992 PDMDrvHlpFTSetCheckpoint(pThis->pDrvIns, FTMCHECKPOINTTYPE_STORAGE);
1993
1994 int rc = drvvdKeyCheckPrereqs(pThis, true /* fSetError */);
1995 if (RT_FAILURE(rc))
1996 return rc;
1997
1998 /* Invalidate any buffer if boot acceleration is enabled. */
1999 if (pThis->fBootAccelActive)
2000 {
2001 pThis->cbDataValid = 0;
2002 pThis->offDisk = 0;
2003 }
2004
2005 rc = VDWrite(pThis->pDisk, off, pvBuf, cbWrite);
2006#ifdef VBOX_PERIODIC_FLUSH
2007 if (pThis->cbFlushInterval)
2008 {
2009 pThis->cbDataWritten += (uint32_t)cbWrite;
2010 if (pThis->cbDataWritten > pThis->cbFlushInterval)
2011 {
2012 pThis->cbDataWritten = 0;
2013 VDFlush(pThis->pDisk);
2014 }
2015 }
2016#endif /* VBOX_PERIODIC_FLUSH */
2017
2018 LogFlowFunc(("returns %Rrc\n", rc));
2019 return rc;
2020}
2021
2022/** @interface_method_impl{PDMIMEDIA,pfnFlush} */
2023static DECLCALLBACK(int) drvvdFlush(PPDMIMEDIA pInterface)
2024{
2025 LogFlowFunc(("\n"));
2026 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2027
2028 /*
2029 * Check the state.
2030 */
2031 if (!pThis->pDisk)
2032 {
2033 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2034 return VERR_PDM_MEDIA_NOT_MOUNTED;
2035 }
2036
2037#ifdef VBOX_IGNORE_FLUSH
2038 if (pThis->fIgnoreFlush)
2039 return VINF_SUCCESS;
2040#endif /* VBOX_IGNORE_FLUSH */
2041
2042 int rc = VDFlush(pThis->pDisk);
2043 LogFlowFunc(("returns %Rrc\n", rc));
2044 return rc;
2045}
2046
2047/** @interface_method_impl{PDMIMEDIA,pfnMerge} */
2048static DECLCALLBACK(int) drvvdMerge(PPDMIMEDIA pInterface,
2049 PFNSIMPLEPROGRESS pfnProgress,
2050 void *pvUser)
2051{
2052 LogFlowFunc(("\n"));
2053 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2054 int rc = VINF_SUCCESS;
2055
2056 /*
2057 * Check the state.
2058 */
2059 if (!pThis->pDisk)
2060 {
2061 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2062 return VERR_PDM_MEDIA_NOT_MOUNTED;
2063 }
2064
2065 /* Note: There is an unavoidable race between destruction and another
2066 * thread invoking this function. This is handled safely and gracefully by
2067 * atomically invalidating the lock handle in drvvdDestruct. */
2068 int rc2 = RTSemFastMutexRequest(pThis->MergeCompleteMutex);
2069 AssertRC(rc2);
2070 if (RT_SUCCESS(rc2) && pThis->fMergePending)
2071 {
2072 /* Take shortcut: PFNSIMPLEPROGRESS is exactly the same type as
2073 * PFNVDPROGRESS, so there's no need for a conversion function. */
2074 /** @todo maybe introduce a conversion which limits update frequency. */
2075 PVDINTERFACE pVDIfsOperation = NULL;
2076 VDINTERFACEPROGRESS VDIfProgress;
2077 VDIfProgress.pfnProgress = pfnProgress;
2078 rc2 = VDInterfaceAdd(&VDIfProgress.Core, "DrvVD_VDIProgress", VDINTERFACETYPE_PROGRESS,
2079 pvUser, sizeof(VDINTERFACEPROGRESS), &pVDIfsOperation);
2080 AssertRC(rc2);
2081 pThis->fMergePending = false;
2082 rc = VDMerge(pThis->pDisk, pThis->uMergeSource,
2083 pThis->uMergeTarget, pVDIfsOperation);
2084 }
2085 rc2 = RTSemFastMutexRelease(pThis->MergeCompleteMutex);
2086 AssertRC(rc2);
2087 LogFlowFunc(("returns %Rrc\n", rc));
2088 return rc;
2089}
2090
2091/** @interface_method_impl{PDMIMEDIA,pfnSetSecKeyIf} */
2092static DECLCALLBACK(int) drvvdSetSecKeyIf(PPDMIMEDIA pInterface, PPDMISECKEY pIfSecKey, PPDMISECKEYHLP pIfSecKeyHlp)
2093{
2094 LogFlowFunc(("\n"));
2095 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2096 int rc = VINF_SUCCESS;
2097
2098 if (pThis->pCfgCrypto)
2099 {
2100 PVDINTERFACE pVDIfFilter = NULL;
2101
2102 pThis->pIfSecKeyHlp = pIfSecKeyHlp;
2103
2104 if ( pThis->pIfSecKey
2105 && !pIfSecKey)
2106 {
2107 /* Unload the crypto filter first to make sure it doesn't access the keys anymore. */
2108 rc = VDFilterRemove(pThis->pDisk, VD_FILTER_FLAGS_DEFAULT);
2109 AssertRC(rc);
2110
2111 pThis->pIfSecKey = NULL;
2112 }
2113
2114 if ( pIfSecKey
2115 && RT_SUCCESS(rc))
2116 {
2117 pThis->pIfSecKey = pIfSecKey;
2118
2119 rc = VDInterfaceAdd(&pThis->VDIfCfg.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
2120 pThis->pCfgCrypto, sizeof(VDINTERFACECONFIG), &pVDIfFilter);
2121 AssertRC(rc);
2122
2123 rc = VDInterfaceAdd(&pThis->VDIfCrypto.Core, "DrvVD_Crypto", VDINTERFACETYPE_CRYPTO,
2124 pThis, sizeof(VDINTERFACECRYPTO), &pVDIfFilter);
2125 AssertRC(rc);
2126
2127 /* Load the crypt filter plugin. */
2128 rc = VDFilterAdd(pThis->pDisk, "CRYPT", VD_FILTER_FLAGS_DEFAULT, pVDIfFilter);
2129 if (RT_FAILURE(rc))
2130 pThis->pIfSecKey = NULL;
2131 }
2132 }
2133 else
2134 rc = VERR_NOT_SUPPORTED;
2135
2136 LogFlowFunc(("returns %Rrc\n", rc));
2137 return rc;
2138}
2139
2140/** @interface_method_impl{PDMIMEDIA,pfnGetSize} */
2141static DECLCALLBACK(uint64_t) drvvdGetSize(PPDMIMEDIA pInterface)
2142{
2143 LogFlowFunc(("\n"));
2144 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2145
2146 /*
2147 * Check the state.
2148 */
2149 if (!pThis->pDisk)
2150 return 0;
2151
2152 uint64_t cb = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
2153 LogFlowFunc(("returns %#llx (%llu)\n", cb, cb));
2154 return cb;
2155}
2156
2157/** @interface_method_impl{PDMIMEDIA,pfnGetSectorSize} */
2158static DECLCALLBACK(uint32_t) drvvdGetSectorSize(PPDMIMEDIA pInterface)
2159{
2160 LogFlowFunc(("\n"));
2161 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2162
2163 /*
2164 * Check the state.
2165 */
2166 if (!pThis->pDisk)
2167 return 0;
2168
2169 uint32_t cb = VDGetSectorSize(pThis->pDisk, VD_LAST_IMAGE);
2170 LogFlowFunc(("returns %u\n", cb));
2171 return cb;
2172}
2173
2174/** @interface_method_impl{PDMIMEDIA,pfnIsReadOnly} */
2175static DECLCALLBACK(bool) drvvdIsReadOnly(PPDMIMEDIA pInterface)
2176{
2177 LogFlowFunc(("\n"));
2178 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2179
2180 /*
2181 * Check the state.
2182 */
2183 if (!pThis->pDisk)
2184 return false;
2185
2186 bool f = VDIsReadOnly(pThis->pDisk);
2187 LogFlowFunc(("returns %d\n", f));
2188 return f;
2189}
2190
2191/** @interface_method_impl{PDMIMEDIA,pfnIsNonRotational} */
2192static DECLCALLBACK(bool) drvvdIsNonRotational(PPDMIMEDIA pInterface)
2193{
2194 LogFlowFunc(("\n"));
2195 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2196
2197 return pThis->fNonRotational;
2198}
2199
2200/** @interface_method_impl{PDMIMEDIA,pfnBiosGetPCHSGeometry} */
2201static DECLCALLBACK(int) drvvdBiosGetPCHSGeometry(PPDMIMEDIA pInterface,
2202 PPDMMEDIAGEOMETRY pPCHSGeometry)
2203{
2204 LogFlowFunc(("\n"));
2205 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2206 VDGEOMETRY geo;
2207
2208 /*
2209 * Check the state.
2210 */
2211 if (!pThis->pDisk)
2212 return VERR_PDM_MEDIA_NOT_MOUNTED;
2213
2214 /*
2215 * Use configured/cached values if present.
2216 */
2217 if ( pThis->PCHSGeometry.cCylinders > 0
2218 && pThis->PCHSGeometry.cHeads > 0
2219 && pThis->PCHSGeometry.cSectors > 0)
2220 {
2221 *pPCHSGeometry = pThis->PCHSGeometry;
2222 LogFlow(("%s: returns VINF_SUCCESS {%d,%d,%d}\n", __FUNCTION__, pThis->PCHSGeometry.cCylinders, pThis->PCHSGeometry.cHeads, pThis->PCHSGeometry.cSectors));
2223 return VINF_SUCCESS;
2224 }
2225
2226 int rc = VDGetPCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2227 if (RT_SUCCESS(rc))
2228 {
2229 pPCHSGeometry->cCylinders = geo.cCylinders;
2230 pPCHSGeometry->cHeads = geo.cHeads;
2231 pPCHSGeometry->cSectors = geo.cSectors;
2232 pThis->PCHSGeometry = *pPCHSGeometry;
2233 }
2234 else
2235 {
2236 LogFunc(("geometry not available.\n"));
2237 rc = VERR_PDM_GEOMETRY_NOT_SET;
2238 }
2239 LogFlowFunc(("returns %Rrc (CHS=%d/%d/%d)\n",
2240 rc, pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
2241 return rc;
2242}
2243
2244/** @interface_method_impl{PDMIMEDIA,pfnBiosSetPCHSGeometry} */
2245static DECLCALLBACK(int) drvvdBiosSetPCHSGeometry(PPDMIMEDIA pInterface,
2246 PCPDMMEDIAGEOMETRY pPCHSGeometry)
2247{
2248 LogFlowFunc(("CHS=%d/%d/%d\n",
2249 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
2250 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2251 VDGEOMETRY geo;
2252
2253 /*
2254 * Check the state.
2255 */
2256 if (!pThis->pDisk)
2257 {
2258 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2259 return VERR_PDM_MEDIA_NOT_MOUNTED;
2260 }
2261
2262 geo.cCylinders = pPCHSGeometry->cCylinders;
2263 geo.cHeads = pPCHSGeometry->cHeads;
2264 geo.cSectors = pPCHSGeometry->cSectors;
2265 int rc = VDSetPCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2266 if (rc == VERR_VD_GEOMETRY_NOT_SET)
2267 rc = VERR_PDM_GEOMETRY_NOT_SET;
2268 if (RT_SUCCESS(rc))
2269 pThis->PCHSGeometry = *pPCHSGeometry;
2270 LogFlowFunc(("returns %Rrc\n", rc));
2271 return rc;
2272}
2273
2274/** @interface_method_impl{PDMIMEDIA,pfnBiosGetLCHSGeometry} */
2275static DECLCALLBACK(int) drvvdBiosGetLCHSGeometry(PPDMIMEDIA pInterface,
2276 PPDMMEDIAGEOMETRY pLCHSGeometry)
2277{
2278 LogFlowFunc(("\n"));
2279 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2280 VDGEOMETRY geo;
2281
2282 /*
2283 * Check the state.
2284 */
2285 if (!pThis->pDisk)
2286 return VERR_PDM_MEDIA_NOT_MOUNTED;
2287
2288 /*
2289 * Use configured/cached values if present.
2290 */
2291 if ( pThis->LCHSGeometry.cCylinders > 0
2292 && pThis->LCHSGeometry.cHeads > 0
2293 && pThis->LCHSGeometry.cSectors > 0)
2294 {
2295 *pLCHSGeometry = pThis->LCHSGeometry;
2296 LogFlow(("%s: returns VINF_SUCCESS {%d,%d,%d}\n", __FUNCTION__, pThis->LCHSGeometry.cCylinders, pThis->LCHSGeometry.cHeads, pThis->LCHSGeometry.cSectors));
2297 return VINF_SUCCESS;
2298 }
2299
2300 int rc = VDGetLCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2301 if (RT_SUCCESS(rc))
2302 {
2303 pLCHSGeometry->cCylinders = geo.cCylinders;
2304 pLCHSGeometry->cHeads = geo.cHeads;
2305 pLCHSGeometry->cSectors = geo.cSectors;
2306 pThis->LCHSGeometry = *pLCHSGeometry;
2307 }
2308 else
2309 {
2310 LogFunc(("geometry not available.\n"));
2311 rc = VERR_PDM_GEOMETRY_NOT_SET;
2312 }
2313 LogFlowFunc(("returns %Rrc (CHS=%d/%d/%d)\n",
2314 rc, pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
2315 return rc;
2316}
2317
2318/** @interface_method_impl{PDMIMEDIA,pfnBiosSetLCHSGeometry} */
2319static DECLCALLBACK(int) drvvdBiosSetLCHSGeometry(PPDMIMEDIA pInterface,
2320 PCPDMMEDIAGEOMETRY pLCHSGeometry)
2321{
2322 LogFlowFunc(("CHS=%d/%d/%d\n",
2323 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
2324 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2325 VDGEOMETRY geo;
2326
2327 /*
2328 * Check the state.
2329 */
2330 if (!pThis->pDisk)
2331 {
2332 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2333 return VERR_PDM_MEDIA_NOT_MOUNTED;
2334 }
2335
2336 geo.cCylinders = pLCHSGeometry->cCylinders;
2337 geo.cHeads = pLCHSGeometry->cHeads;
2338 geo.cSectors = pLCHSGeometry->cSectors;
2339 int rc = VDSetLCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2340 if (rc == VERR_VD_GEOMETRY_NOT_SET)
2341 rc = VERR_PDM_GEOMETRY_NOT_SET;
2342 if (RT_SUCCESS(rc))
2343 pThis->LCHSGeometry = *pLCHSGeometry;
2344 LogFlowFunc(("returns %Rrc\n", rc));
2345 return rc;
2346}
2347
2348/** @interface_method_impl{PDMIMEDIA,pfnBiosIsVisible} */
2349static DECLCALLBACK(bool) drvvdBiosIsVisible(PPDMIMEDIA pInterface)
2350{
2351 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2352 LogFlow(("drvvdBiosIsVisible: returns %d\n", pThis->fBiosVisible));
2353 return pThis->fBiosVisible;
2354}
2355
2356/** @interface_method_impl{PDMIMEDIA,pfnGetType} */
2357static DECLCALLBACK(PDMMEDIATYPE) drvvdGetType(PPDMIMEDIA pInterface)
2358{
2359 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2360 LogFlow(("drvvdBiosIsVisible: returns %d\n", pThis->fBiosVisible));
2361 return pThis->enmType;
2362}
2363
2364/** @interface_method_impl{PDMIMEDIA,pfnGetUuid} */
2365static DECLCALLBACK(int) drvvdGetUuid(PPDMIMEDIA pInterface, PRTUUID pUuid)
2366{
2367 LogFlowFunc(("\n"));
2368 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2369
2370 /*
2371 * Copy the uuid.
2372 */
2373 *pUuid = pThis->Uuid;
2374 LogFlowFunc(("returns {%RTuuid}\n", pUuid));
2375 return VINF_SUCCESS;
2376}
2377
2378static DECLCALLBACK(int) drvvdDiscard(PPDMIMEDIA pInterface, PCRTRANGE paRanges, unsigned cRanges)
2379{
2380 LogFlowFunc(("\n"));
2381 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2382
2383 int rc = VDDiscardRanges(pThis->pDisk, paRanges, cRanges);
2384 LogFlowFunc(("returns %Rrc\n", rc));
2385 return rc;
2386}
2387
2388/* -=-=-=-=- IMount -=-=-=-=- */
2389
2390/** @interface_method_impl{PDMIMOUNT,pfnUnmount} */
2391static DECLCALLBACK(int) drvvdUnmount(PPDMIMOUNT pInterface, bool fForce, bool fEject)
2392{
2393 RT_NOREF(fEject);
2394 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2395
2396 /*
2397 * Validate state.
2398 */
2399 if (!pThis->pDisk)
2400 {
2401 Log(("drvvdUnmount: Not mounted\n"));
2402 return VERR_PDM_MEDIA_NOT_MOUNTED;
2403 }
2404 if (pThis->fLocked && !fForce)
2405 {
2406 Log(("drvvdUnmount: Locked\n"));
2407 return VERR_PDM_MEDIA_LOCKED;
2408 }
2409
2410 /* Media is no longer locked even if it was previously. */
2411 pThis->fLocked = false;
2412 drvvdPowerOffOrDestructOrUnmount(pThis->pDrvIns);
2413
2414 /*
2415 * Notify driver/device above us.
2416 */
2417 if (pThis->pDrvMountNotify)
2418 pThis->pDrvMountNotify->pfnUnmountNotify(pThis->pDrvMountNotify);
2419 Log(("drvblockUnmount: success\n"));
2420 return VINF_SUCCESS;
2421}
2422
2423
2424/** @interface_method_impl{PDMIMOUNT,pfnIsMounted} */
2425static DECLCALLBACK(bool) drvvdIsMounted(PPDMIMOUNT pInterface)
2426{
2427 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2428 return pThis->pDisk != NULL;
2429}
2430
2431/** @interface_method_impl{PDMIMOUNT,pfnLock} */
2432static DECLCALLBACK(int) drvvdLock(PPDMIMOUNT pInterface)
2433{
2434 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2435 Log(("drvblockLock: %d -> %d\n", pThis->fLocked, true));
2436 pThis->fLocked = true;
2437 return VINF_SUCCESS;
2438}
2439
2440/** @interface_method_impl{PDMIMOUNT,pfnUnlock} */
2441static DECLCALLBACK(int) drvvdUnlock(PPDMIMOUNT pInterface)
2442{
2443 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2444 Log(("drvblockUnlock: %d -> %d\n", pThis->fLocked, false));
2445 pThis->fLocked = false;
2446 return VINF_SUCCESS;
2447}
2448
2449/** @interface_method_impl{PDMIMOUNT,pfnIsLocked} */
2450static DECLCALLBACK(bool) drvvdIsLocked(PPDMIMOUNT pInterface)
2451{
2452 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2453 return pThis->fLocked;
2454}
2455
2456
2457static DECLCALLBACK(void) drvvdBlkCacheReqComplete(void *pvUser1, void *pvUser2, int rcReq)
2458{
2459 PVBOXDISK pThis = (PVBOXDISK)pvUser1;
2460
2461 AssertPtr(pThis->pBlkCache);
2462 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, (PPDMBLKCACHEIOXFER)pvUser2, rcReq);
2463}
2464
2465
2466/** @copydoc FNPDMBLKCACHEXFERCOMPLETEDRV */
2467static DECLCALLBACK(void) drvvdBlkCacheXferCompleteIoReq(PPDMDRVINS pDrvIns, void *pvUser, int rc)
2468{
2469 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2470
2471 drvvdMediaExIoReqCompleteWorker(pThis, (PPDMMEDIAEXIOREQINT)pvUser, rc, true /* fUpNotify */);
2472}
2473
2474/** @copydoc FNPDMBLKCACHEXFERENQUEUEDRV */
2475static DECLCALLBACK(int) drvvdBlkCacheXferEnqueue(PPDMDRVINS pDrvIns,
2476 PDMBLKCACHEXFERDIR enmXferDir,
2477 uint64_t off, size_t cbXfer,
2478 PCRTSGBUF pSgBuf, PPDMBLKCACHEIOXFER hIoXfer)
2479{
2480 int rc = VINF_SUCCESS;
2481 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2482
2483 Assert (!pThis->pCfgCrypto);
2484
2485 switch (enmXferDir)
2486 {
2487 case PDMBLKCACHEXFERDIR_READ:
2488 rc = VDAsyncRead(pThis->pDisk, off, cbXfer, pSgBuf, drvvdBlkCacheReqComplete,
2489 pThis, hIoXfer);
2490 break;
2491 case PDMBLKCACHEXFERDIR_WRITE:
2492 rc = VDAsyncWrite(pThis->pDisk, off, cbXfer, pSgBuf, drvvdBlkCacheReqComplete,
2493 pThis, hIoXfer);
2494 break;
2495 case PDMBLKCACHEXFERDIR_FLUSH:
2496 rc = VDAsyncFlush(pThis->pDisk, drvvdBlkCacheReqComplete, pThis, hIoXfer);
2497 break;
2498 default:
2499 AssertMsgFailed(("Invalid transfer type %d\n", enmXferDir));
2500 rc = VERR_INVALID_PARAMETER;
2501 }
2502
2503 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2504 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, VINF_SUCCESS);
2505 else if (RT_FAILURE(rc) && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2506 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, rc);
2507
2508 return VINF_SUCCESS;
2509}
2510
2511/** @copydoc FNPDMBLKCACHEXFERENQUEUEDISCARDDRV */
2512static DECLCALLBACK(int) drvvdBlkCacheXferEnqueueDiscard(PPDMDRVINS pDrvIns, PCRTRANGE paRanges,
2513 unsigned cRanges, PPDMBLKCACHEIOXFER hIoXfer)
2514{
2515 int rc = VINF_SUCCESS;
2516 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2517
2518 rc = VDAsyncDiscardRanges(pThis->pDisk, paRanges, cRanges,
2519 drvvdBlkCacheReqComplete, pThis, hIoXfer);
2520
2521 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2522 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, VINF_SUCCESS);
2523 else if (RT_FAILURE(rc) && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2524 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, rc);
2525
2526 return VINF_SUCCESS;
2527}
2528
2529
2530/*********************************************************************************************************************************
2531* Extended media interface methods *
2532*********************************************************************************************************************************/
2533
2534static void drvvdMediaExIoReqWarningDiskFull(PPDMDRVINS pDrvIns)
2535{
2536 int rc;
2537 LogRel(("VD#%u: Host disk full\n", pDrvIns->iInstance));
2538 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DISKFULL",
2539 N_("Host system reported disk full. VM execution is suspended. You can resume after freeing some space"));
2540 AssertRC(rc);
2541}
2542
2543static void drvvdMediaExIoReqWarningFileTooBig(PPDMDRVINS pDrvIns)
2544{
2545 int rc;
2546 LogRel(("VD#%u: File too big\n", pDrvIns->iInstance));
2547 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_FILETOOBIG",
2548 N_("Host system reported that the file size limit of the host file system has been exceeded. VM execution is suspended. You need to move your virtual hard disk to a filesystem which allows bigger files"));
2549 AssertRC(rc);
2550}
2551
2552static void drvvdMediaExIoReqWarningISCSI(PPDMDRVINS pDrvIns)
2553{
2554 int rc;
2555 LogRel(("VD#%u: iSCSI target unavailable\n", pDrvIns->iInstance));
2556 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_ISCSIDOWN",
2557 N_("The iSCSI target has stopped responding. VM execution is suspended. You can resume when it is available again"));
2558 AssertRC(rc);
2559}
2560
2561static void drvvdMediaExIoReqWarningDekMissing(PPDMDRVINS pDrvIns)
2562{
2563 LogRel(("VD#%u: DEK is missing\n", pDrvIns->iInstance));
2564 int rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DEKMISSING",
2565 N_("VD: The DEK for this disk is missing"));
2566 AssertRC(rc);
2567}
2568
2569/**
2570 * Checks whether a given status code indicates a recoverable error
2571 * suspending the VM if it is.
2572 *
2573 * @returns Flag indicating whether the status code is a recoverable error
2574 * (full disk, broken network connection).
2575 * @param pThis VBox disk container instance data.
2576 * @param rc Status code to check.
2577 */
2578bool drvvdMediaExIoReqIsRedoSetWarning(PVBOXDISK pThis, int rc)
2579{
2580 if (rc == VERR_DISK_FULL)
2581 {
2582 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2583 drvvdMediaExIoReqWarningDiskFull(pThis->pDrvIns);
2584 return true;
2585 }
2586 if (rc == VERR_FILE_TOO_BIG)
2587 {
2588 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2589 drvvdMediaExIoReqWarningFileTooBig(pThis->pDrvIns);
2590 return true;
2591 }
2592 if (rc == VERR_BROKEN_PIPE || rc == VERR_NET_CONNECTION_REFUSED)
2593 {
2594 /* iSCSI connection abort (first error) or failure to reestablish
2595 * connection (second error). Pause VM. On resume we'll retry. */
2596 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2597 drvvdMediaExIoReqWarningISCSI(pThis->pDrvIns);
2598 return true;
2599 }
2600 if (rc == VERR_VD_DEK_MISSING)
2601 {
2602 /* Error message already set. */
2603 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2604 drvvdMediaExIoReqWarningDekMissing(pThis->pDrvIns);
2605 return true;
2606 }
2607
2608 return false;
2609}
2610
2611/**
2612 * Syncs the memory buffers between the I/O request allocator and the internal buffer.
2613 *
2614 * @returns VBox status code.
2615 * @param pThis VBox disk container instance data.
2616 * @param pIoReq I/O request to sync.
2617 * @param fToIoBuf Flag indicating the sync direction.
2618 * true to copy data from the allocators buffer to our internal buffer.
2619 * false for the other direction.
2620 */
2621DECLINLINE(int) drvvdMediaExIoReqBufSync(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fToIoBuf)
2622{
2623 int rc = VINF_SUCCESS;
2624
2625 Assert(pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE);
2626 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
2627
2628 /* Make sure the buffer is reset. */
2629 RTSgBufReset(&pIoReq->ReadWrite.IoBuf.SgBuf);
2630
2631 size_t const offSrc = pIoReq->ReadWrite.cbReq - pIoReq->ReadWrite.cbReqLeft;
2632 Assert((uint32_t)offSrc == offSrc);
2633 if (fToIoBuf)
2634 rc = pThis->pDrvMediaExPort->pfnIoReqCopyToBuf(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0], (uint32_t)offSrc,
2635 &pIoReq->ReadWrite.IoBuf.SgBuf,
2636 RT_MIN(pIoReq->ReadWrite.cbIoBuf, pIoReq->ReadWrite.cbReqLeft));
2637 else
2638 rc = pThis->pDrvMediaExPort->pfnIoReqCopyFromBuf(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0], (uint32_t)offSrc,
2639 &pIoReq->ReadWrite.IoBuf.SgBuf,
2640 (uint32_t)RT_MIN(pIoReq->ReadWrite.cbIoBuf, pIoReq->ReadWrite.cbReqLeft));
2641
2642 RTSgBufReset(&pIoReq->ReadWrite.IoBuf.SgBuf);
2643 return rc;
2644}
2645
2646/**
2647 * Hashes the I/O request ID to an index for the allocated I/O request bin.
2648 */
2649DECLINLINE(unsigned) drvvdMediaExIoReqIdHash(PDMMEDIAEXIOREQID uIoReqId)
2650{
2651 return uIoReqId % DRVVD_VDIOREQ_ALLOC_BINS; /** @todo Find something better? */
2652}
2653
2654/**
2655 * Inserts the given I/O request in to the list of allocated I/O requests.
2656 *
2657 * @returns VBox status code.
2658 * @param pThis VBox disk container instance data.
2659 * @param pIoReq I/O request to insert.
2660 */
2661static int drvvdMediaExIoReqInsert(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
2662{
2663 int rc = VINF_SUCCESS;
2664 unsigned idxBin = drvvdMediaExIoReqIdHash(pIoReq->uIoReqId);
2665
2666 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2667 if (RT_SUCCESS(rc))
2668 {
2669 /* Search for conflicting I/O request ID. */
2670 PPDMMEDIAEXIOREQINT pIt;
2671 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
2672 {
2673 if (RT_UNLIKELY(pIt->uIoReqId == pIoReq->uIoReqId))
2674 {
2675 rc = VERR_PDM_MEDIAEX_IOREQID_CONFLICT;
2676 break;
2677 }
2678 }
2679 if (RT_SUCCESS(rc))
2680 RTListAppend(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, &pIoReq->NdAllocatedList);
2681 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2682 }
2683
2684 return rc;
2685}
2686
2687/**
2688 * Removes the given I/O request from the list of allocated I/O requests.
2689 *
2690 * @returns VBox status code.
2691 * @param pThis VBox disk container instance data.
2692 * @param pIoReq I/O request to insert.
2693 */
2694static int drvvdMediaExIoReqRemove(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
2695{
2696 int rc = VINF_SUCCESS;
2697 unsigned idxBin = drvvdMediaExIoReqIdHash(pIoReq->uIoReqId);
2698
2699 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2700 if (RT_SUCCESS(rc))
2701 {
2702 RTListNodeRemove(&pIoReq->NdAllocatedList);
2703 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2704 }
2705
2706 return rc;
2707}
2708
2709/**
2710 * Retires a given I/O request marking it as complete and notiyfing the
2711 * device/driver above about the completion if requested.
2712 *
2713 * @returns VBox status code.
2714 * @param pThis VBox disk container instance data.
2715 * @param pIoReq I/O request to complete.
2716 * @param rcReq The status code the request completed with.
2717 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
2718 */
2719static void drvvdMediaExIoReqRetire(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify)
2720{
2721 LogFlowFunc(("pThis=%#p pIoReq=%#p rcReq=%Rrc fUpNotify=%RTbool\n",
2722 pThis, pIoReq, rcReq, fUpNotify));
2723
2724 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_COMPLETING, VDIOREQSTATE_ACTIVE);
2725 if (fXchg)
2726 ASMAtomicDecU32(&pThis->cIoReqsActive);
2727 else
2728 {
2729 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
2730 rcReq = VERR_PDM_MEDIAEX_IOREQ_CANCELED;
2731 }
2732
2733 ASMAtomicXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_COMPLETED);
2734 drvvdMediaExIoReqBufFree(pThis, pIoReq);
2735
2736 /*
2737 * Leave a release log entry if the request was active for more than 25 seconds
2738 * (30 seconds is the timeout of the guest).
2739 */
2740 uint64_t tsNow = RTTimeMilliTS();
2741 if (tsNow - pIoReq->tsSubmit >= 25 * 1000)
2742 {
2743 const char *pcszReq = NULL;
2744
2745 switch (pIoReq->enmType)
2746 {
2747 case PDMMEDIAEXIOREQTYPE_READ:
2748 pcszReq = "Read";
2749 break;
2750 case PDMMEDIAEXIOREQTYPE_WRITE:
2751 pcszReq = "Write";
2752 break;
2753 case PDMMEDIAEXIOREQTYPE_FLUSH:
2754 pcszReq = "Flush";
2755 break;
2756 case PDMMEDIAEXIOREQTYPE_DISCARD:
2757 pcszReq = "Discard";
2758 break;
2759 default:
2760 pcszReq = "<Invalid>";
2761 }
2762
2763 LogRel(("VD#%u: %s request was active for %llu seconds\n",
2764 pThis->pDrvIns->iInstance, pcszReq, (tsNow - pIoReq->tsSubmit) / 1000));
2765 }
2766
2767 if (RT_FAILURE(rcReq))
2768 {
2769 /* Log the error. */
2770 if (pThis->cErrors++ < DRVVD_MAX_LOG_REL_ERRORS)
2771 {
2772 if (rcReq == VERR_PDM_MEDIAEX_IOREQ_CANCELED)
2773 {
2774 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
2775 LogRel(("VD#%u: Aborted flush returned rc=%Rrc\n",
2776 pThis->pDrvIns->iInstance, rcReq));
2777 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
2778 LogRel(("VD#%u: Aborted discard returned rc=%Rrc\n",
2779 pThis->pDrvIns->iInstance, rcReq));
2780 else
2781 LogRel(("VD#%u: Aborted %s (%u bytes left) returned rc=%Rrc\n",
2782 pThis->pDrvIns->iInstance,
2783 pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
2784 ? "read"
2785 : "write",
2786 pIoReq->ReadWrite.cbReqLeft, rcReq));
2787 }
2788 else
2789 {
2790 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
2791 LogRel(("VD#%u: Flush returned rc=%Rrc\n",
2792 pThis->pDrvIns->iInstance, rcReq));
2793 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
2794 LogRel(("VD#%u: Discard returned rc=%Rrc\n",
2795 pThis->pDrvIns->iInstance, rcReq));
2796 else
2797 LogRel(("VD#%u: %s (%u bytes left) returned rc=%Rrc\n",
2798 pThis->pDrvIns->iInstance,
2799 pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
2800 ? "Read"
2801 : "Write",
2802 pIoReq->ReadWrite.cbReqLeft, rcReq));
2803 }
2804 }
2805 }
2806
2807 if (fUpNotify)
2808 {
2809 int rc = pThis->pDrvMediaExPort->pfnIoReqCompleteNotify(pThis->pDrvMediaExPort,
2810 pIoReq, &pIoReq->abAlloc[0], rcReq);
2811 AssertRC(rc);
2812 }
2813
2814 LogFlowFunc(("returns\n"));
2815}
2816
2817/**
2818 * I/O request completion worker.
2819 *
2820 * @returns VBox status code.
2821 * @param pThis VBox disk container instance data.
2822 * @param pIoReq I/O request to complete.
2823 * @param rcReq The status code the request completed with.
2824 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
2825 */
2826static int drvvdMediaExIoReqCompleteWorker(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify)
2827{
2828 LogFlowFunc(("pThis=%#p pIoReq=%#p rcReq=%Rrc fUpNotify=%RTbool\n",
2829 pThis, pIoReq, rcReq, fUpNotify));
2830
2831 /*
2832 * For a read we need to sync the memory before continuing to process
2833 * the request further.
2834 */
2835 if ( RT_SUCCESS(rcReq)
2836 && pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
2837 rcReq = drvvdMediaExIoReqBufSync(pThis, pIoReq, false /* fToIoBuf */);
2838
2839 /*
2840 * When the request owner instructs us to handle recoverable errors like full disks
2841 * do it. Mark the request as suspended, notify the owner and put the request on the
2842 * redo list.
2843 */
2844 if ( RT_FAILURE(rcReq)
2845 && (pIoReq->fFlags & PDMIMEDIAEX_F_SUSPEND_ON_RECOVERABLE_ERR)
2846 && drvvdMediaExIoReqIsRedoSetWarning(pThis, rcReq))
2847 {
2848 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_SUSPENDED, VDIOREQSTATE_ACTIVE);
2849 if (fXchg)
2850 {
2851 /* Put on redo list and adjust active request counter. */
2852 RTCritSectEnter(&pThis->CritSectIoReqRedo);
2853 RTListAppend(&pThis->LstIoReqRedo, &pIoReq->NdLstWait);
2854 RTCritSectLeave(&pThis->CritSectIoReqRedo);
2855 ASMAtomicDecU32(&pThis->cIoReqsActive);
2856 pThis->pDrvMediaExPort->pfnIoReqStateChanged(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
2857 PDMMEDIAEXIOREQSTATE_SUSPENDED);
2858 rcReq = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
2859 }
2860 else
2861 {
2862 /* Request was canceled inbetween, so don't care and notify the owner about the completed request. */
2863 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
2864 drvvdMediaExIoReqRetire(pThis, pIoReq, rcReq, fUpNotify);
2865 }
2866 }
2867 else
2868 {
2869 /* Adjust the remaining amount to transfer. */
2870 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
2871
2872 size_t cbReqIo = RT_MIN(pIoReq->ReadWrite.cbReqLeft, pIoReq->ReadWrite.cbIoBuf);
2873 pIoReq->ReadWrite.offStart += cbReqIo;
2874 pIoReq->ReadWrite.cbReqLeft -= cbReqIo;
2875
2876 if ( RT_FAILURE(rcReq)
2877 || !pIoReq->ReadWrite.cbReqLeft
2878 || ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ
2879 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE))
2880 drvvdMediaExIoReqRetire(pThis, pIoReq, rcReq, fUpNotify);
2881 else
2882 drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, fUpNotify);
2883 }
2884
2885 LogFlowFunc(("returns %Rrc\n", rcReq));
2886 return rcReq;
2887}
2888
2889
2890/**
2891 * Allocates a memory buffer suitable for I/O for the given request.
2892 *
2893 * @returns VBox status code.
2894 * @retval VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS if there is no I/O memory available to allocate and
2895 * the request was placed on a waiting list.
2896 * @param pThis VBox disk container instance data.
2897 * @param pIoReq I/O request to allocate memory for.
2898 * @param cb Size of the buffer.
2899 */
2900DECLINLINE(int) drvvdMediaExIoReqBufAlloc(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cb)
2901{
2902 LogFlowFunc(("pThis=%#p pIoReq=%#p cb=%zu\n", pThis, pIoReq, cb));
2903
2904 int rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReq->ReadWrite.IoBuf, cb, &pIoReq->ReadWrite.cbIoBuf);
2905 if (rc == VERR_NO_MEMORY)
2906 {
2907 LogFlowFunc(("Could not allocate memory for request, deferring\n"));
2908 RTCritSectEnter(&pThis->CritSectIoReqsIoBufWait);
2909 RTListAppend(&pThis->LstIoReqIoBufWait, &pIoReq->NdLstWait);
2910 RTCritSectLeave(&pThis->CritSectIoReqsIoBufWait);
2911 ASMAtomicIncU32(&pThis->cIoReqsWaiting);
2912 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
2913 }
2914 else
2915 {
2916 LogFlowFunc(("Allocated %zu bytes of memory\n", pIoReq->ReadWrite.cbIoBuf));
2917 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
2918 }
2919
2920 LogFlowFunc(("returns %Rrc\n", rc));
2921 return rc;
2922}
2923
2924/**
2925 * Wrapper around the various ways to read from the underlying medium (cache, async vs. sync).
2926 *
2927 * @returns VBox status code.
2928 * @param pThis VBox disk container instance data.
2929 * @param pIoReq I/O request to process.
2930 * @param cbReqIo Transfer size.
2931 * @param pcbReqIo Where to store the amount of transferred data.
2932 */
2933static int drvvdMediaExIoReqReadWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cbReqIo, size_t *pcbReqIo)
2934{
2935 int rc = VINF_SUCCESS;
2936
2937 LogFlowFunc(("pThis=%#p pIoReq=%#p cbReqIo=%zu pcbReqIo=%#p\n", pThis, pIoReq, cbReqIo, pcbReqIo));
2938
2939 Assert(cbReqIo > 0);
2940
2941 if ( pThis->fAsyncIOSupported
2942 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
2943 {
2944 if (pThis->pBlkCache)
2945 {
2946 rc = PDMR3BlkCacheRead(pThis->pBlkCache, pIoReq->ReadWrite.offStart,
2947 &pIoReq->ReadWrite.IoBuf.SgBuf, cbReqIo, pIoReq);
2948 if (rc == VINF_SUCCESS)
2949 rc = VINF_VD_ASYNC_IO_FINISHED;
2950 else if (rc == VINF_AIO_TASK_PENDING)
2951 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
2952 }
2953 else
2954 rc = VDAsyncRead(pThis->pDisk, pIoReq->ReadWrite.offStart, cbReqIo, &pIoReq->ReadWrite.IoBuf.SgBuf,
2955 drvvdMediaExIoReqComplete, pThis, pIoReq);
2956 }
2957 else
2958 {
2959 void *pvBuf = RTSgBufGetNextSegment(&pIoReq->ReadWrite.IoBuf.SgBuf, &cbReqIo);
2960
2961 Assert(cbReqIo > 0 && VALID_PTR(pvBuf));
2962 rc = VDRead(pThis->pDisk, pIoReq->ReadWrite.offStart, pvBuf, cbReqIo);
2963 if (RT_SUCCESS(rc))
2964 rc = VINF_VD_ASYNC_IO_FINISHED;
2965 }
2966
2967 *pcbReqIo = cbReqIo;
2968
2969 LogFlowFunc(("returns %Rrc *pcbReqIo=%zu\n", rc, *pcbReqIo));
2970 return rc;
2971}
2972
2973/**
2974 * Wrapper around the various ways to write to the underlying medium (cache, async vs. sync).
2975 *
2976 * @returns VBox status code.
2977 * @param pThis VBox disk container instance data.
2978 * @param pIoReq I/O request to process.
2979 * @param cbReqIo Transfer size.
2980 * @param pcbReqIo Where to store the amount of transferred data.
2981 */
2982static int drvvdMediaExIoReqWriteWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cbReqIo, size_t *pcbReqIo)
2983{
2984 int rc = VINF_SUCCESS;
2985
2986 Assert(cbReqIo > 0);
2987
2988 LogFlowFunc(("pThis=%#p pIoReq=%#p cbReqIo=%zu pcbReqIo=%#p\n", pThis, pIoReq, cbReqIo, pcbReqIo));
2989
2990 if ( pThis->fAsyncIOSupported
2991 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
2992 {
2993 if (pThis->pBlkCache)
2994 {
2995 rc = PDMR3BlkCacheWrite(pThis->pBlkCache, pIoReq->ReadWrite.offStart,
2996 &pIoReq->ReadWrite.IoBuf.SgBuf, cbReqIo, pIoReq);
2997 if (rc == VINF_SUCCESS)
2998 rc = VINF_VD_ASYNC_IO_FINISHED;
2999 else if (rc == VINF_AIO_TASK_PENDING)
3000 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3001 }
3002 else
3003 rc = VDAsyncWrite(pThis->pDisk, pIoReq->ReadWrite.offStart, cbReqIo, &pIoReq->ReadWrite.IoBuf.SgBuf,
3004 drvvdMediaExIoReqComplete, pThis, pIoReq);
3005 }
3006 else
3007 {
3008 void *pvBuf = RTSgBufGetNextSegment(&pIoReq->ReadWrite.IoBuf.SgBuf, &cbReqIo);
3009
3010 Assert(cbReqIo > 0 && VALID_PTR(pvBuf));
3011 rc = VDWrite(pThis->pDisk, pIoReq->ReadWrite.offStart, pvBuf, cbReqIo);
3012 if (RT_SUCCESS(rc))
3013 rc = VINF_VD_ASYNC_IO_FINISHED;
3014 }
3015
3016 *pcbReqIo = cbReqIo;
3017
3018 LogFlowFunc(("returns %Rrc *pcbReqIo=%zu\n", rc, *pcbReqIo));
3019 return rc;
3020}
3021
3022/**
3023 * Wrapper around the various ways to flush all data to the underlying medium (cache, async vs. sync).
3024 *
3025 * @returns VBox status code.
3026 * @param pThis VBox disk container instance data.
3027 * @param pIoReq I/O request to process.
3028 */
3029static int drvvdMediaExIoReqFlushWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3030{
3031 int rc = VINF_SUCCESS;
3032
3033 LogFlowFunc(("pThis=%#p pIoReq=%#p\n", pThis, pIoReq));
3034
3035 if ( pThis->fAsyncIOSupported
3036 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3037 {
3038 if (pThis->pBlkCache)
3039 {
3040 rc = PDMR3BlkCacheFlush(pThis->pBlkCache, pIoReq);
3041 if (rc == VINF_SUCCESS)
3042 rc = VINF_VD_ASYNC_IO_FINISHED;
3043 else if (rc == VINF_AIO_TASK_PENDING)
3044 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3045 }
3046 else
3047 rc = VDAsyncFlush(pThis->pDisk, drvvdMediaExIoReqComplete, pThis, pIoReq);
3048 }
3049 else
3050 {
3051 rc = VDFlush(pThis->pDisk);
3052 if (RT_SUCCESS(rc))
3053 rc = VINF_VD_ASYNC_IO_FINISHED;
3054 }
3055
3056 LogFlowFunc(("returns %Rrc\n", rc));
3057 return rc;
3058}
3059
3060/**
3061 * Wrapper around the various ways to discard data blocks on the underlying medium (cache, async vs. sync).
3062 *
3063 * @returns VBox status code.
3064 * @param pThis VBox disk container instance data.
3065 * @param pIoReq I/O request to process.
3066 */
3067static int drvvdMediaExIoReqDiscardWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3068{
3069 int rc = VINF_SUCCESS;
3070
3071 LogFlowFunc(("pThis=%#p pIoReq=%#p\n", pThis, pIoReq));
3072
3073 if ( pThis->fAsyncIOSupported
3074 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3075 {
3076 if (pThis->pBlkCache)
3077 {
3078 rc = PDMR3BlkCacheDiscard(pThis->pBlkCache, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges, pIoReq);
3079 if (rc == VINF_SUCCESS)
3080 rc = VINF_VD_ASYNC_IO_FINISHED;
3081 else if (rc == VINF_AIO_TASK_PENDING)
3082 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3083 }
3084 else
3085 rc = VDAsyncDiscardRanges(pThis->pDisk, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges,
3086 drvvdMediaExIoReqComplete, pThis, pIoReq);
3087 }
3088 else
3089 {
3090 rc = VDDiscardRanges(pThis->pDisk, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges);
3091 if (RT_SUCCESS(rc))
3092 rc = VINF_VD_ASYNC_IO_FINISHED;
3093 }
3094
3095 LogFlowFunc(("returns %Rrc\n", rc));
3096 return rc;
3097}
3098
3099/**
3100 * Processes a read/write request.
3101 *
3102 * @returns VBox status code.
3103 * @param pThis VBox disk container instance data.
3104 * @param pIoReq I/O request to process.
3105 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
3106 */
3107static int drvvdMediaExIoReqReadWriteProcess(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fUpNotify)
3108{
3109 int rc = VINF_SUCCESS;
3110
3111 LogFlowFunc(("pThis=%#p pIoReq=%#p fUpNotify=%RTbool\n", pThis, pIoReq, fUpNotify));
3112
3113 Assert(pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE);
3114
3115 rc = drvvdKeyCheckPrereqs(pThis, false /* fSetError */);
3116
3117 while ( pIoReq->ReadWrite.cbReqLeft
3118 && rc == VINF_SUCCESS)
3119 {
3120 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
3121
3122 size_t cbReqIo = RT_MIN(pIoReq->ReadWrite.cbReqLeft, pIoReq->ReadWrite.cbIoBuf);
3123
3124 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
3125 rc = drvvdMediaExIoReqReadWrapper(pThis, pIoReq, cbReqIo, &cbReqIo);
3126 else
3127 {
3128 /* Sync memory buffer from the request initiator. */
3129 rc = drvvdMediaExIoReqBufSync(pThis, pIoReq, true /* fToIoBuf */);
3130 if (RT_SUCCESS(rc))
3131 rc = drvvdMediaExIoReqWriteWrapper(pThis, pIoReq, cbReqIo, &cbReqIo);
3132 }
3133
3134 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3135 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3136 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
3137 {
3138 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
3139 rc = drvvdMediaExIoReqBufSync(pThis, pIoReq, false /* fToIoBuf */);
3140 else
3141 rc = VINF_SUCCESS;
3142 pIoReq->ReadWrite.offStart += cbReqIo;
3143 pIoReq->ReadWrite.cbReqLeft -= cbReqIo;
3144 }
3145 }
3146
3147 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
3148 {
3149 Assert(!pIoReq->ReadWrite.cbReqLeft || RT_FAILURE(rc));
3150 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, fUpNotify);
3151 }
3152
3153 LogFlowFunc(("returns %Rrc\n", rc));
3154 return rc;
3155}
3156
3157
3158/**
3159 * Frees a I/O memory buffer allocated previously.
3160 *
3161 * @returns nothing.
3162 * @param pThis VBox disk container instance data.
3163 * @param pIoReq I/O request for which to free memory.
3164 */
3165DECLINLINE(void) drvvdMediaExIoReqBufFree(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3166{
3167 LogFlowFunc(("pThis=%#p pIoReq=%#p{.cbIoBuf=%zu}\n", pThis, pIoReq, pIoReq->ReadWrite.cbIoBuf));
3168
3169 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3170 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3171 {
3172 IOBUFMgrFreeBuf(&pIoReq->ReadWrite.IoBuf);
3173
3174 uint32_t cIoReqsWaiting = ASMAtomicXchgU32(&pThis->cIoReqsWaiting, 0);
3175 if (cIoReqsWaiting > 0)
3176 {
3177 /* Try to process as many requests as possible. */
3178 RTCritSectEnter(&pThis->CritSectIoReqsIoBufWait);
3179 PPDMMEDIAEXIOREQINT pIoReqCur, pIoReqNext;
3180
3181 RTListForEachSafe(&pThis->LstIoReqIoBufWait, pIoReqCur, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
3182 {
3183 LogFlowFunc(("Found I/O request %#p on waiting list, trying to allocate buffer of size %zu bytes\n",
3184 pIoReqCur, pIoReqCur->ReadWrite.cbReq));
3185
3186 /* Allocate a suitable I/O buffer for this request. */
3187 int rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReqCur->ReadWrite.IoBuf, pIoReqCur->ReadWrite.cbReq,
3188 &pIoReqCur->ReadWrite.cbIoBuf);
3189 if (rc == VINF_SUCCESS)
3190 {
3191 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
3192
3193 cIoReqsWaiting--;
3194 RTListNodeRemove(&pIoReqCur->NdLstWait);
3195
3196 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReqCur->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3197 if (RT_UNLIKELY(!fXchg))
3198 {
3199 /* Must have been canceled inbetween. */
3200 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3201 drvvdMediaExIoReqCompleteWorker(pThis, pIoReqCur, VERR_PDM_MEDIAEX_IOREQ_CANCELED, true /* fUpNotify */);
3202 }
3203 ASMAtomicIncU32(&pThis->cIoReqsActive);
3204 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReqCur, true /* fUpNotify */);
3205 }
3206 else
3207 {
3208 Assert(rc == VERR_NO_MEMORY);
3209 break;
3210 }
3211 }
3212 RTCritSectLeave(&pThis->CritSectIoReqsIoBufWait);
3213
3214 ASMAtomicAddU32(&pThis->cIoReqsWaiting, cIoReqsWaiting);
3215 }
3216 }
3217
3218 LogFlowFunc(("returns\n"));
3219}
3220
3221
3222/**
3223 * Returns whether the VM is in a running state.
3224 *
3225 * @returns Flag indicating whether the VM is currently in a running state.
3226 * @param pThis VBox disk container instance data.
3227 */
3228DECLINLINE(bool) drvvdMediaExIoReqIsVmRunning(PVBOXDISK pThis)
3229{
3230 VMSTATE enmVmState = PDMDrvHlpVMState(pThis->pDrvIns);
3231 if ( enmVmState == VMSTATE_RESUMING
3232 || enmVmState == VMSTATE_RUNNING
3233 || enmVmState == VMSTATE_RUNNING_LS
3234 || enmVmState == VMSTATE_RUNNING_FT
3235 || enmVmState == VMSTATE_RESETTING
3236 || enmVmState == VMSTATE_RESETTING_LS
3237 || enmVmState == VMSTATE_SOFT_RESETTING
3238 || enmVmState == VMSTATE_SOFT_RESETTING_LS
3239 || enmVmState == VMSTATE_SUSPENDING
3240 || enmVmState == VMSTATE_SUSPENDING_LS
3241 || enmVmState == VMSTATE_SUSPENDING_EXT_LS)
3242 return true;
3243
3244 return false;
3245}
3246
3247/**
3248 * @copydoc FNVDASYNCTRANSFERCOMPLETE
3249 */
3250static DECLCALLBACK(void) drvvdMediaExIoReqComplete(void *pvUser1, void *pvUser2, int rcReq)
3251{
3252 PVBOXDISK pThis = (PVBOXDISK)pvUser1;
3253 PPDMMEDIAEXIOREQINT pIoReq = (PPDMMEDIAEXIOREQINT)pvUser2;
3254
3255 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rcReq, true /* fUpNotify */);
3256}
3257
3258/**
3259 * Tries to cancel the given I/O request returning the result.
3260 *
3261 * @returns Flag whether the request was successfully canceled or whether it
3262 * already complete inbetween.
3263 * @param pThis VBox disk container instance data.
3264 * @param pIoReq The I/O request to cancel.
3265 */
3266static bool drvvdMediaExIoReqCancel(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3267{
3268 bool fXchg = true;
3269 VDIOREQSTATE enmStateOld = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3270
3271 /*
3272 * We might have to try canceling the request multiple times if it transitioned from
3273 * ALLOCATED to ACTIVE or to SUSPENDED between reading the state and trying to change it.
3274 */
3275 while ( ( enmStateOld == VDIOREQSTATE_ALLOCATED
3276 || enmStateOld == VDIOREQSTATE_ACTIVE
3277 || enmStateOld == VDIOREQSTATE_SUSPENDED)
3278 && !fXchg)
3279 {
3280 fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_CANCELED, enmStateOld);
3281 if (!fXchg)
3282 enmStateOld = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3283 }
3284
3285 if (fXchg)
3286 ASMAtomicDecU32(&pThis->cIoReqsActive);
3287
3288 return fXchg;
3289}
3290
3291/**
3292 * @interface_method_impl{PDMIMEDIAEX,pfnQueryFeatures}
3293 */
3294static DECLCALLBACK(int) drvvdQueryFeatures(PPDMIMEDIAEX pInterface, uint32_t *pfFeatures)
3295{
3296 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3297
3298 AssertPtrReturn(pfFeatures, VERR_INVALID_POINTER);
3299
3300 uint32_t fFeatures = 0;
3301 if (pThis->fAsyncIOSupported)
3302 fFeatures |= PDMIMEDIAEX_FEATURE_F_ASYNC;
3303 if (pThis->IMedia.pfnDiscard)
3304 fFeatures |= PDMIMEDIAEX_FEATURE_F_DISCARD;
3305
3306 *pfFeatures = fFeatures;
3307
3308 return VINF_SUCCESS;
3309}
3310
3311
3312/**
3313 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqAllocSizeSet}
3314 */
3315static DECLCALLBACK(int) drvvdIoReqAllocSizeSet(PPDMIMEDIAEX pInterface, size_t cbIoReqAlloc)
3316{
3317 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3318 if (RT_UNLIKELY(pThis->hIoReqCache != NIL_RTMEMCACHE))
3319 return VERR_INVALID_STATE;
3320
3321 return RTMemCacheCreate(&pThis->hIoReqCache, sizeof(PDMMEDIAEXIOREQINT) + cbIoReqAlloc, 0, UINT32_MAX,
3322 NULL, NULL, NULL, 0);
3323}
3324
3325/**
3326 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqAlloc}
3327 */
3328static DECLCALLBACK(int) drvvdIoReqAlloc(PPDMIMEDIAEX pInterface, PPDMMEDIAEXIOREQ phIoReq, void **ppvIoReqAlloc,
3329 PDMMEDIAEXIOREQID uIoReqId, uint32_t fFlags)
3330{
3331 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3332
3333 AssertReturn(!(fFlags & ~PDMIMEDIAEX_F_VALID), VERR_INVALID_PARAMETER);
3334
3335 PPDMMEDIAEXIOREQINT pIoReq = (PPDMMEDIAEXIOREQINT)RTMemCacheAlloc(pThis->hIoReqCache);
3336
3337 if (RT_UNLIKELY(!pIoReq))
3338 return VERR_NO_MEMORY;
3339
3340 pIoReq->uIoReqId = uIoReqId;
3341 pIoReq->fFlags = fFlags;
3342 pIoReq->pDisk = pThis;
3343 pIoReq->enmState = VDIOREQSTATE_ALLOCATED;
3344 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_INVALID;
3345
3346 int rc = drvvdMediaExIoReqInsert(pThis, pIoReq);
3347 if (RT_SUCCESS(rc))
3348 {
3349 *phIoReq = pIoReq;
3350 *ppvIoReqAlloc = &pIoReq->abAlloc[0];
3351 }
3352 else
3353 RTMemCacheFree(pThis->hIoReqCache, pIoReq);
3354
3355 return rc;
3356}
3357
3358/**
3359 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqFree}
3360 */
3361static DECLCALLBACK(int) drvvdIoReqFree(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq)
3362{
3363 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3364 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3365
3366 if ( pIoReq->enmState != VDIOREQSTATE_COMPLETED
3367 && pIoReq->enmState != VDIOREQSTATE_ALLOCATED)
3368 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3369
3370 /* Remove from allocated list. */
3371 int rc = drvvdMediaExIoReqRemove(pThis, pIoReq);
3372 if (RT_FAILURE(rc))
3373 return rc;
3374
3375 /* Free any associated I/O memory. */
3376 drvvdMediaExIoReqBufFree(pThis, pIoReq);
3377
3378 /* For discard request discard the range array. */
3379 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD
3380 && pIoReq->Discard.paRanges)
3381 {
3382 RTMemFree(pIoReq->Discard.paRanges);
3383 pIoReq->Discard.paRanges = NULL;
3384 }
3385
3386 pIoReq->enmState = VDIOREQSTATE_FREE;
3387 RTMemCacheFree(pThis->hIoReqCache, pIoReq);
3388 return VINF_SUCCESS;
3389}
3390
3391/**
3392 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQueryResidual}
3393 */
3394static DECLCALLBACK(int) drvvdIoReqQueryResidual(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, size_t *pcbResidual)
3395{
3396 RT_NOREF1(pInterface);
3397
3398 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3399
3400 if (pIoReq->enmState != VDIOREQSTATE_COMPLETED)
3401 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3402
3403 if ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ
3404 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE
3405 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_FLUSH)
3406 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3407
3408 *pcbResidual = 0; /* No data left to transfer always. */
3409 return VINF_SUCCESS;
3410}
3411
3412/**
3413 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQueryXferSize}
3414 */
3415static DECLCALLBACK(int) drvvdIoReqQueryXferSize(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, size_t *pcbXfer)
3416{
3417 int rc = VINF_SUCCESS;
3418 RT_NOREF1(pInterface);
3419
3420 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3421
3422 if (pIoReq->enmState != VDIOREQSTATE_COMPLETED)
3423 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3424
3425 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3426 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3427 *pcbXfer = pIoReq->ReadWrite.cbReq;
3428 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
3429 *pcbXfer = 0;
3430 else
3431 rc = VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3432
3433 return rc;
3434}
3435
3436/**
3437 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqCancelAll}
3438 */
3439static DECLCALLBACK(int) drvvdIoReqCancelAll(PPDMIMEDIAEX pInterface)
3440{
3441 int rc = VINF_SUCCESS;
3442 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3443
3444 for (unsigned idxBin = 0; idxBin < RT_ELEMENTS(pThis->aIoReqAllocBins); idxBin++)
3445 {
3446 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3447 if (RT_SUCCESS(rc))
3448 {
3449 /* Search for I/O request with ID. */
3450 PPDMMEDIAEXIOREQINT pIt;
3451
3452 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
3453 {
3454 drvvdMediaExIoReqCancel(pThis, pIt);
3455 }
3456 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3457 }
3458 }
3459
3460 return rc;
3461}
3462
3463/**
3464 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqCancel}
3465 */
3466static DECLCALLBACK(int) drvvdIoReqCancel(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQID uIoReqId)
3467{
3468 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3469 unsigned idxBin = drvvdMediaExIoReqIdHash(uIoReqId);
3470
3471 int rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3472 if (RT_SUCCESS(rc))
3473 {
3474 /* Search for I/O request with ID. */
3475 PPDMMEDIAEXIOREQINT pIt;
3476 rc = VERR_PDM_MEDIAEX_IOREQID_NOT_FOUND;
3477
3478 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
3479 {
3480 if (pIt->uIoReqId == uIoReqId)
3481 {
3482 if (drvvdMediaExIoReqCancel(pThis, pIt))
3483 rc = VINF_SUCCESS;
3484
3485 break;
3486 }
3487 }
3488 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3489 }
3490
3491 return rc;
3492}
3493
3494/**
3495 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqRead}
3496 */
3497static DECLCALLBACK(int) drvvdIoReqRead(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint64_t off, size_t cbRead)
3498{
3499 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3500 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3501 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3502
3503 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3504 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3505
3506 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3507 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3508
3509 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_READ;
3510 pIoReq->tsSubmit = RTTimeMilliTS();
3511 pIoReq->ReadWrite.offStart = off;
3512 pIoReq->ReadWrite.cbReq = cbRead;
3513 pIoReq->ReadWrite.cbReqLeft = cbRead;
3514 /* Allocate a suitable I/O buffer for this request. */
3515 int rc = drvvdMediaExIoReqBufAlloc(pThis, pIoReq, cbRead);
3516 if (rc == VINF_SUCCESS)
3517 {
3518 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3519 if (RT_UNLIKELY(!fXchg))
3520 {
3521 /* Must have been canceled inbetween. */
3522 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3523 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3524 }
3525 ASMAtomicIncU32(&pThis->cIoReqsActive);
3526
3527 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, false /* fUpNotify */);
3528 }
3529
3530 return rc;
3531}
3532
3533/**
3534 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqWrite}
3535 */
3536static DECLCALLBACK(int) drvvdIoReqWrite(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint64_t off, size_t cbWrite)
3537{
3538 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3539 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3540 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3541
3542 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3543 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3544
3545 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3546 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3547
3548 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_WRITE;
3549 pIoReq->tsSubmit = RTTimeMilliTS();
3550 pIoReq->ReadWrite.offStart = off;
3551 pIoReq->ReadWrite.cbReq = cbWrite;
3552 pIoReq->ReadWrite.cbReqLeft = cbWrite;
3553 /* Allocate a suitable I/O buffer for this request. */
3554 int rc = drvvdMediaExIoReqBufAlloc(pThis, pIoReq, cbWrite);
3555 if (rc == VINF_SUCCESS)
3556 {
3557 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3558 if (RT_UNLIKELY(!fXchg))
3559 {
3560 /* Must have been canceled inbetween. */
3561 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3562 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3563 }
3564 ASMAtomicIncU32(&pThis->cIoReqsActive);
3565
3566 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, false /* fUpNotify */);
3567 }
3568
3569 return rc;
3570}
3571
3572/**
3573 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqFlush}
3574 */
3575static DECLCALLBACK(int) drvvdIoReqFlush(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq)
3576{
3577 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3578 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3579 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3580
3581 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3582 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3583
3584 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3585 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3586
3587 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_FLUSH;
3588 pIoReq->tsSubmit = RTTimeMilliTS();
3589 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3590 if (RT_UNLIKELY(!fXchg))
3591 {
3592 /* Must have been canceled inbetween. */
3593 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3594 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3595 }
3596
3597 ASMAtomicIncU32(&pThis->cIoReqsActive);
3598 int rc = drvvdMediaExIoReqFlushWrapper(pThis, pIoReq);
3599 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3600 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3601 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
3602 rc = VINF_SUCCESS;
3603
3604 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
3605 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, false /* fUpNotify */);
3606
3607 return rc;
3608}
3609
3610/**
3611 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqDiscard}
3612 */
3613static DECLCALLBACK(int) drvvdIoReqDiscard(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, unsigned cRangesMax)
3614{
3615 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3616 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3617 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3618
3619 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3620 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3621
3622 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3623 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3624
3625 /* Copy the ranges over now, this can be optimized in the future. */
3626 pIoReq->Discard.paRanges = (PRTRANGE)RTMemAllocZ(cRangesMax * sizeof(RTRANGE));
3627 if (RT_UNLIKELY(!pIoReq->Discard.paRanges))
3628 return VERR_NO_MEMORY;
3629
3630 int rc = pThis->pDrvMediaExPort->pfnIoReqQueryDiscardRanges(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
3631 0, cRangesMax, pIoReq->Discard.paRanges,
3632 &pIoReq->Discard.cRanges);
3633 if (RT_SUCCESS(rc))
3634 {
3635 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_DISCARD;
3636 pIoReq->tsSubmit = RTTimeMilliTS();
3637 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3638 if (RT_UNLIKELY(!fXchg))
3639 {
3640 /* Must have been canceled inbetween. */
3641 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3642 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3643 }
3644
3645 ASMAtomicIncU32(&pThis->cIoReqsActive);
3646 rc = drvvdMediaExIoReqDiscardWrapper(pThis, pIoReq);
3647 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3648 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3649 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
3650 rc = VINF_SUCCESS;
3651
3652 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
3653 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, false /* fUpNotify */);
3654 }
3655
3656 return rc;
3657}
3658
3659/**
3660 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSendScsiCmd}
3661 */
3662static DECLCALLBACK(int) drvvdIoReqSendScsiCmd(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint32_t uLun,
3663 const uint8_t *pbCdb, size_t cbCdb, PDMMEDIAEXIOREQSCSITXDIR enmTxDir,
3664 size_t cbBuf, uint8_t *pabSense, size_t cbSense, uint8_t *pu8ScsiSts,
3665 uint32_t cTimeoutMillies)
3666{
3667 RT_NOREF10(pInterface, uLun, pbCdb, cbCdb, enmTxDir, cbBuf, pabSense, cbSense, pu8ScsiSts, cTimeoutMillies);
3668 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3669 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3670
3671 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3672 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3673
3674 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3675 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3676
3677 return VERR_NOT_SUPPORTED;
3678}
3679
3680/**
3681 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqGetActiveCount}
3682 */
3683static DECLCALLBACK(uint32_t) drvvdIoReqGetActiveCount(PPDMIMEDIAEX pInterface)
3684{
3685 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3686 return ASMAtomicReadU32(&pThis->cIoReqsActive);
3687}
3688
3689/**
3690 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqGetSuspendedCount}
3691 */
3692static DECLCALLBACK(uint32_t) drvvdIoReqGetSuspendedCount(PPDMIMEDIAEX pInterface)
3693{
3694 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3695
3696 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), 0);
3697
3698 uint32_t cIoReqSuspended = 0;
3699 PPDMMEDIAEXIOREQINT pIoReq;
3700 RTCritSectEnter(&pThis->CritSectIoReqRedo);
3701 RTListForEach(&pThis->LstIoReqRedo, pIoReq, PDMMEDIAEXIOREQINT, NdLstWait)
3702 {
3703 cIoReqSuspended++;
3704 }
3705 RTCritSectLeave(&pThis->CritSectIoReqRedo);
3706
3707 return cIoReqSuspended;
3708}
3709
3710/**
3711 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQuerySuspendedStart}
3712 */
3713static DECLCALLBACK(int) drvvdIoReqQuerySuspendedStart(PPDMIMEDIAEX pInterface, PPDMMEDIAEXIOREQ phIoReq,
3714 void **ppvIoReqAlloc)
3715{
3716 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3717
3718 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
3719 AssertReturn(!RTListIsEmpty(&pThis->LstIoReqRedo), VERR_NOT_FOUND);
3720
3721 RTCritSectEnter(&pThis->CritSectIoReqRedo);
3722 PPDMMEDIAEXIOREQINT pIoReq = RTListGetFirst(&pThis->LstIoReqRedo, PDMMEDIAEXIOREQINT, NdLstWait);
3723 *phIoReq = pIoReq;
3724 *ppvIoReqAlloc = &pIoReq->abAlloc[0];
3725 RTCritSectLeave(&pThis->CritSectIoReqRedo);
3726
3727 return VINF_SUCCESS;
3728}
3729
3730/**
3731 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQuerySuspendedNext}
3732 */
3733static DECLCALLBACK(int) drvvdIoReqQuerySuspendedNext(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq,
3734 PPDMMEDIAEXIOREQ phIoReqNext, void **ppvIoReqAllocNext)
3735{
3736 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3737 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3738
3739 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
3740 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
3741 AssertReturn(!RTListNodeIsLast(&pThis->LstIoReqRedo, &pIoReq->NdLstWait), VERR_NOT_FOUND);
3742
3743 RTCritSectEnter(&pThis->CritSectIoReqRedo);
3744 PPDMMEDIAEXIOREQINT pIoReqNext = RTListNodeGetNext(&pIoReq->NdLstWait, PDMMEDIAEXIOREQINT, NdLstWait);
3745 *phIoReqNext = pIoReqNext;
3746 *ppvIoReqAllocNext = &pIoReqNext->abAlloc[0];
3747 RTCritSectLeave(&pThis->CritSectIoReqRedo);
3748
3749 return VINF_SUCCESS;
3750}
3751
3752/**
3753 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSuspendedSave}
3754 */
3755static DECLCALLBACK(int) drvvdIoReqSuspendedSave(PPDMIMEDIAEX pInterface, PSSMHANDLE pSSM, PDMMEDIAEXIOREQ hIoReq)
3756{
3757 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3758 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3759
3760 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
3761 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
3762 AssertReturn(pIoReq->enmState == VDIOREQSTATE_SUSPENDED, VERR_INVALID_STATE);
3763
3764 SSMR3PutU32(pSSM, DRVVD_IOREQ_SAVED_STATE_VERSION);
3765 SSMR3PutU32(pSSM, (uint32_t)pIoReq->enmType);
3766 SSMR3PutU32(pSSM, pIoReq->uIoReqId);
3767 SSMR3PutU32(pSSM, pIoReq->fFlags);
3768 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3769 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3770 {
3771 SSMR3PutU64(pSSM, pIoReq->ReadWrite.offStart);
3772 SSMR3PutU64(pSSM, pIoReq->ReadWrite.cbReq);
3773 SSMR3PutU64(pSSM, pIoReq->ReadWrite.cbReqLeft);
3774 }
3775 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
3776 {
3777 SSMR3PutU32(pSSM, pIoReq->Discard.cRanges);
3778 for (unsigned i = 0; i < pIoReq->Discard.cRanges; i++)
3779 {
3780 SSMR3PutU64(pSSM, pIoReq->Discard.paRanges[i].offStart);
3781 SSMR3PutU64(pSSM, pIoReq->Discard.paRanges[i].cbRange);
3782 }
3783 }
3784
3785 return SSMR3PutU32(pSSM, UINT32_MAX); /* sanity/terminator */
3786}
3787
3788/**
3789 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSuspendedLoad}
3790 */
3791static DECLCALLBACK(int) drvvdIoReqSuspendedLoad(PPDMIMEDIAEX pInterface, PSSMHANDLE pSSM, PDMMEDIAEXIOREQ hIoReq)
3792{
3793 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3794 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3795
3796 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
3797 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
3798 AssertReturn(pIoReq->enmState == VDIOREQSTATE_ALLOCATED, VERR_INVALID_STATE);
3799
3800 uint32_t u32;
3801 uint64_t u64;
3802 int rc = VINF_SUCCESS;
3803 bool fPlaceOnRedoList = true;
3804
3805 SSMR3GetU32(pSSM, &u32);
3806 if (u32 <= DRVVD_IOREQ_SAVED_STATE_VERSION)
3807 {
3808 SSMR3GetU32(pSSM, &u32);
3809 AssertReturn( u32 == PDMMEDIAEXIOREQTYPE_WRITE
3810 || u32 == PDMMEDIAEXIOREQTYPE_READ
3811 || u32 == PDMMEDIAEXIOREQTYPE_DISCARD
3812 || u32 == PDMMEDIAEXIOREQTYPE_FLUSH,
3813 VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
3814 pIoReq->enmType = (PDMMEDIAEXIOREQTYPE)u32;
3815
3816 SSMR3GetU32(pSSM, &u32);
3817 AssertReturn(u32 == pIoReq->uIoReqId, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
3818
3819 SSMR3GetU32(pSSM, &u32);
3820 AssertReturn(u32 == pIoReq->fFlags, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
3821
3822 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3823 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3824 {
3825 SSMR3GetU64(pSSM, &pIoReq->ReadWrite.offStart);
3826 SSMR3GetU64(pSSM, &u64);
3827 pIoReq->ReadWrite.cbReq = (size_t)u64;
3828 SSMR3GetU64(pSSM, &u64);
3829 pIoReq->ReadWrite.cbReqLeft = (size_t)u64;
3830
3831 /*
3832 * Try to allocate enough I/O buffer, if this fails for some reason put it onto the
3833 * waitign list instead of the redo list.
3834 */
3835 pIoReq->ReadWrite.cbIoBuf = 0;
3836 rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReq->ReadWrite.IoBuf, pIoReq->ReadWrite.cbReqLeft,
3837 &pIoReq->ReadWrite.cbIoBuf);
3838 if (rc == VERR_NO_MEMORY)
3839 {
3840 pIoReq->enmState = VDIOREQSTATE_ALLOCATED;
3841 ASMAtomicIncU32(&pThis->cIoReqsWaiting);
3842 RTListAppend(&pThis->LstIoReqIoBufWait, &pIoReq->NdLstWait);
3843 fPlaceOnRedoList = false;
3844 rc = VINF_SUCCESS;
3845 }
3846 }
3847 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
3848 {
3849 rc = SSMR3GetU32(pSSM, &pIoReq->Discard.cRanges);
3850 if (RT_SUCCESS(rc))
3851 {
3852 pIoReq->Discard.paRanges = (PRTRANGE)RTMemAllocZ(pIoReq->Discard.cRanges * sizeof(RTRANGE));
3853 if (RT_LIKELY(pIoReq->Discard.paRanges))
3854 {
3855 for (unsigned i = 0; i < pIoReq->Discard.cRanges; i++)
3856 {
3857 SSMR3GetU64(pSSM, &pIoReq->Discard.paRanges[i].offStart);
3858 SSMR3GetU64(pSSM, &u64);
3859 pIoReq->Discard.paRanges[i].cbRange = (size_t)u64;
3860 }
3861 }
3862 else
3863 rc = VERR_NO_MEMORY;
3864 }
3865 }
3866
3867 if (RT_SUCCESS(rc))
3868 rc = SSMR3GetU32(pSSM, &u32); /* sanity/terminator */
3869 if (RT_SUCCESS(rc))
3870 AssertReturn(u32 == UINT32_MAX, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
3871 if ( RT_SUCCESS(rc)
3872 && fPlaceOnRedoList)
3873 {
3874 /* Mark as suspended */
3875 pIoReq->enmState = VDIOREQSTATE_SUSPENDED;
3876
3877 /* Link into suspended list so it gets kicked off again when we resume. */
3878 RTCritSectEnter(&pThis->CritSectIoReqRedo);
3879 RTListAppend(&pThis->LstIoReqRedo, &pIoReq->NdLstWait);
3880 RTCritSectLeave(&pThis->CritSectIoReqRedo);
3881 }
3882 }
3883
3884 return rc;
3885}
3886
3887/**
3888 * Loads all configured plugins.
3889 *
3890 * @returns VBox status code.
3891 * @param pCfg CFGM node holding plugin list.
3892 */
3893static int drvvdLoadPlugins(PCFGMNODE pCfg)
3894{
3895 PCFGMNODE pCfgPlugins = CFGMR3GetChild(pCfg, "Plugins");
3896
3897 if (pCfgPlugins)
3898 {
3899 PCFGMNODE pPluginCur = CFGMR3GetFirstChild(pCfgPlugins);
3900 while (pPluginCur)
3901 {
3902 int rc = VINF_SUCCESS;
3903 char *pszPluginFilename = NULL;
3904 rc = CFGMR3QueryStringAlloc(pPluginCur, "Path", &pszPluginFilename);
3905 if (RT_SUCCESS(rc))
3906 rc = VDPluginLoadFromFilename(pszPluginFilename);
3907
3908 if (RT_FAILURE(rc))
3909 LogRel(("VD: Failed to load plugin '%s' with %Rrc, continuing\n", pszPluginFilename, rc));
3910
3911 pPluginCur = CFGMR3GetNextChild(pPluginCur);
3912 }
3913 }
3914
3915 return VINF_SUCCESS;
3916}
3917
3918
3919/**
3920 * Sets up the disk filter chain.
3921 *
3922 * @returns VBox status code.
3923 * @param pThis The disk instance.
3924 * @param pCfg CFGM node holding the filter parameters.
3925 */
3926static int drvvdSetupFilters(PVBOXDISK pThis, PCFGMNODE pCfg)
3927{
3928 int rc = VINF_SUCCESS;
3929 PCFGMNODE pCfgFilter = CFGMR3GetChild(pCfg, "Filters");
3930
3931 if (pCfgFilter)
3932 {
3933 PCFGMNODE pCfgFilterConfig = CFGMR3GetChild(pCfgFilter, "VDConfig");
3934 char *pszFilterName = NULL;
3935 VDINTERFACECONFIG VDIfConfig;
3936 PVDINTERFACE pVDIfsFilter = NULL;
3937
3938 rc = CFGMR3QueryStringAlloc(pCfgFilter, "FilterName", &pszFilterName);
3939 if (RT_SUCCESS(rc))
3940 {
3941 VDIfConfig.pfnAreKeysValid = drvvdCfgAreKeysValid;
3942 VDIfConfig.pfnQuerySize = drvvdCfgQuerySize;
3943 VDIfConfig.pfnQuery = drvvdCfgQuery;
3944 VDIfConfig.pfnQueryBytes = drvvdCfgQueryBytes;
3945 rc = VDInterfaceAdd(&VDIfConfig.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
3946 pCfgFilterConfig, sizeof(VDINTERFACECONFIG), &pVDIfsFilter);
3947 AssertRC(rc);
3948
3949 rc = VDFilterAdd(pThis->pDisk, pszFilterName, VD_FILTER_FLAGS_DEFAULT, pVDIfsFilter);
3950
3951 MMR3HeapFree(pszFilterName);
3952 }
3953 }
3954
3955 return rc;
3956}
3957
3958
3959/**
3960 * Translates a PDMMEDIATYPE value into a string.
3961 *
3962 * @returns Read only string.
3963 * @param enmType The type value.
3964 */
3965static const char *drvvdGetTypeName(PDMMEDIATYPE enmType)
3966{
3967 switch (enmType)
3968 {
3969 case PDMMEDIATYPE_ERROR: return "ERROR";
3970 case PDMMEDIATYPE_FLOPPY_360: return "FLOPPY_360";
3971 case PDMMEDIATYPE_FLOPPY_720: return "FLOPPY_720";
3972 case PDMMEDIATYPE_FLOPPY_1_20: return "FLOPPY_1_20";
3973 case PDMMEDIATYPE_FLOPPY_1_44: return "FLOPPY_1_44";
3974 case PDMMEDIATYPE_FLOPPY_2_88: return "FLOPPY_2_88";
3975 case PDMMEDIATYPE_FLOPPY_FAKE_15_6: return "FLOPPY_FAKE_15_6";
3976 case PDMMEDIATYPE_FLOPPY_FAKE_63_5: return "FLOPPY_FAKE_63_5";
3977 case PDMMEDIATYPE_CDROM: return "CDROM";
3978 case PDMMEDIATYPE_DVD: return "DVD";
3979 case PDMMEDIATYPE_HARD_DISK: return "HARD_DISK";
3980 default: return "Unknown";
3981 }
3982}
3983
3984/**
3985 * Returns the appropriate PDMMEDIATYPE for t he given string.
3986 *
3987 * @returns PDMMEDIATYPE
3988 * @param pszType The string representation of the media type.
3989 */
3990static PDMMEDIATYPE drvvdGetMediaTypeFromString(const char *pszType)
3991{
3992 PDMMEDIATYPE enmType = PDMMEDIATYPE_ERROR;
3993
3994 if (!strcmp(pszType, "HardDisk"))
3995 enmType = PDMMEDIATYPE_HARD_DISK;
3996 else if (!strcmp(pszType, "DVD"))
3997 enmType = PDMMEDIATYPE_DVD;
3998 else if (!strcmp(pszType, "CDROM"))
3999 enmType = PDMMEDIATYPE_CDROM;
4000 else if (!strcmp(pszType, "Floppy 2.88"))
4001 enmType = PDMMEDIATYPE_FLOPPY_2_88;
4002 else if (!strcmp(pszType, "Floppy 1.44"))
4003 enmType = PDMMEDIATYPE_FLOPPY_1_44;
4004 else if (!strcmp(pszType, "Floppy 1.20"))
4005 enmType = PDMMEDIATYPE_FLOPPY_1_20;
4006 else if (!strcmp(pszType, "Floppy 720"))
4007 enmType = PDMMEDIATYPE_FLOPPY_720;
4008 else if (!strcmp(pszType, "Floppy 360"))
4009 enmType = PDMMEDIATYPE_FLOPPY_360;
4010 else if (!strcmp(pszType, "Floppy 15.6"))
4011 enmType = PDMMEDIATYPE_FLOPPY_FAKE_15_6;
4012 else if (!strcmp(pszType, "Floppy 63.5"))
4013 enmType = PDMMEDIATYPE_FLOPPY_FAKE_63_5;
4014
4015 return enmType;
4016}
4017
4018/**
4019 * Converts PDMMEDIATYPE to the appropriate VDTYPE.
4020 *
4021 * @returns The VDTYPE.
4022 * @param enmType The PDMMEDIATYPE to convert from.
4023 */
4024static VDTYPE drvvdGetVDFromMediaType(PDMMEDIATYPE enmType)
4025{
4026 if (PDMMEDIATYPE_IS_FLOPPY(enmType))
4027 return VDTYPE_FLOPPY;
4028 else if (enmType == PDMMEDIATYPE_DVD || enmType == PDMMEDIATYPE_CDROM)
4029 return VDTYPE_DVD;
4030 else if (enmType == PDMMEDIATYPE_HARD_DISK)
4031 return VDTYPE_HDD;
4032
4033 AssertMsgFailed(("Invalid media type %d{%s} given!\n", enmType, drvvdGetTypeName(enmType)));
4034 return VDTYPE_HDD;
4035}
4036
4037
4038/*********************************************************************************************************************************
4039* Base interface methods *
4040*********************************************************************************************************************************/
4041
4042/**
4043 * @interface_method_impl{PDMIBASE,pfnQueryInterface}
4044 */
4045static DECLCALLBACK(void *) drvvdQueryInterface(PPDMIBASE pInterface, const char *pszIID)
4046{
4047 PPDMDRVINS pDrvIns = PDMIBASE_2_PDMDRV(pInterface);
4048 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4049
4050 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIBASE, &pDrvIns->IBase);
4051 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMEDIA, &pThis->IMedia);
4052 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMOUNT, pThis->fMountable ? &pThis->IMount : NULL);
4053 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMEDIAEX, pThis->pDrvMediaExPort ? &pThis->IMediaEx : NULL);
4054 return NULL;
4055}
4056
4057
4058/*********************************************************************************************************************************
4059* Saved state notification methods *
4060*********************************************************************************************************************************/
4061
4062/**
4063 * Load done callback for re-opening the image writable during teleportation.
4064 *
4065 * This is called both for successful and failed load runs, we only care about
4066 * successful ones.
4067 *
4068 * @returns VBox status code.
4069 * @param pDrvIns The driver instance.
4070 * @param pSSM The saved state handle.
4071 */
4072static DECLCALLBACK(int) drvvdLoadDone(PPDMDRVINS pDrvIns, PSSMHANDLE pSSM)
4073{
4074 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4075 Assert(!pThis->fErrorUseRuntime);
4076
4077 /* Drop out if we don't have any work to do or if it's a failed load. */
4078 if ( !pThis->fTempReadOnly
4079 || RT_FAILURE(SSMR3HandleGetStatus(pSSM)))
4080 return VINF_SUCCESS;
4081
4082 int rc = drvvdSetWritable(pThis);
4083 if (RT_FAILURE(rc)) /** @todo does the bugger set any errors? */
4084 return SSMR3SetLoadError(pSSM, rc, RT_SRC_POS,
4085 N_("Failed to write lock the images"));
4086 return VINF_SUCCESS;
4087}
4088
4089
4090/*********************************************************************************************************************************
4091* Driver methods *
4092*********************************************************************************************************************************/
4093
4094/**
4095 * Worker for the power off or destruct callback.
4096 *
4097 * @returns nothing.
4098 * @param pDrvIns The driver instance.
4099 */
4100static void drvvdPowerOffOrDestructOrUnmount(PPDMDRVINS pDrvIns)
4101{
4102 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4103 LogFlowFunc(("\n"));
4104
4105 RTSEMFASTMUTEX mutex;
4106 ASMAtomicXchgHandle(&pThis->MergeCompleteMutex, NIL_RTSEMFASTMUTEX, &mutex);
4107 if (mutex != NIL_RTSEMFASTMUTEX)
4108 {
4109 /* Request the semaphore to wait until a potentially running merge
4110 * operation has been finished. */
4111 int rc = RTSemFastMutexRequest(mutex);
4112 AssertRC(rc);
4113 pThis->fMergePending = false;
4114 rc = RTSemFastMutexRelease(mutex);
4115 AssertRC(rc);
4116 rc = RTSemFastMutexDestroy(mutex);
4117 AssertRC(rc);
4118 }
4119
4120 if (RT_VALID_PTR(pThis->pBlkCache))
4121 {
4122 PDMR3BlkCacheRelease(pThis->pBlkCache);
4123 pThis->pBlkCache = NULL;
4124 }
4125
4126 if (RT_VALID_PTR(pThis->pDisk))
4127 {
4128 VDDestroy(pThis->pDisk);
4129 pThis->pDisk = NULL;
4130 }
4131 drvvdFreeImages(pThis);
4132}
4133
4134/**
4135 * @copydoc FNPDMDRVPOWEROFF
4136 */
4137static DECLCALLBACK(void) drvvdPowerOff(PPDMDRVINS pDrvIns)
4138{
4139 PDMDRV_CHECK_VERSIONS_RETURN_VOID(pDrvIns);
4140 drvvdPowerOffOrDestructOrUnmount(pDrvIns);
4141}
4142
4143/**
4144 * @callback_method_impl{FNPDMDRVRESUME}
4145 *
4146 * VM resume notification that we use to undo what the temporary read-only image
4147 * mode set by drvvdSuspend.
4148 *
4149 * Also switch to runtime error mode if we're resuming after a state load
4150 * without having been powered on first.
4151 *
4152 * @todo The VMSetError vs VMSetRuntimeError mess must be fixed elsewhere,
4153 * we're making assumptions about Main behavior here!
4154 */
4155static DECLCALLBACK(void) drvvdResume(PPDMDRVINS pDrvIns)
4156{
4157 LogFlowFunc(("\n"));
4158 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4159
4160 drvvdSetWritable(pThis);
4161 pThis->fErrorUseRuntime = true;
4162
4163 if (pThis->pBlkCache)
4164 {
4165 int rc = PDMR3BlkCacheResume(pThis->pBlkCache);
4166 AssertRC(rc);
4167 }
4168
4169 if (pThis->pDrvMediaExPort)
4170 {
4171 /* Kick of any request we have to redo. */
4172 PPDMMEDIAEXIOREQINT pIoReq, pIoReqNext;
4173 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4174 RTListForEachSafe(&pThis->LstIoReqRedo, pIoReq, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
4175 {
4176 int rc = VINF_SUCCESS;
4177 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_SUSPENDED);
4178
4179 RTListNodeRemove(&pIoReq->NdLstWait);
4180 ASMAtomicIncU32(&pThis->cIoReqsActive);
4181
4182 if (fXchg)
4183 {
4184 pThis->pDrvMediaExPort->pfnIoReqStateChanged(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
4185 PDMMEDIAEXIOREQSTATE_ACTIVE);
4186 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
4187 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
4188 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, true /* fUpNotify */);
4189 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
4190 {
4191 rc = drvvdMediaExIoReqFlushWrapper(pThis, pIoReq);
4192 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4193 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
4194 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
4195 rc = VINF_SUCCESS;
4196 }
4197 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
4198 {
4199 rc = drvvdMediaExIoReqDiscardWrapper(pThis, pIoReq);
4200 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4201 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
4202 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
4203 rc = VINF_SUCCESS;
4204 }
4205 else
4206 AssertMsgFailed(("Invalid request type %u\n", pIoReq->enmType));
4207
4208 /* The read write process will call the completion callback on its own. */
4209 if ( rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS
4210 && ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD
4211 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH))
4212 {
4213 Assert( ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE
4214 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ)
4215 || !pIoReq->ReadWrite.cbReqLeft
4216 || RT_FAILURE(rc));
4217 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, true /* fUpNotify */);
4218 }
4219
4220 }
4221 else
4222 {
4223 /* Request was canceled inbetween, so don't care and notify the owner about the completed request. */
4224 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
4225 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, VERR_PDM_MEDIAEX_IOREQ_CANCELED, true /* fUpNotify */);
4226 }
4227 }
4228 Assert(RTListIsEmpty(&pThis->LstIoReqRedo));
4229 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4230 }
4231}
4232
4233/**
4234 * @callback_method_impl{FNPDMDRVSUSPEND}
4235 *
4236 * When the VM is being suspended, temporarily change to read-only image mode.
4237 *
4238 * This is important for several reasons:
4239 * -# It makes sure that there are no pending writes to the image. Most
4240 * backends implements this by closing and reopening the image in read-only
4241 * mode.
4242 * -# It allows Main to read the images during snapshotting without having
4243 * to account for concurrent writes.
4244 * -# This is essential for making teleportation targets sharing images work
4245 * right. Both with regards to caching and with regards to file sharing
4246 * locks (RTFILE_O_DENY_*). (See also drvvdLoadDone.)
4247 */
4248static DECLCALLBACK(void) drvvdSuspend(PPDMDRVINS pDrvIns)
4249{
4250 LogFlowFunc(("\n"));
4251 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4252
4253 if (pThis->pBlkCache)
4254 {
4255 int rc = PDMR3BlkCacheSuspend(pThis->pBlkCache);
4256 AssertRC(rc);
4257 }
4258
4259 drvvdSetReadonly(pThis);
4260}
4261
4262/**
4263 * @callback_method_impl{FNPDMDRVPOWERON}
4264 */
4265static DECLCALLBACK(void) drvvdPowerOn(PPDMDRVINS pDrvIns)
4266{
4267 LogFlowFunc(("\n"));
4268 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4269 drvvdSetWritable(pThis);
4270 pThis->fErrorUseRuntime = true;
4271}
4272
4273/**
4274 * @callback_method_impl{FNPDMDRVRESET}
4275 */
4276static DECLCALLBACK(void) drvvdReset(PPDMDRVINS pDrvIns)
4277{
4278 LogFlowFunc(("\n"));
4279 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4280
4281 if (pThis->pBlkCache)
4282 {
4283 int rc = PDMR3BlkCacheClear(pThis->pBlkCache);
4284 AssertRC(rc);
4285 }
4286
4287 if (pThis->fBootAccelEnabled)
4288 {
4289 pThis->fBootAccelActive = true;
4290 pThis->cbDataValid = 0;
4291 pThis->offDisk = 0;
4292 }
4293}
4294
4295/**
4296 * @callback_method_impl{FNPDMDRVDESTRUCT}
4297 */
4298static DECLCALLBACK(void) drvvdDestruct(PPDMDRVINS pDrvIns)
4299{
4300 PDMDRV_CHECK_VERSIONS_RETURN_VOID(pDrvIns);
4301 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4302 LogFlowFunc(("\n"));
4303
4304 /*
4305 * Make sure the block cache and disks are closed when this driver is
4306 * destroyed. This method will get called without calling the power off
4307 * callback first when we reconfigure the driver chain after a snapshot.
4308 */
4309 drvvdPowerOffOrDestructOrUnmount(pDrvIns);
4310 if (pThis->MergeLock != NIL_RTSEMRW)
4311 {
4312 int rc = RTSemRWDestroy(pThis->MergeLock);
4313 AssertRC(rc);
4314 pThis->MergeLock = NIL_RTSEMRW;
4315 }
4316 if (pThis->pbData)
4317 {
4318 RTMemFree(pThis->pbData);
4319 pThis->pbData = NULL;
4320 }
4321 if (pThis->pszBwGroup)
4322 {
4323 MMR3HeapFree(pThis->pszBwGroup);
4324 pThis->pszBwGroup = NULL;
4325 }
4326 if (pThis->hHbdMgr != NIL_HBDMGR)
4327 HBDMgrDestroy(pThis->hHbdMgr);
4328 if (pThis->hIoReqCache != NIL_RTMEMCACHE)
4329 RTMemCacheDestroy(pThis->hIoReqCache);
4330 if (pThis->hIoBufMgr != NIL_IOBUFMGR)
4331 IOBUFMgrDestroy(pThis->hIoBufMgr);
4332 if (RTCritSectIsInitialized(&pThis->CritSectIoReqsIoBufWait))
4333 RTCritSectDelete(&pThis->CritSectIoReqsIoBufWait);
4334 if (RTCritSectIsInitialized(&pThis->CritSectIoReqRedo))
4335 RTCritSectDelete(&pThis->CritSectIoReqRedo);
4336 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4337 if (pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc != NIL_RTSEMFASTMUTEX)
4338 RTSemFastMutexDestroy(pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc);
4339}
4340
4341/**
4342 * @callback_method_impl{FNPDMDRVCONSTRUCT,
4343 * Construct a VBox disk media driver instance.}
4344 */
4345static DECLCALLBACK(int) drvvdConstruct(PPDMDRVINS pDrvIns, PCFGMNODE pCfg, uint32_t fFlags)
4346{
4347 RT_NOREF(fFlags);
4348 LogFlowFunc(("\n"));
4349 PDMDRV_CHECK_VERSIONS_RETURN(pDrvIns);
4350 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4351 int rc = VINF_SUCCESS;
4352 char *pszName = NULL; /* The path of the disk image file. */
4353 char *pszFormat = NULL; /* The format backed to use for this image. */
4354 char *pszCachePath = NULL; /* The path to the cache image. */
4355 char *pszCacheFormat = NULL; /* The format backend to use for the cache image. */
4356 bool fReadOnly = false; /* True if the media is read-only. */
4357 bool fMaybeReadOnly = false; /* True if the media may or may not be read-only. */
4358 bool fHonorZeroWrites = false; /* True if zero blocks should be written. */
4359
4360 /*
4361 * Init the static parts.
4362 */
4363 pDrvIns->IBase.pfnQueryInterface = drvvdQueryInterface;
4364 pThis->pDrvIns = pDrvIns;
4365 pThis->fTempReadOnly = false;
4366 pThis->pDisk = NULL;
4367 pThis->fAsyncIOSupported = false;
4368 pThis->fShareable = false;
4369 pThis->fMergePending = false;
4370 pThis->MergeCompleteMutex = NIL_RTSEMFASTMUTEX;
4371 pThis->MergeLock = NIL_RTSEMRW;
4372 pThis->uMergeSource = VD_LAST_IMAGE;
4373 pThis->uMergeTarget = VD_LAST_IMAGE;
4374 pThis->pCfgCrypto = NULL;
4375 pThis->pIfSecKey = NULL;
4376 pThis->hIoReqCache = NIL_RTMEMCACHE;
4377 pThis->hIoBufMgr = NIL_IOBUFMGR;
4378
4379 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4380 pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc = NIL_RTSEMFASTMUTEX;
4381
4382 /* IMedia */
4383 pThis->IMedia.pfnRead = drvvdRead;
4384 pThis->IMedia.pfnReadPcBios = drvvdReadPcBios;
4385 pThis->IMedia.pfnWrite = drvvdWrite;
4386 pThis->IMedia.pfnFlush = drvvdFlush;
4387 pThis->IMedia.pfnMerge = drvvdMerge;
4388 pThis->IMedia.pfnSetSecKeyIf = drvvdSetSecKeyIf;
4389 pThis->IMedia.pfnGetSize = drvvdGetSize;
4390 pThis->IMedia.pfnGetSectorSize = drvvdGetSectorSize;
4391 pThis->IMedia.pfnIsReadOnly = drvvdIsReadOnly;
4392 pThis->IMedia.pfnIsNonRotational = drvvdIsNonRotational;
4393 pThis->IMedia.pfnBiosGetPCHSGeometry = drvvdBiosGetPCHSGeometry;
4394 pThis->IMedia.pfnBiosSetPCHSGeometry = drvvdBiosSetPCHSGeometry;
4395 pThis->IMedia.pfnBiosGetLCHSGeometry = drvvdBiosGetLCHSGeometry;
4396 pThis->IMedia.pfnBiosSetLCHSGeometry = drvvdBiosSetLCHSGeometry;
4397 pThis->IMedia.pfnBiosIsVisible = drvvdBiosIsVisible;
4398 pThis->IMedia.pfnGetType = drvvdGetType;
4399 pThis->IMedia.pfnGetUuid = drvvdGetUuid;
4400 pThis->IMedia.pfnDiscard = drvvdDiscard;
4401 pThis->IMedia.pfnSendCmd = NULL;
4402
4403 /* IMount */
4404 pThis->IMount.pfnUnmount = drvvdUnmount;
4405 pThis->IMount.pfnIsMounted = drvvdIsMounted;
4406 pThis->IMount.pfnLock = drvvdLock;
4407 pThis->IMount.pfnUnlock = drvvdUnlock;
4408 pThis->IMount.pfnIsLocked = drvvdIsLocked;
4409
4410 /* IMediaEx */
4411 pThis->IMediaEx.pfnQueryFeatures = drvvdQueryFeatures;
4412 pThis->IMediaEx.pfnIoReqAllocSizeSet = drvvdIoReqAllocSizeSet;
4413 pThis->IMediaEx.pfnIoReqAlloc = drvvdIoReqAlloc;
4414 pThis->IMediaEx.pfnIoReqFree = drvvdIoReqFree;
4415 pThis->IMediaEx.pfnIoReqQueryResidual = drvvdIoReqQueryResidual;
4416 pThis->IMediaEx.pfnIoReqQueryXferSize = drvvdIoReqQueryXferSize;
4417 pThis->IMediaEx.pfnIoReqCancelAll = drvvdIoReqCancelAll;
4418 pThis->IMediaEx.pfnIoReqCancel = drvvdIoReqCancel;
4419 pThis->IMediaEx.pfnIoReqRead = drvvdIoReqRead;
4420 pThis->IMediaEx.pfnIoReqWrite = drvvdIoReqWrite;
4421 pThis->IMediaEx.pfnIoReqFlush = drvvdIoReqFlush;
4422 pThis->IMediaEx.pfnIoReqDiscard = drvvdIoReqDiscard;
4423 pThis->IMediaEx.pfnIoReqSendScsiCmd = drvvdIoReqSendScsiCmd;
4424 pThis->IMediaEx.pfnIoReqGetActiveCount = drvvdIoReqGetActiveCount;
4425 pThis->IMediaEx.pfnIoReqGetSuspendedCount = drvvdIoReqGetSuspendedCount;
4426 pThis->IMediaEx.pfnIoReqQuerySuspendedStart = drvvdIoReqQuerySuspendedStart;
4427 pThis->IMediaEx.pfnIoReqQuerySuspendedNext = drvvdIoReqQuerySuspendedNext;
4428 pThis->IMediaEx.pfnIoReqSuspendedSave = drvvdIoReqSuspendedSave;
4429 pThis->IMediaEx.pfnIoReqSuspendedLoad = drvvdIoReqSuspendedLoad;
4430
4431 /* Initialize supported VD interfaces. */
4432 pThis->pVDIfsDisk = NULL;
4433
4434 pThis->VDIfError.pfnError = drvvdErrorCallback;
4435 pThis->VDIfError.pfnMessage = NULL;
4436 rc = VDInterfaceAdd(&pThis->VDIfError.Core, "DrvVD_VDIError", VDINTERFACETYPE_ERROR,
4437 pDrvIns, sizeof(VDINTERFACEERROR), &pThis->pVDIfsDisk);
4438 AssertRC(rc);
4439
4440 /* List of images is empty now. */
4441 pThis->pImages = NULL;
4442
4443 pThis->pDrvMediaPort = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMEDIAPORT);
4444 if (!pThis->pDrvMediaPort)
4445 return PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_MISSING_INTERFACE_ABOVE,
4446 N_("No media port interface above"));
4447
4448 pThis->pDrvMountNotify = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMOUNTNOTIFY);
4449
4450 /*
4451 * Try to attach the optional extended media interface port above and initialize associated
4452 * structures if available.
4453 */
4454 pThis->pDrvMediaExPort = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMEDIAEXPORT);
4455 if (pThis->pDrvMediaExPort)
4456 {
4457 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4458 {
4459 rc = RTSemFastMutexCreate(&pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc);
4460 if (RT_FAILURE(rc))
4461 break;
4462 RTListInit(&pThis->aIoReqAllocBins[i].LstIoReqAlloc);
4463 }
4464
4465 if (RT_SUCCESS(rc))
4466 rc = RTCritSectInit(&pThis->CritSectIoReqsIoBufWait);
4467
4468 if (RT_SUCCESS(rc))
4469 rc = RTCritSectInit(&pThis->CritSectIoReqRedo);
4470
4471 if (RT_FAILURE(rc))
4472 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Creating Mutex failed"));
4473
4474 RTListInit(&pThis->LstIoReqIoBufWait);
4475 RTListInit(&pThis->LstIoReqRedo);
4476 }
4477
4478 /* Before we access any VD API load all given plugins. */
4479 rc = drvvdLoadPlugins(pCfg);
4480 if (RT_FAILURE(rc))
4481 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Loading VD plugins failed"));
4482
4483 /*
4484 * Validate configuration and find all parent images.
4485 * It's sort of up side down from the image dependency tree.
4486 */
4487 bool fHostIP = false;
4488 bool fUseNewIo = false;
4489 bool fUseBlockCache = false;
4490 bool fDiscard = false;
4491 bool fInformAboutZeroBlocks = false;
4492 bool fSkipConsistencyChecks = false;
4493 bool fEmptyDrive = false;
4494 unsigned iLevel = 0;
4495 PCFGMNODE pCurNode = pCfg;
4496 uint32_t cbIoBufMax = 0;
4497
4498 for (;;)
4499 {
4500 bool fValid;
4501
4502 if (pCurNode == pCfg)
4503 {
4504 /* Toplevel configuration additionally contains the global image
4505 * open flags. Some might be converted to per-image flags later. */
4506 fValid = CFGMR3AreValuesValid(pCurNode,
4507 "Format\0Path\0"
4508 "ReadOnly\0MaybeReadOnly\0TempReadOnly\0Shareable\0HonorZeroWrites\0"
4509 "HostIPStack\0UseNewIo\0BootAcceleration\0BootAccelerationBuffer\0"
4510 "SetupMerge\0MergeSource\0MergeTarget\0BwGroup\0Type\0BlockCache\0"
4511 "CachePath\0CacheFormat\0Discard\0InformAboutZeroBlocks\0"
4512 "SkipConsistencyChecks\0"
4513 "Locked\0BIOSVisible\0Cylinders\0Heads\0Sectors\0Mountable\0"
4514 "EmptyDrive\0IoBufMax\0NonRotationalMedium\0"
4515#if defined(VBOX_PERIODIC_FLUSH) || defined(VBOX_IGNORE_FLUSH)
4516 "FlushInterval\0IgnoreFlush\0IgnoreFlushAsync\0"
4517#endif /* !(VBOX_PERIODIC_FLUSH || VBOX_IGNORE_FLUSH) */
4518 );
4519 }
4520 else
4521 {
4522 /* All other image configurations only contain image name and
4523 * the format information. */
4524 fValid = CFGMR3AreValuesValid(pCurNode, "Format\0Path\0"
4525 "MergeSource\0MergeTarget\0");
4526 }
4527 if (!fValid)
4528 {
4529 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
4530 RT_SRC_POS, N_("DrvVD: Configuration error: keys incorrect at level %d"), iLevel);
4531 break;
4532 }
4533
4534 if (pCurNode == pCfg)
4535 {
4536 rc = CFGMR3QueryBoolDef(pCurNode, "HostIPStack", &fHostIP, true);
4537 if (RT_FAILURE(rc))
4538 {
4539 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4540 N_("DrvVD: Configuration error: Querying \"HostIPStack\" as boolean failed"));
4541 break;
4542 }
4543
4544 rc = CFGMR3QueryBoolDef(pCurNode, "HonorZeroWrites", &fHonorZeroWrites, false);
4545 if (RT_FAILURE(rc))
4546 {
4547 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4548 N_("DrvVD: Configuration error: Querying \"HonorZeroWrites\" as boolean failed"));
4549 break;
4550 }
4551
4552 rc = CFGMR3QueryBoolDef(pCurNode, "ReadOnly", &fReadOnly, false);
4553 if (RT_FAILURE(rc))
4554 {
4555 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4556 N_("DrvVD: Configuration error: Querying \"ReadOnly\" as boolean failed"));
4557 break;
4558 }
4559
4560 rc = CFGMR3QueryBoolDef(pCurNode, "MaybeReadOnly", &fMaybeReadOnly, false);
4561 if (RT_FAILURE(rc))
4562 {
4563 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4564 N_("DrvVD: Configuration error: Querying \"MaybeReadOnly\" as boolean failed"));
4565 break;
4566 }
4567
4568 rc = CFGMR3QueryBoolDef(pCurNode, "TempReadOnly", &pThis->fTempReadOnly, false);
4569 if (RT_FAILURE(rc))
4570 {
4571 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4572 N_("DrvVD: Configuration error: Querying \"TempReadOnly\" as boolean failed"));
4573 break;
4574 }
4575 if (fReadOnly && pThis->fTempReadOnly)
4576 {
4577 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
4578 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"TempReadOnly\" are set"));
4579 break;
4580 }
4581
4582 rc = CFGMR3QueryBoolDef(pCurNode, "Shareable", &pThis->fShareable, false);
4583 if (RT_FAILURE(rc))
4584 {
4585 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4586 N_("DrvVD: Configuration error: Querying \"Shareable\" as boolean failed"));
4587 break;
4588 }
4589
4590 rc = CFGMR3QueryBoolDef(pCurNode, "UseNewIo", &fUseNewIo, false);
4591 if (RT_FAILURE(rc))
4592 {
4593 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4594 N_("DrvVD: Configuration error: Querying \"UseNewIo\" as boolean failed"));
4595 break;
4596 }
4597 rc = CFGMR3QueryBoolDef(pCurNode, "SetupMerge", &pThis->fMergePending, false);
4598 if (RT_FAILURE(rc))
4599 {
4600 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4601 N_("DrvVD: Configuration error: Querying \"SetupMerge\" as boolean failed"));
4602 break;
4603 }
4604 if (fReadOnly && pThis->fMergePending)
4605 {
4606 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
4607 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"MergePending\" are set"));
4608 break;
4609 }
4610 rc = CFGMR3QueryBoolDef(pCurNode, "BootAcceleration", &pThis->fBootAccelEnabled, false);
4611 if (RT_FAILURE(rc))
4612 {
4613 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4614 N_("DrvVD: Configuration error: Querying \"BootAcceleration\" as boolean failed"));
4615 break;
4616 }
4617 rc = CFGMR3QueryU32Def(pCurNode, "BootAccelerationBuffer", (uint32_t *)&pThis->cbBootAccelBuffer, 16 * _1K);
4618 if (RT_FAILURE(rc))
4619 {
4620 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4621 N_("DrvVD: Configuration error: Querying \"BootAccelerationBuffer\" as integer failed"));
4622 break;
4623 }
4624 rc = CFGMR3QueryBoolDef(pCurNode, "BlockCache", &fUseBlockCache, false);
4625 if (RT_FAILURE(rc))
4626 {
4627 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4628 N_("DrvVD: Configuration error: Querying \"BlockCache\" as boolean failed"));
4629 break;
4630 }
4631 rc = CFGMR3QueryStringAlloc(pCurNode, "BwGroup", &pThis->pszBwGroup);
4632 if (RT_FAILURE(rc) && rc != VERR_CFGM_VALUE_NOT_FOUND)
4633 {
4634 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4635 N_("DrvVD: Configuration error: Querying \"BwGroup\" as string failed"));
4636 break;
4637 }
4638 else
4639 rc = VINF_SUCCESS;
4640 rc = CFGMR3QueryBoolDef(pCurNode, "Discard", &fDiscard, false);
4641 if (RT_FAILURE(rc))
4642 {
4643 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4644 N_("DrvVD: Configuration error: Querying \"Discard\" as boolean failed"));
4645 break;
4646 }
4647 if (fReadOnly && fDiscard)
4648 {
4649 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
4650 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"Discard\" are set"));
4651 break;
4652 }
4653 rc = CFGMR3QueryBoolDef(pCurNode, "InformAboutZeroBlocks", &fInformAboutZeroBlocks, false);
4654 if (RT_FAILURE(rc))
4655 {
4656 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4657 N_("DrvVD: Configuration error: Querying \"InformAboutZeroBlocks\" as boolean failed"));
4658 break;
4659 }
4660 rc = CFGMR3QueryBoolDef(pCurNode, "SkipConsistencyChecks", &fSkipConsistencyChecks, true);
4661 if (RT_FAILURE(rc))
4662 {
4663 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4664 N_("DrvVD: Configuration error: Querying \"SKipConsistencyChecks\" as boolean failed"));
4665 break;
4666 }
4667
4668 char *psz = NULL;
4669 rc = CFGMR3QueryStringAlloc(pCfg, "Type", &psz);
4670 if (RT_FAILURE(rc))
4671 return PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_BLOCK_NO_TYPE, N_("Failed to obtain the sub type"));
4672 pThis->enmType = drvvdGetMediaTypeFromString(psz);
4673 if (pThis->enmType == PDMMEDIATYPE_ERROR)
4674 {
4675 PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_BLOCK_UNKNOWN_TYPE, RT_SRC_POS,
4676 N_("Unknown type \"%s\""), psz);
4677 MMR3HeapFree(psz);
4678 return VERR_PDM_BLOCK_UNKNOWN_TYPE;
4679 }
4680 MMR3HeapFree(psz); psz = NULL;
4681
4682 rc = CFGMR3QueryStringAlloc(pCurNode, "CachePath", &pszCachePath);
4683 if (RT_FAILURE(rc) && rc != VERR_CFGM_VALUE_NOT_FOUND)
4684 {
4685 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4686 N_("DrvVD: Configuration error: Querying \"CachePath\" as string failed"));
4687 break;
4688 }
4689 else
4690 rc = VINF_SUCCESS;
4691
4692 if (pszCachePath)
4693 {
4694 rc = CFGMR3QueryStringAlloc(pCurNode, "CacheFormat", &pszCacheFormat);
4695 if (RT_FAILURE(rc))
4696 {
4697 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4698 N_("DrvVD: Configuration error: Querying \"CacheFormat\" as string failed"));
4699 break;
4700 }
4701 }
4702
4703 /* Mountable */
4704 rc = CFGMR3QueryBoolDef(pCfg, "Mountable", &pThis->fMountable, false);
4705 if (RT_FAILURE(rc))
4706 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Mountable\" from the config"));
4707
4708 /* Locked */
4709 rc = CFGMR3QueryBoolDef(pCfg, "Locked", &pThis->fLocked, false);
4710 if (RT_FAILURE(rc))
4711 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Locked\" from the config"));
4712
4713 /* BIOS visible */
4714 rc = CFGMR3QueryBoolDef(pCfg, "BIOSVisible", &pThis->fBiosVisible, true);
4715 if (RT_FAILURE(rc))
4716 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"BIOSVisible\" from the config"));
4717
4718 /* Cylinders */
4719 rc = CFGMR3QueryU32Def(pCfg, "Cylinders", &pThis->LCHSGeometry.cCylinders, 0);
4720 if (RT_FAILURE(rc))
4721 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Cylinders\" from the config"));
4722
4723 /* Heads */
4724 rc = CFGMR3QueryU32Def(pCfg, "Heads", &pThis->LCHSGeometry.cHeads, 0);
4725 if (RT_FAILURE(rc))
4726 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Heads\" from the config"));
4727
4728 /* Sectors */
4729 rc = CFGMR3QueryU32Def(pCfg, "Sectors", &pThis->LCHSGeometry.cSectors, 0);
4730 if (RT_FAILURE(rc))
4731 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Sectors\" from the config"));
4732
4733 /* Uuid */
4734 rc = CFGMR3QueryStringAlloc(pCfg, "Uuid", &psz);
4735 if (rc == VERR_CFGM_VALUE_NOT_FOUND)
4736 RTUuidClear(&pThis->Uuid);
4737 else if (RT_SUCCESS(rc))
4738 {
4739 rc = RTUuidFromStr(&pThis->Uuid, psz);
4740 if (RT_FAILURE(rc))
4741 {
4742 PDMDrvHlpVMSetError(pDrvIns, rc, RT_SRC_POS, N_("Uuid from string failed on \"%s\""), psz);
4743 MMR3HeapFree(psz);
4744 return rc;
4745 }
4746 MMR3HeapFree(psz); psz = NULL;
4747 }
4748 else
4749 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Uuid\" from the config"));
4750
4751#ifdef VBOX_PERIODIC_FLUSH
4752 rc = CFGMR3QueryU32Def(pCfg, "FlushInterval", &pThis->cbFlushInterval, 0);
4753 if (RT_FAILURE(rc))
4754 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"FlushInterval\" from the config"));
4755#endif /* VBOX_PERIODIC_FLUSH */
4756
4757#ifdef VBOX_IGNORE_FLUSH
4758 rc = CFGMR3QueryBoolDef(pCfg, "IgnoreFlush", &pThis->fIgnoreFlush, true);
4759 if (RT_FAILURE(rc))
4760 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IgnoreFlush\" from the config"));
4761
4762 if (pThis->fIgnoreFlush)
4763 LogRel(("DrvVD: Flushes will be ignored\n"));
4764 else
4765 LogRel(("DrvVD: Flushes will be passed to the disk\n"));
4766
4767 rc = CFGMR3QueryBoolDef(pCfg, "IgnoreFlushAsync", &pThis->fIgnoreFlushAsync, false);
4768 if (RT_FAILURE(rc))
4769 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IgnoreFlushAsync\" from the config"));
4770
4771 if (pThis->fIgnoreFlushAsync)
4772 LogRel(("DrvVD: Async flushes will be ignored\n"));
4773 else
4774 LogRel(("DrvVD: Async flushes will be passed to the disk\n"));
4775#endif /* VBOX_IGNORE_FLUSH */
4776
4777 rc = CFGMR3QueryBoolDef(pCurNode, "EmptyDrive", &fEmptyDrive, false);
4778 if (RT_FAILURE(rc))
4779 {
4780 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4781 N_("DrvVD: Configuration error: Querying \"EmptyDrive\" as boolean failed"));
4782 break;
4783 }
4784
4785 rc = CFGMR3QueryU32Def(pCfg, "IoBufMax", &cbIoBufMax, 5 * _1M);
4786 if (RT_FAILURE(rc))
4787 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IoBufMax\" from the config"));
4788
4789 rc = CFGMR3QueryBoolDef(pCfg, "NonRotationalMedium", &pThis->fNonRotational, false);
4790 if (RT_FAILURE(rc))
4791 return PDMDRV_SET_ERROR(pDrvIns, rc,
4792 N_("DrvVD configuration error: Querying \"NonRotationalMedium\" as boolean failed"));
4793 }
4794
4795 PCFGMNODE pParent = CFGMR3GetChild(pCurNode, "Parent");
4796 if (!pParent)
4797 break;
4798 pCurNode = pParent;
4799 iLevel++;
4800 }
4801
4802 if (pThis->pDrvMediaExPort)
4803 rc = IOBUFMgrCreate(&pThis->hIoBufMgr, cbIoBufMax, pThis->pCfgCrypto ? IOBUFMGR_F_REQUIRE_NOT_PAGABLE : IOBUFMGR_F_DEFAULT);
4804
4805 if ( !fEmptyDrive
4806 && RT_SUCCESS(rc))
4807 {
4808 /*
4809 * Create the image container and the necessary interfaces.
4810 */
4811 if (RT_SUCCESS(rc))
4812 {
4813 /*
4814 * The image has a bandwidth group but the host cache is enabled.
4815 * Use the async I/O framework but tell it to enable the host cache.
4816 */
4817 if (!fUseNewIo && pThis->pszBwGroup)
4818 {
4819 pThis->fAsyncIoWithHostCache = true;
4820 fUseNewIo = true;
4821 }
4822
4823 /** @todo quick hack to work around problems in the async I/O
4824 * implementation (rw semaphore thread ownership problem)
4825 * while a merge is running. Remove once this is fixed. */
4826 if (pThis->fMergePending)
4827 fUseNewIo = false;
4828
4829 if (RT_SUCCESS(rc) && pThis->fMergePending)
4830 {
4831 rc = RTSemFastMutexCreate(&pThis->MergeCompleteMutex);
4832 if (RT_SUCCESS(rc))
4833 rc = RTSemRWCreate(&pThis->MergeLock);
4834 if (RT_SUCCESS(rc))
4835 {
4836 pThis->VDIfThreadSync.pfnStartRead = drvvdThreadStartRead;
4837 pThis->VDIfThreadSync.pfnFinishRead = drvvdThreadFinishRead;
4838 pThis->VDIfThreadSync.pfnStartWrite = drvvdThreadStartWrite;
4839 pThis->VDIfThreadSync.pfnFinishWrite = drvvdThreadFinishWrite;
4840
4841 rc = VDInterfaceAdd(&pThis->VDIfThreadSync.Core, "DrvVD_ThreadSync", VDINTERFACETYPE_THREADSYNC,
4842 pThis, sizeof(VDINTERFACETHREADSYNC), &pThis->pVDIfsDisk);
4843 }
4844 else
4845 {
4846 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4847 N_("DrvVD: Failed to create semaphores for \"MergePending\""));
4848 }
4849 }
4850
4851 if (RT_SUCCESS(rc))
4852 {
4853 rc = VDCreate(pThis->pVDIfsDisk, drvvdGetVDFromMediaType(pThis->enmType), &pThis->pDisk);
4854 /* Error message is already set correctly. */
4855 }
4856 }
4857
4858 if (pThis->pDrvMediaExPort && fUseNewIo)
4859 pThis->fAsyncIOSupported = true;
4860
4861 uint64_t tsStart = RTTimeNanoTS();
4862
4863 unsigned iImageIdx = 0;
4864 while (pCurNode && RT_SUCCESS(rc))
4865 {
4866 /* Allocate per-image data. */
4867 PVBOXIMAGE pImage = drvvdNewImage(pThis);
4868 if (!pImage)
4869 {
4870 rc = VERR_NO_MEMORY;
4871 break;
4872 }
4873
4874 /*
4875 * Read the image configuration.
4876 */
4877 rc = CFGMR3QueryStringAlloc(pCurNode, "Path", &pszName);
4878 if (RT_FAILURE(rc))
4879 {
4880 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4881 N_("DrvVD: Configuration error: Querying \"Path\" as string failed"));
4882 break;
4883 }
4884
4885 rc = CFGMR3QueryStringAlloc(pCurNode, "Format", &pszFormat);
4886 if (RT_FAILURE(rc))
4887 {
4888 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4889 N_("DrvVD: Configuration error: Querying \"Format\" as string failed"));
4890 break;
4891 }
4892
4893 bool fMergeSource;
4894 rc = CFGMR3QueryBoolDef(pCurNode, "MergeSource", &fMergeSource, false);
4895 if (RT_FAILURE(rc))
4896 {
4897 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4898 N_("DrvVD: Configuration error: Querying \"MergeSource\" as boolean failed"));
4899 break;
4900 }
4901 if (fMergeSource)
4902 {
4903 if (pThis->uMergeSource == VD_LAST_IMAGE)
4904 pThis->uMergeSource = iImageIdx;
4905 else
4906 {
4907 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
4908 N_("DrvVD: Configuration error: Multiple \"MergeSource\" occurrences"));
4909 break;
4910 }
4911 }
4912
4913 bool fMergeTarget;
4914 rc = CFGMR3QueryBoolDef(pCurNode, "MergeTarget", &fMergeTarget, false);
4915 if (RT_FAILURE(rc))
4916 {
4917 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
4918 N_("DrvVD: Configuration error: Querying \"MergeTarget\" as boolean failed"));
4919 break;
4920 }
4921 if (fMergeTarget)
4922 {
4923 if (pThis->uMergeTarget == VD_LAST_IMAGE)
4924 pThis->uMergeTarget = iImageIdx;
4925 else
4926 {
4927 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
4928 N_("DrvVD: Configuration error: Multiple \"MergeTarget\" occurrences"));
4929 break;
4930 }
4931 }
4932
4933 PCFGMNODE pCfgVDConfig = CFGMR3GetChild(pCurNode, "VDConfig");
4934 pImage->VDIfConfig.pfnAreKeysValid = drvvdCfgAreKeysValid;
4935 pImage->VDIfConfig.pfnQuerySize = drvvdCfgQuerySize;
4936 pImage->VDIfConfig.pfnQuery = drvvdCfgQuery;
4937 pImage->VDIfConfig.pfnQueryBytes = NULL;
4938 rc = VDInterfaceAdd(&pImage->VDIfConfig.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
4939 pCfgVDConfig, sizeof(VDINTERFACECONFIG), &pImage->pVDIfsImage);
4940 AssertRC(rc);
4941
4942 /* Check VDConfig for encryption config. */
4943 if (pCfgVDConfig)
4944 pThis->pCfgCrypto = CFGMR3GetChild(pCfgVDConfig, "CRYPT");
4945
4946 if (pThis->pCfgCrypto)
4947 {
4948 /* Setup VDConfig interface for disk encryption support. */
4949 pThis->VDIfCfg.pfnAreKeysValid = drvvdCfgAreKeysValid;
4950 pThis->VDIfCfg.pfnQuerySize = drvvdCfgQuerySize;
4951 pThis->VDIfCfg.pfnQuery = drvvdCfgQuery;
4952 pThis->VDIfCfg.pfnQueryBytes = NULL;
4953
4954 pThis->VDIfCrypto.pfnKeyRetain = drvvdCryptoKeyRetain;
4955 pThis->VDIfCrypto.pfnKeyRelease = drvvdCryptoKeyRelease;
4956 pThis->VDIfCrypto.pfnKeyStorePasswordRetain = drvvdCryptoKeyStorePasswordRetain;
4957 pThis->VDIfCrypto.pfnKeyStorePasswordRelease = drvvdCryptoKeyStorePasswordRelease;
4958 }
4959
4960 /* Unconditionally insert the TCPNET interface, don't bother to check
4961 * if an image really needs it. Will be ignored. Since the TCPNET
4962 * interface is per image we could make this more flexible in the
4963 * future if we want to. */
4964 /* Construct TCPNET callback table depending on the config. This is
4965 * done unconditionally, as uninterested backends will ignore it. */
4966 if (fHostIP)
4967 {
4968 pImage->VDIfTcpNet.pfnSocketCreate = drvvdTcpSocketCreate;
4969 pImage->VDIfTcpNet.pfnSocketDestroy = drvvdTcpSocketDestroy;
4970 pImage->VDIfTcpNet.pfnClientConnect = drvvdTcpClientConnect;
4971 pImage->VDIfTcpNet.pfnIsClientConnected = drvvdTcpIsClientConnected;
4972 pImage->VDIfTcpNet.pfnClientClose = drvvdTcpClientClose;
4973 pImage->VDIfTcpNet.pfnSelectOne = drvvdTcpSelectOne;
4974 pImage->VDIfTcpNet.pfnRead = drvvdTcpRead;
4975 pImage->VDIfTcpNet.pfnWrite = drvvdTcpWrite;
4976 pImage->VDIfTcpNet.pfnSgWrite = drvvdTcpSgWrite;
4977 pImage->VDIfTcpNet.pfnReadNB = drvvdTcpReadNB;
4978 pImage->VDIfTcpNet.pfnWriteNB = drvvdTcpWriteNB;
4979 pImage->VDIfTcpNet.pfnSgWriteNB = drvvdTcpSgWriteNB;
4980 pImage->VDIfTcpNet.pfnFlush = drvvdTcpFlush;
4981 pImage->VDIfTcpNet.pfnSetSendCoalescing = drvvdTcpSetSendCoalescing;
4982 pImage->VDIfTcpNet.pfnGetLocalAddress = drvvdTcpGetLocalAddress;
4983 pImage->VDIfTcpNet.pfnGetPeerAddress = drvvdTcpGetPeerAddress;
4984
4985 /*
4986 * There is a 15ms delay between receiving the data and marking the socket
4987 * as readable on Windows XP which hurts async I/O performance of
4988 * TCP backends badly. Provide a different select method without
4989 * using poll on XP.
4990 * This is only used on XP because it is not as efficient as the one using poll
4991 * and all other Windows versions are working fine.
4992 */
4993 char szOS[64];
4994 memset(szOS, 0, sizeof(szOS));
4995 rc = RTSystemQueryOSInfo(RTSYSOSINFO_PRODUCT, &szOS[0], sizeof(szOS));
4996
4997 if (RT_SUCCESS(rc) && !strncmp(szOS, "Windows XP", 10))
4998 {
4999 LogRel(("VD: Detected Windows XP, disabled poll based waiting for TCP\n"));
5000 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdTcpSelectOneExNoPoll;
5001 }
5002 else
5003 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdTcpSelectOneExPoll;
5004
5005 pImage->VDIfTcpNet.pfnPoke = drvvdTcpPoke;
5006 }
5007 else
5008 {
5009#ifndef VBOX_WITH_INIP
5010 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5011 RT_SRC_POS, N_("DrvVD: Configuration error: TCP over Internal Networking not compiled in"));
5012#else /* VBOX_WITH_INIP */
5013 pImage->VDIfTcpNet.pfnSocketCreate = drvvdINIPSocketCreate;
5014 pImage->VDIfTcpNet.pfnSocketDestroy = drvvdINIPSocketDestroy;
5015 pImage->VDIfTcpNet.pfnClientConnect = drvvdINIPClientConnect;
5016 pImage->VDIfTcpNet.pfnClientClose = drvvdINIPClientClose;
5017 pImage->VDIfTcpNet.pfnIsClientConnected = drvvdINIPIsClientConnected;
5018 pImage->VDIfTcpNet.pfnSelectOne = drvvdINIPSelectOne;
5019 pImage->VDIfTcpNet.pfnRead = drvvdINIPRead;
5020 pImage->VDIfTcpNet.pfnWrite = drvvdINIPWrite;
5021 pImage->VDIfTcpNet.pfnSgWrite = drvvdINIPSgWrite;
5022 pImage->VDIfTcpNet.pfnFlush = drvvdINIPFlush;
5023 pImage->VDIfTcpNet.pfnSetSendCoalescing = drvvdINIPSetSendCoalescing;
5024 pImage->VDIfTcpNet.pfnGetLocalAddress = drvvdINIPGetLocalAddress;
5025 pImage->VDIfTcpNet.pfnGetPeerAddress = drvvdINIPGetPeerAddress;
5026 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdINIPSelectOneEx;
5027 pImage->VDIfTcpNet.pfnPoke = drvvdINIPPoke;
5028#endif /* VBOX_WITH_INIP */
5029 }
5030 rc = VDInterfaceAdd(&pImage->VDIfTcpNet.Core, "DrvVD_TCPNET",
5031 VDINTERFACETYPE_TCPNET, NULL,
5032 sizeof(VDINTERFACETCPNET), &pImage->pVDIfsImage);
5033 AssertRC(rc);
5034
5035 /* Insert the custom I/O interface only if we're told to use new IO.
5036 * Since the I/O interface is per image we could make this more
5037 * flexible in the future if we want to. */
5038 if (fUseNewIo)
5039 {
5040#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
5041 pImage->VDIfIo.pfnOpen = drvvdAsyncIOOpen;
5042 pImage->VDIfIo.pfnClose = drvvdAsyncIOClose;
5043 pImage->VDIfIo.pfnGetSize = drvvdAsyncIOGetSize;
5044 pImage->VDIfIo.pfnSetSize = drvvdAsyncIOSetSize;
5045 pImage->VDIfIo.pfnSetAllocationSize = drvvdAsyncIOSetAllocationSize;
5046 pImage->VDIfIo.pfnReadSync = drvvdAsyncIOReadSync;
5047 pImage->VDIfIo.pfnWriteSync = drvvdAsyncIOWriteSync;
5048 pImage->VDIfIo.pfnFlushSync = drvvdAsyncIOFlushSync;
5049 pImage->VDIfIo.pfnReadAsync = drvvdAsyncIOReadAsync;
5050 pImage->VDIfIo.pfnWriteAsync = drvvdAsyncIOWriteAsync;
5051 pImage->VDIfIo.pfnFlushAsync = drvvdAsyncIOFlushAsync;
5052#else /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5053 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5054 RT_SRC_POS, N_("DrvVD: Configuration error: Async Completion Framework not compiled in"));
5055#endif /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5056 if (RT_SUCCESS(rc))
5057 rc = VDInterfaceAdd(&pImage->VDIfIo.Core, "DrvVD_IO", VDINTERFACETYPE_IO,
5058 pThis, sizeof(VDINTERFACEIO), &pImage->pVDIfsImage);
5059 AssertRC(rc);
5060 }
5061
5062 /*
5063 * Open the image.
5064 */
5065 unsigned uOpenFlags;
5066 if (fReadOnly || pThis->fTempReadOnly || iLevel != 0)
5067 uOpenFlags = VD_OPEN_FLAGS_READONLY;
5068 else
5069 uOpenFlags = VD_OPEN_FLAGS_NORMAL;
5070 if (fHonorZeroWrites)
5071 uOpenFlags |= VD_OPEN_FLAGS_HONOR_ZEROES;
5072 if (pThis->fAsyncIOSupported)
5073 uOpenFlags |= VD_OPEN_FLAGS_ASYNC_IO;
5074 if (pThis->fShareable)
5075 uOpenFlags |= VD_OPEN_FLAGS_SHAREABLE;
5076 if (fDiscard && iLevel == 0)
5077 uOpenFlags |= VD_OPEN_FLAGS_DISCARD;
5078 if (fInformAboutZeroBlocks)
5079 uOpenFlags |= VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS;
5080 if ( (uOpenFlags & VD_OPEN_FLAGS_READONLY)
5081 && fSkipConsistencyChecks)
5082 uOpenFlags |= VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS;
5083
5084 /* Try to open backend in async I/O mode first. */
5085 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5086 if (rc == VERR_NOT_SUPPORTED)
5087 {
5088 pThis->fAsyncIOSupported = false;
5089 uOpenFlags &= ~VD_OPEN_FLAGS_ASYNC_IO;
5090 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5091 }
5092
5093 if (rc == VERR_VD_DISCARD_NOT_SUPPORTED)
5094 {
5095 fDiscard = false;
5096 uOpenFlags &= ~VD_OPEN_FLAGS_DISCARD;
5097 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5098 }
5099
5100 if (!fDiscard)
5101 {
5102 pThis->IMedia.pfnDiscard = NULL;
5103 pThis->IMediaEx.pfnIoReqDiscard = NULL;
5104 }
5105
5106 if (RT_SUCCESS(rc))
5107 {
5108 LogFunc(("%d - Opened '%s' in %s mode\n",
5109 iLevel, pszName,
5110 VDIsReadOnly(pThis->pDisk) ? "read-only" : "read-write"));
5111 if ( VDIsReadOnly(pThis->pDisk)
5112 && !fReadOnly
5113 && !fMaybeReadOnly
5114 && !pThis->fTempReadOnly
5115 && iLevel == 0)
5116 {
5117 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_VD_IMAGE_READ_ONLY, RT_SRC_POS,
5118 N_("Failed to open image '%s' for writing due to wrong permissions"),
5119 pszName);
5120 break;
5121 }
5122 }
5123 else
5124 {
5125 rc = PDMDrvHlpVMSetError(pDrvIns, rc, RT_SRC_POS,
5126 N_("Failed to open image '%s' in %s mode"), pszName,
5127 (uOpenFlags & VD_OPEN_FLAGS_READONLY) ? "read-only" : "read-write");
5128 break;
5129 }
5130
5131 MMR3HeapFree(pszName);
5132 pszName = NULL;
5133 MMR3HeapFree(pszFormat);
5134 pszFormat = NULL;
5135
5136 /* next */
5137 iLevel--;
5138 iImageIdx++;
5139 pCurNode = CFGMR3GetParent(pCurNode);
5140 }
5141
5142 LogRel(("VD: Opening the disk took %lld ns\n", RTTimeNanoTS() - tsStart));
5143
5144 /* Open the cache image if set. */
5145 if ( RT_SUCCESS(rc)
5146 && RT_VALID_PTR(pszCachePath))
5147 {
5148 /* Insert the custom I/O interface only if we're told to use new IO.
5149 * Since the I/O interface is per image we could make this more
5150 * flexible in the future if we want to. */
5151 if (fUseNewIo)
5152 {
5153#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
5154 pThis->VDIfIoCache.pfnOpen = drvvdAsyncIOOpen;
5155 pThis->VDIfIoCache.pfnClose = drvvdAsyncIOClose;
5156 pThis->VDIfIoCache.pfnGetSize = drvvdAsyncIOGetSize;
5157 pThis->VDIfIoCache.pfnSetSize = drvvdAsyncIOSetSize;
5158 pThis->VDIfIoCache.pfnReadSync = drvvdAsyncIOReadSync;
5159 pThis->VDIfIoCache.pfnWriteSync = drvvdAsyncIOWriteSync;
5160 pThis->VDIfIoCache.pfnFlushSync = drvvdAsyncIOFlushSync;
5161 pThis->VDIfIoCache.pfnReadAsync = drvvdAsyncIOReadAsync;
5162 pThis->VDIfIoCache.pfnWriteAsync = drvvdAsyncIOWriteAsync;
5163 pThis->VDIfIoCache.pfnFlushAsync = drvvdAsyncIOFlushAsync;
5164#else /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5165 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5166 RT_SRC_POS, N_("DrvVD: Configuration error: Async Completion Framework not compiled in"));
5167#endif /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5168 if (RT_SUCCESS(rc))
5169 rc = VDInterfaceAdd(&pThis->VDIfIoCache.Core, "DrvVD_IO", VDINTERFACETYPE_IO,
5170 pThis, sizeof(VDINTERFACEIO), &pThis->pVDIfsCache);
5171 AssertRC(rc);
5172 }
5173
5174 rc = VDCacheOpen(pThis->pDisk, pszCacheFormat, pszCachePath, VD_OPEN_FLAGS_NORMAL, pThis->pVDIfsCache);
5175 if (RT_FAILURE(rc))
5176 rc = PDMDRV_SET_ERROR(pDrvIns, rc, N_("DrvVD: Could not open cache image"));
5177 }
5178
5179 if (RT_VALID_PTR(pszCachePath))
5180 MMR3HeapFree(pszCachePath);
5181 if (RT_VALID_PTR(pszCacheFormat))
5182 MMR3HeapFree(pszCacheFormat);
5183
5184 if ( RT_SUCCESS(rc)
5185 && pThis->fMergePending
5186 && ( pThis->uMergeSource == VD_LAST_IMAGE
5187 || pThis->uMergeTarget == VD_LAST_IMAGE))
5188 {
5189 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5190 N_("DrvVD: Configuration error: Inconsistent image merge data"));
5191 }
5192
5193 /* Create the block cache if enabled. */
5194 if ( fUseBlockCache
5195 && !pThis->fShareable
5196 && !fDiscard
5197 && !pThis->pCfgCrypto /* Disk encryption disables the block cache for security reasons */
5198 && RT_SUCCESS(rc))
5199 {
5200 /*
5201 * We need a unique ID for the block cache (to identify the owner of data
5202 * blocks in a saved state). UUIDs are not really suitable because
5203 * there are image formats which don't support them. Furthermore it is
5204 * possible that a new diff image was attached after a saved state
5205 * which changes the UUID.
5206 * However the device "name + device instance + LUN" triple the disk is
5207 * attached to is always constant for saved states.
5208 */
5209 char *pszId = NULL;
5210 uint32_t iInstance, iLUN;
5211 const char *pcszController;
5212
5213 rc = pThis->pDrvMediaPort->pfnQueryDeviceLocation(pThis->pDrvMediaPort, &pcszController,
5214 &iInstance, &iLUN);
5215 if (RT_FAILURE(rc))
5216 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5217 N_("DrvVD: Configuration error: Could not query device data"));
5218 else
5219 {
5220 int cbStr = RTStrAPrintf(&pszId, "%s-%d-%d", pcszController, iInstance, iLUN);
5221
5222 if (cbStr > 0)
5223 {
5224 rc = PDMDrvHlpBlkCacheRetain(pDrvIns, &pThis->pBlkCache,
5225 drvvdBlkCacheXferCompleteIoReq,
5226 drvvdBlkCacheXferEnqueue,
5227 drvvdBlkCacheXferEnqueueDiscard,
5228 pszId);
5229 if (rc == VERR_NOT_SUPPORTED)
5230 {
5231 LogRel(("VD: Block cache is not supported\n"));
5232 rc = VINF_SUCCESS;
5233 }
5234 else
5235 AssertRC(rc);
5236
5237 RTStrFree(pszId);
5238 }
5239 else
5240 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5241 N_("DrvVD: Out of memory when creating block cache"));
5242 }
5243 }
5244
5245 if (RT_SUCCESS(rc))
5246 rc = drvvdSetupFilters(pThis, pCfg);
5247
5248 /*
5249 * Register a load-done callback so we can undo TempReadOnly config before
5250 * we get to drvvdResume. Automatically deregistered upon destruction.
5251 */
5252 if (RT_SUCCESS(rc))
5253 rc = PDMDrvHlpSSMRegisterEx(pDrvIns, 0 /* version */, 0 /* cbGuess */,
5254 NULL /*pfnLivePrep*/, NULL /*pfnLiveExec*/, NULL /*pfnLiveVote*/,
5255 NULL /*pfnSavePrep*/, NULL /*pfnSaveExec*/, NULL /*pfnSaveDone*/,
5256 NULL /*pfnDonePrep*/, NULL /*pfnLoadExec*/, drvvdLoadDone);
5257
5258 /* Setup the boot acceleration stuff if enabled. */
5259 if (RT_SUCCESS(rc) && pThis->fBootAccelEnabled)
5260 {
5261 pThis->cbDisk = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
5262 Assert(pThis->cbDisk > 0);
5263 pThis->pbData = (uint8_t *)RTMemAllocZ(pThis->cbBootAccelBuffer);
5264 if (pThis->pbData)
5265 {
5266 pThis->fBootAccelActive = true;
5267 pThis->offDisk = 0;
5268 pThis->cbDataValid = 0;
5269 LogRel(("VD: Boot acceleration enabled\n"));
5270 }
5271 else
5272 LogRel(("VD: Boot acceleration, out of memory, disabled\n"));
5273 }
5274
5275 if ( RTUuidIsNull(&pThis->Uuid)
5276 && pThis->enmType == PDMMEDIATYPE_HARD_DISK)
5277 VDGetUuid(pThis->pDisk, 0, &pThis->Uuid);
5278
5279 /*
5280 * Automatically upgrade the floppy drive if the specified one is too
5281 * small to represent the whole boot time image. (We cannot do this later
5282 * since the BIOS (and others) gets the info via CMOS.)
5283 *
5284 * This trick should make 2.88 images as well as the fake 15.6 and 63.5 MB
5285 * images despite the hardcoded default 1.44 drive.
5286 */
5287 if ( PDMMEDIATYPE_IS_FLOPPY(pThis->enmType)
5288 && pThis->pDisk)
5289 {
5290 uint64_t const cbFloppyImg = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
5291 PDMMEDIATYPE const enmCfgType = pThis->enmType;
5292 switch (enmCfgType)
5293 {
5294 default:
5295 AssertFailed();
5296 case PDMMEDIATYPE_FLOPPY_360:
5297 if (cbFloppyImg > 40 * 2 * 9 * 512)
5298 pThis->enmType = PDMMEDIATYPE_FLOPPY_720;
5299 /* fall thru */
5300 case PDMMEDIATYPE_FLOPPY_720:
5301 if (cbFloppyImg > 80 * 2 * 14 * 512)
5302 pThis->enmType = PDMMEDIATYPE_FLOPPY_1_20;
5303 /* fall thru */
5304 case PDMMEDIATYPE_FLOPPY_1_20:
5305 if (cbFloppyImg > 80 * 2 * 20 * 512)
5306 pThis->enmType = PDMMEDIATYPE_FLOPPY_1_44;
5307 /* fall thru */
5308 case PDMMEDIATYPE_FLOPPY_1_44:
5309 if (cbFloppyImg > 80 * 2 * 24 * 512)
5310 pThis->enmType = PDMMEDIATYPE_FLOPPY_2_88;
5311 /* fall thru */
5312 case PDMMEDIATYPE_FLOPPY_2_88:
5313 if (cbFloppyImg > 80 * 2 * 48 * 512)
5314 pThis->enmType = PDMMEDIATYPE_FLOPPY_FAKE_15_6;
5315 /* fall thru */
5316 case PDMMEDIATYPE_FLOPPY_FAKE_15_6:
5317 if (cbFloppyImg > 255 * 2 * 63 * 512)
5318 pThis->enmType = PDMMEDIATYPE_FLOPPY_FAKE_63_5;
5319 case PDMMEDIATYPE_FLOPPY_FAKE_63_5:
5320 if (cbFloppyImg > 255 * 2 * 255 * 512)
5321 LogRel(("Warning: Floppy image is larger that 63.5 MB! (%llu bytes)\n", cbFloppyImg));
5322 break;
5323 }
5324 if (pThis->enmType != enmCfgType)
5325 LogRel(("DrvVD: Automatically upgraded floppy drive from %s to %s to better support the %u byte image\n",
5326 drvvdGetTypeName(enmCfgType), drvvdGetTypeName(pThis->enmType), cbFloppyImg));
5327 }
5328 } /* !fEmptyDrive */
5329
5330 if (RT_FAILURE(rc))
5331 {
5332 if (RT_VALID_PTR(pszName))
5333 MMR3HeapFree(pszName);
5334 if (RT_VALID_PTR(pszFormat))
5335 MMR3HeapFree(pszFormat);
5336 /* drvvdDestruct does the rest. */
5337 }
5338
5339 LogFlowFunc(("returns %Rrc\n", rc));
5340 return rc;
5341}
5342
5343/**
5344 * VBox disk container media driver registration record.
5345 */
5346const PDMDRVREG g_DrvVD =
5347{
5348 /* u32Version */
5349 PDM_DRVREG_VERSION,
5350 /* szName */
5351 "VD",
5352 /* szRCMod */
5353 "",
5354 /* szR0Mod */
5355 "",
5356 /* pszDescription */
5357 "Generic VBox disk media driver.",
5358 /* fFlags */
5359 PDM_DRVREG_FLAGS_HOST_BITS_DEFAULT,
5360 /* fClass. */
5361 PDM_DRVREG_CLASS_MEDIA,
5362 /* cMaxInstances */
5363 ~0U,
5364 /* cbInstance */
5365 sizeof(VBOXDISK),
5366 /* pfnConstruct */
5367 drvvdConstruct,
5368 /* pfnDestruct */
5369 drvvdDestruct,
5370 /* pfnRelocate */
5371 NULL,
5372 /* pfnIOCtl */
5373 NULL,
5374 /* pfnPowerOn */
5375 drvvdPowerOn,
5376 /* pfnReset */
5377 drvvdReset,
5378 /* pfnSuspend */
5379 drvvdSuspend,
5380 /* pfnResume */
5381 drvvdResume,
5382 /* pfnAttach */
5383 NULL,
5384 /* pfnDetach */
5385 NULL,
5386 /* pfnPowerOff */
5387 drvvdPowerOff,
5388 /* pfnSoftReset */
5389 NULL,
5390 /* u32EndVersion */
5391 PDM_DRVREG_VERSION
5392};
5393
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette