VirtualBox

source: vbox/trunk/src/VBox/Devices/Storage/DrvVD.cpp@ 70775

Last change on this file since 70775 was 70775, checked in by vboxsync, 7 years ago

Devices/Storage/DrvVD.cpp: Fix assertion

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 214.9 KB
Line 
1/* $Id: DrvVD.cpp 70775 2018-01-28 21:48:16Z vboxsync $ */
2/** @file
3 * DrvVD - Generic VBox disk media driver.
4 */
5
6/*
7 * Copyright (C) 2006-2017 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 */
17
18
19/*********************************************************************************************************************************
20* Header files *
21*********************************************************************************************************************************/
22#define LOG_GROUP LOG_GROUP_DRV_VD
23#include <VBox/vd.h>
24#include <VBox/vmm/pdmdrv.h>
25#include <VBox/vmm/pdmstorageifs.h>
26#include <VBox/vmm/pdmasynccompletion.h>
27#include <VBox/vmm/pdmblkcache.h>
28#include <VBox/vmm/ssm.h>
29#include <iprt/asm.h>
30#include <iprt/alloc.h>
31#include <iprt/assert.h>
32#include <iprt/uuid.h>
33#include <iprt/file.h>
34#include <iprt/string.h>
35#include <iprt/tcp.h>
36#include <iprt/semaphore.h>
37#include <iprt/sg.h>
38#include <iprt/poll.h>
39#include <iprt/pipe.h>
40#include <iprt/system.h>
41#include <iprt/memsafer.h>
42#include <iprt/memcache.h>
43#include <iprt/list.h>
44
45#ifdef VBOX_WITH_INIP
46/* All lwip header files are not C++ safe. So hack around this. */
47RT_C_DECLS_BEGIN
48#include <lwip/opt.h>
49#include <lwip/inet.h>
50#include <lwip/tcp.h>
51#include <lwip/sockets.h>
52# if LWIP_IPV6
53# include <lwip/inet6.h>
54# endif
55RT_C_DECLS_END
56#endif /* VBOX_WITH_INIP */
57
58#include "HBDMgmt.h"
59#include "IOBufMgmt.h"
60
61#include "VBoxDD.h"
62
63#ifdef VBOX_WITH_INIP
64/* Small hack to get at lwIP initialized status */
65extern bool DevINIPConfigured(void);
66#endif /* VBOX_WITH_INIP */
67
68
69/** @def VBOX_PERIODIC_FLUSH
70 * Enable support for periodically flushing the VDI to disk. This may prove
71 * useful for those nasty problems with the ultra-slow host filesystems.
72 * If this is enabled, it can be configured via the CFGM key
73 * "VBoxInternal/Devices/piix3ide/0/LUN#<x>/Config/FlushInterval". @verbatim<x>@endverbatim
74 * must be replaced with the correct LUN number of the disk that should
75 * do the periodic flushes. The value of the key is the number of bytes
76 * written between flushes. A value of 0 (the default) denotes no flushes. */
77#define VBOX_PERIODIC_FLUSH
78
79/** @def VBOX_IGNORE_FLUSH
80 * Enable support for ignoring VDI flush requests. This can be useful for
81 * filesystems that show bad guest IDE write performance (especially with
82 * Windows guests). NOTE that this does not disable the flushes caused by
83 * the periodic flush cache feature above.
84 * If this feature is enabled, it can be configured via the CFGM key
85 * "VBoxInternal/Devices/piix3ide/0/LUN#<x>/Config/IgnoreFlush". @verbatim<x>@endverbatim
86 * must be replaced with the correct LUN number of the disk that should
87 * ignore flush requests. The value of the key is a boolean. The default
88 * is to ignore flushes, i.e. true. */
89#define VBOX_IGNORE_FLUSH
90
91
92/*********************************************************************************************************************************
93* Defined types, constants and macros *
94*********************************************************************************************************************************/
95
96/** Converts a pointer to VBOXDISK::IMedia to a PVBOXDISK. */
97#define PDMIMEDIA_2_VBOXDISK(pInterface) \
98 ( (PVBOXDISK)((uintptr_t)pInterface - RT_OFFSETOF(VBOXDISK, IMedia)) )
99
100/** Saved state version of an I/O request .*/
101#define DRVVD_IOREQ_SAVED_STATE_VERSION UINT32_C(1)
102/** Maximum number of request errors in the release log before muting. */
103#define DRVVD_MAX_LOG_REL_ERRORS 100
104
105/** Forward declaration for the dis kcontainer. */
106typedef struct VBOXDISK *PVBOXDISK;
107
108/**
109 * VBox disk container, image information, private part.
110 */
111
112typedef struct VBOXIMAGE
113{
114 /** Pointer to next image. */
115 struct VBOXIMAGE *pNext;
116 /** Pointer to list of VD interfaces. Per-image. */
117 PVDINTERFACE pVDIfsImage;
118 /** Configuration information interface. */
119 VDINTERFACECONFIG VDIfConfig;
120 /** TCP network stack interface. */
121 VDINTERFACETCPNET VDIfTcpNet;
122 /** I/O interface. */
123 VDINTERFACEIO VDIfIo;
124} VBOXIMAGE, *PVBOXIMAGE;
125
126/**
127 * Storage backend data.
128 */
129typedef struct DRVVDSTORAGEBACKEND
130{
131 /** PDM async completion end point. */
132 PPDMASYNCCOMPLETIONENDPOINT pEndpoint;
133 /** The template. */
134 PPDMASYNCCOMPLETIONTEMPLATE pTemplate;
135 /** Event semaphore for synchronous operations. */
136 RTSEMEVENT EventSem;
137 /** Flag whether a synchronous operation is currently pending. */
138 volatile bool fSyncIoPending;
139 /** Return code of the last completed request. */
140 int rcReqLast;
141 /** Callback routine */
142 PFNVDCOMPLETED pfnCompleted;
143} DRVVDSTORAGEBACKEND, *PDRVVDSTORAGEBACKEND;
144
145/**
146 * VD I/O request state.
147 */
148typedef enum VDIOREQSTATE
149{
150 /** Invalid. */
151 VDIOREQSTATE_INVALID = 0,
152 /** The request is not in use and resides on the free list. */
153 VDIOREQSTATE_FREE,
154 /** The request was just allocated and is not active. */
155 VDIOREQSTATE_ALLOCATED,
156 /** The request was allocated and is in use. */
157 VDIOREQSTATE_ACTIVE,
158 /** The request was suspended and is not actively processed. */
159 VDIOREQSTATE_SUSPENDED,
160 /** The request is in the last step of completion and syncs memory. */
161 VDIOREQSTATE_COMPLETING,
162 /** The request completed. */
163 VDIOREQSTATE_COMPLETED,
164 /** The request was aborted but wasn't returned as complete from the storage
165 * layer below us. */
166 VDIOREQSTATE_CANCELED,
167 /** 32bit hack. */
168 VDIOREQSTATE_32BIT_HACK = 0x7fffffff
169} VDIOREQSTATE;
170
171/**
172 * VD I/O Request.
173 */
174typedef struct PDMMEDIAEXIOREQINT
175{
176 /** List node for the list of allocated requests. */
177 RTLISTNODE NdAllocatedList;
178 /** List for requests waiting for I/O memory or on the redo list. */
179 RTLISTNODE NdLstWait;
180 /** I/O request type. */
181 PDMMEDIAEXIOREQTYPE enmType;
182 /** Request state. */
183 volatile VDIOREQSTATE enmState;
184 /** I/O request ID. */
185 PDMMEDIAEXIOREQID uIoReqId;
186 /** Pointer to the disk container. */
187 PVBOXDISK pDisk;
188 /** Flags. */
189 uint32_t fFlags;
190 /** Timestamp when the request was submitted. */
191 uint64_t tsSubmit;
192 /** Type dependent data. */
193 union
194 {
195 /** Read/Write request sepcific data. */
196 struct
197 {
198 /** Start offset of the request. */
199 uint64_t offStart;
200 /** Size of the request. */
201 size_t cbReq;
202 /** Size left for this request. */
203 size_t cbReqLeft;
204 /** Size of the allocated I/O buffer. */
205 size_t cbIoBuf;
206 /** Pointer to the S/G buffer. */
207 PRTSGBUF pSgBuf;
208 /** Flag whether the pointer is a direct buffer or
209 * was allocated by us. */
210 bool fDirectBuf;
211 /** Buffer management data based on the fDirectBuf flag. */
212 union
213 {
214 /** Direct buffer. */
215 struct
216 {
217 /** Segment for the data buffer. */
218 RTSGSEG Seg;
219 /** S/G buffer structure. */
220 RTSGBUF SgBuf;
221 } Direct;
222 /** I/O buffer descriptor. */
223 IOBUFDESC IoBuf;
224 };
225 } ReadWrite;
226 /** Discard specific data. */
227 struct
228 {
229 /** Pointer to array of ranges to discard. */
230 PRTRANGE paRanges;
231 /** Number of ranges to discard. */
232 unsigned cRanges;
233 } Discard;
234 };
235 /** Allocator specific memory - variable size. */
236 uint8_t abAlloc[1];
237} PDMMEDIAEXIOREQINT;
238/** Pointer to a VD I/O request. */
239typedef PDMMEDIAEXIOREQINT *PPDMMEDIAEXIOREQINT;
240
241/**
242 * Structure for holding a list of allocated requests.
243 */
244typedef struct VDLSTIOREQALLOC
245{
246 /** Mutex protecting the table of allocated requests. */
247 RTSEMFASTMUTEX hMtxLstIoReqAlloc;
248 /** List anchor. */
249 RTLISTANCHOR LstIoReqAlloc;
250} VDLSTIOREQALLOC;
251typedef VDLSTIOREQALLOC *PVDLSTIOREQALLOC;
252
253/** Number of bins for allocated requests. */
254#define DRVVD_VDIOREQ_ALLOC_BINS 8
255
256/**
257 * VBox disk container media main structure, private part.
258 *
259 * @implements PDMIMEDIA
260 * @implements PDMIMEDIAEX
261 * @implements PDMIMOUNT
262 * @implements VDINTERFACEERROR
263 * @implements VDINTERFACETCPNET
264 * @implements VDINTERFACEASYNCIO
265 * @implements VDINTERFACECONFIG
266 */
267typedef struct VBOXDISK
268{
269 /** The VBox disk container. */
270 PVDISK pDisk;
271 /** The media interface. */
272 PDMIMEDIA IMedia;
273 /** Media port. */
274 PPDMIMEDIAPORT pDrvMediaPort;
275 /** Pointer to the driver instance. */
276 PPDMDRVINS pDrvIns;
277 /** Flag whether suspend has changed image open mode to read only. */
278 bool fTempReadOnly;
279 /** Flag whether to use the runtime (true) or startup error facility. */
280 bool fErrorUseRuntime;
281 /** Pointer to list of VD interfaces. Per-disk. */
282 PVDINTERFACE pVDIfsDisk;
283 /** Error interface. */
284 VDINTERFACEERROR VDIfError;
285 /** Thread synchronization interface. */
286 VDINTERFACETHREADSYNC VDIfThreadSync;
287
288 /** Flag whether opened disk supports async I/O operations. */
289 bool fAsyncIOSupported;
290 /** Pointer to the list of data we need to keep per image. */
291 PVBOXIMAGE pImages;
292 /** Flag whether the media should allow concurrent open for writing. */
293 bool fShareable;
294 /** Flag whether a merge operation has been set up. */
295 bool fMergePending;
296 /** Synchronization to prevent destruction before merge finishes. */
297 RTSEMFASTMUTEX MergeCompleteMutex;
298 /** Synchronization between merge and other image accesses. */
299 RTSEMRW MergeLock;
300 /** Source image index for merging. */
301 unsigned uMergeSource;
302 /** Target image index for merging. */
303 unsigned uMergeTarget;
304
305 /** Flag whether boot acceleration is enabled. */
306 bool fBootAccelEnabled;
307 /** Flag whether boot acceleration is currently active. */
308 bool fBootAccelActive;
309 /** Size of the disk, used for read truncation. */
310 uint64_t cbDisk;
311 /** Size of the configured buffer. */
312 size_t cbBootAccelBuffer;
313 /** Start offset for which the buffer holds data. */
314 uint64_t offDisk;
315 /** Number of valid bytes in the buffer. */
316 size_t cbDataValid;
317 /** The disk buffer. */
318 uint8_t *pbData;
319 /** Bandwidth group the disk is assigned to. */
320 char *pszBwGroup;
321 /** Flag whether async I/O using the host cache is enabled. */
322 bool fAsyncIoWithHostCache;
323
324 /** I/O interface for a cache image. */
325 VDINTERFACEIO VDIfIoCache;
326 /** Interface list for the cache image. */
327 PVDINTERFACE pVDIfsCache;
328
329 /** The block cache handle if configured. */
330 PPDMBLKCACHE pBlkCache;
331 /** Host block device manager. */
332 HBDMGR hHbdMgr;
333
334 /** Drive type. */
335 PDMMEDIATYPE enmType;
336 /** Locked indicator. */
337 bool fLocked;
338 /** Mountable indicator. */
339 bool fMountable;
340 /** Visible to the BIOS. */
341 bool fBiosVisible;
342 /** Flag whether this medium should be presented as non rotational. */
343 bool fNonRotational;
344#ifdef VBOX_PERIODIC_FLUSH
345 /** HACK: Configuration value for number of bytes written after which to flush. */
346 uint32_t cbFlushInterval;
347 /** HACK: Current count for the number of bytes written since the last flush. */
348 uint32_t cbDataWritten;
349#endif /* VBOX_PERIODIC_FLUSH */
350#ifdef VBOX_IGNORE_FLUSH
351 /** HACK: Disable flushes for this drive. */
352 bool fIgnoreFlush;
353 /** Disable async flushes for this drive. */
354 bool fIgnoreFlushAsync;
355#endif /* VBOX_IGNORE_FLUSH */
356 /** Our mountable interface. */
357 PDMIMOUNT IMount;
358 /** Pointer to the mount notify interface above us. */
359 PPDMIMOUNTNOTIFY pDrvMountNotify;
360 /** Uuid of the drive. */
361 RTUUID Uuid;
362 /** BIOS PCHS Geometry. */
363 PDMMEDIAGEOMETRY PCHSGeometry;
364 /** BIOS LCHS Geometry. */
365 PDMMEDIAGEOMETRY LCHSGeometry;
366 /** Region list. */
367 PVDREGIONLIST pRegionList;
368
369 /** Cryptographic support
370 * @{ */
371 /** Pointer to the CFGM node containing the config of the crypto filter
372 * if enable. */
373 PCFGMNODE pCfgCrypto;
374 /** Config interface for the encryption filter. */
375 VDINTERFACECONFIG VDIfCfg;
376 /** Crypto interface for the encryption filter. */
377 VDINTERFACECRYPTO VDIfCrypto;
378 /** The secret key interface used to retrieve keys. */
379 PPDMISECKEY pIfSecKey;
380 /** The secret key helper interface used to notify about missing keys. */
381 PPDMISECKEYHLP pIfSecKeyHlp;
382 /** @} */
383
384 /** @name IMEDIAEX interface support specific members.
385 * @{ */
386 /** Pointer to the IMEDIAEXPORT interface above us. */
387 PPDMIMEDIAEXPORT pDrvMediaExPort;
388 /** Our extended media interface. */
389 PDMIMEDIAEX IMediaEx;
390 /** Memory cache for the I/O requests. */
391 RTMEMCACHE hIoReqCache;
392 /** I/O buffer manager. */
393 IOBUFMGR hIoBufMgr;
394 /** Active request counter. */
395 volatile uint32_t cIoReqsActive;
396 /** Bins for allocated requests. */
397 VDLSTIOREQALLOC aIoReqAllocBins[DRVVD_VDIOREQ_ALLOC_BINS];
398 /** List of requests for I/O memory to be available - VDIOREQ::NdLstWait. */
399 RTLISTANCHOR LstIoReqIoBufWait;
400 /** Critical section protecting the list of requests waiting for I/O memory. */
401 RTCRITSECT CritSectIoReqsIoBufWait;
402 /** Number of requests waiting for a I/O buffer. */
403 volatile uint32_t cIoReqsWaiting;
404 /** Flag whether we have to resubmit requests on resume because the
405 * VM was suspended due to a recoverable I/O error.
406 */
407 volatile bool fRedo;
408 /** List of requests we have to redo. */
409 RTLISTANCHOR LstIoReqRedo;
410 /** Criticial section protecting the list of waiting requests. */
411 RTCRITSECT CritSectIoReqRedo;
412 /** Number of errors logged so far. */
413 unsigned cErrors;
414 /** @} */
415
416 /** @name Statistics.
417 * @{ */
418 /** How many attempts were made to query a direct buffer pointer from the
419 * device/driver above. */
420 STAMCOUNTER StatQueryBufAttempts;
421 /** How many attempts to query a direct buffer pointer succeeded. */
422 STAMCOUNTER StatQueryBufSuccess;
423 /** Release statistics: number of bytes written. */
424 STAMCOUNTER StatBytesWritten;
425 /** Release statistics: number of bytes read. */
426 STAMCOUNTER StatBytesRead;
427 /** Release statistics: Number of requests submitted. */
428 STAMCOUNTER StatReqsSubmitted;
429 /** Release statistics: Number of requests failed. */
430 STAMCOUNTER StatReqsFailed;
431 /** Release statistics: Number of requests succeeded. */
432 STAMCOUNTER StatReqsSucceeded;
433 /** Release statistics: Number of flush requests. */
434 STAMCOUNTER StatReqsFlush;
435 /** Release statistics: Number of write requests. */
436 STAMCOUNTER StatReqsWrite;
437 /** Release statistics: Number of read requests. */
438 STAMCOUNTER StatReqsRead;
439 /** Release statistics: Number of discard requests. */
440 STAMCOUNTER StatReqsDiscard;
441 /** Release statistics: Number of I/O requests processed per second. */
442 STAMCOUNTER StatReqsPerSec;
443 /** @} */
444} VBOXDISK;
445
446
447/*********************************************************************************************************************************
448* Internal Functions *
449*********************************************************************************************************************************/
450
451static DECLCALLBACK(void) drvvdMediaExIoReqComplete(void *pvUser1, void *pvUser2, int rcReq);
452static void drvvdPowerOffOrDestructOrUnmount(PPDMDRVINS pDrvIns);
453DECLINLINE(void) drvvdMediaExIoReqBufFree(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq);
454static int drvvdMediaExIoReqCompleteWorker(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify);
455static int drvvdMediaExIoReqReadWriteProcess(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fUpNotify);
456
457/**
458 * Internal: allocate new image descriptor and put it in the list
459 */
460static PVBOXIMAGE drvvdNewImage(PVBOXDISK pThis)
461{
462 AssertPtr(pThis);
463 PVBOXIMAGE pImage = (PVBOXIMAGE)RTMemAllocZ(sizeof(VBOXIMAGE));
464 if (pImage)
465 {
466 pImage->pVDIfsImage = NULL;
467 PVBOXIMAGE *pp = &pThis->pImages;
468 while (*pp != NULL)
469 pp = &(*pp)->pNext;
470 *pp = pImage;
471 pImage->pNext = NULL;
472 }
473
474 return pImage;
475}
476
477/**
478 * Internal: free the list of images descriptors.
479 */
480static void drvvdFreeImages(PVBOXDISK pThis)
481{
482 while (pThis->pImages != NULL)
483 {
484 PVBOXIMAGE p = pThis->pImages;
485 pThis->pImages = pThis->pImages->pNext;
486 RTMemFree(p);
487 }
488}
489
490
491/**
492 * Make the image temporarily read-only.
493 *
494 * @returns VBox status code.
495 * @param pThis The driver instance data.
496 */
497static int drvvdSetReadonly(PVBOXDISK pThis)
498{
499 int rc = VINF_SUCCESS;
500 if ( pThis->pDisk
501 && !VDIsReadOnly(pThis->pDisk))
502 {
503 unsigned uOpenFlags;
504 rc = VDGetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, &uOpenFlags);
505 AssertRC(rc);
506 uOpenFlags |= VD_OPEN_FLAGS_READONLY;
507 rc = VDSetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, uOpenFlags);
508 AssertRC(rc);
509 pThis->fTempReadOnly = true;
510 }
511 return rc;
512}
513
514
515/**
516 * Undo the temporary read-only status of the image.
517 *
518 * @returns VBox status code.
519 * @param pThis The driver instance data.
520 */
521static int drvvdSetWritable(PVBOXDISK pThis)
522{
523 int rc = VINF_SUCCESS;
524 if (pThis->fTempReadOnly)
525 {
526 unsigned uOpenFlags;
527 rc = VDGetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, &uOpenFlags);
528 AssertRC(rc);
529 uOpenFlags &= ~VD_OPEN_FLAGS_READONLY;
530 rc = VDSetOpenFlags(pThis->pDisk, VD_LAST_IMAGE, uOpenFlags);
531 if (RT_SUCCESS(rc))
532 pThis->fTempReadOnly = false;
533 else
534 AssertRC(rc);
535 }
536 return rc;
537}
538
539
540/*********************************************************************************************************************************
541* Error reporting callback *
542*********************************************************************************************************************************/
543
544static DECLCALLBACK(void) drvvdErrorCallback(void *pvUser, int rc, RT_SRC_POS_DECL,
545 const char *pszFormat, va_list va)
546{
547 PPDMDRVINS pDrvIns = (PPDMDRVINS)pvUser;
548 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
549 if (pThis->fErrorUseRuntime)
550 /* We must not pass VMSETRTERR_FLAGS_FATAL as it could lead to a
551 * deadlock: We are probably executed in a thread context != EMT
552 * and the EM thread would wait until every thread is suspended
553 * but we would wait for the EM thread ... */
554
555 PDMDrvHlpVMSetRuntimeErrorV(pDrvIns, /* fFlags=*/ 0, "DrvVD", pszFormat, va);
556 else
557 PDMDrvHlpVMSetErrorV(pDrvIns, rc, RT_SRC_POS_ARGS, pszFormat, va);
558}
559
560
561/*********************************************************************************************************************************
562* VD Async I/O interface implementation *
563*********************************************************************************************************************************/
564
565#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
566
567static DECLCALLBACK(void) drvvdAsyncTaskCompleted(PPDMDRVINS pDrvIns, void *pvTemplateUser, void *pvUser, int rcReq)
568{
569 RT_NOREF(pDrvIns);
570 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pvTemplateUser;
571
572 LogFlowFunc(("pDrvIns=%#p pvTemplateUser=%#p pvUser=%#p rcReq=%d\n",
573 pDrvIns, pvTemplateUser, pvUser, rcReq));
574
575 if (pStorageBackend->fSyncIoPending)
576 {
577 Assert(!pvUser);
578 pStorageBackend->rcReqLast = rcReq;
579 ASMAtomicWriteBool(&pStorageBackend->fSyncIoPending, false);
580 RTSemEventSignal(pStorageBackend->EventSem);
581 }
582 else
583 {
584 int rc;
585
586 AssertPtr(pvUser);
587
588 AssertPtr(pStorageBackend->pfnCompleted);
589 rc = pStorageBackend->pfnCompleted(pvUser, rcReq);
590 AssertRC(rc);
591 }
592}
593
594static DECLCALLBACK(int) drvvdAsyncIOOpen(void *pvUser, const char *pszLocation,
595 uint32_t fOpen,
596 PFNVDCOMPLETED pfnCompleted,
597 void **ppStorage)
598{
599 PVBOXDISK pThis = (PVBOXDISK)pvUser;
600 PDRVVDSTORAGEBACKEND pStorageBackend = NULL;
601 int rc = VINF_SUCCESS;
602
603 /*
604 * Check whether the backend wants to open a block device and try to prepare it
605 * if we didn't claim it yet.
606 *
607 * We only create a block device manager on demand to not waste any resources.
608 */
609 if (HBDMgrIsBlockDevice(pszLocation))
610 {
611 if (pThis->hHbdMgr == NIL_HBDMGR)
612 rc = HBDMgrCreate(&pThis->hHbdMgr);
613
614 if ( RT_SUCCESS(rc)
615 && !HBDMgrIsBlockDeviceClaimed(pThis->hHbdMgr, pszLocation))
616 rc = HBDMgrClaimBlockDevice(pThis->hHbdMgr, pszLocation);
617
618 if (RT_FAILURE(rc))
619 return rc;
620 }
621
622 pStorageBackend = (PDRVVDSTORAGEBACKEND)RTMemAllocZ(sizeof(DRVVDSTORAGEBACKEND));
623 if (pStorageBackend)
624 {
625 pStorageBackend->fSyncIoPending = false;
626 pStorageBackend->rcReqLast = VINF_SUCCESS;
627 pStorageBackend->pfnCompleted = pfnCompleted;
628
629 rc = RTSemEventCreate(&pStorageBackend->EventSem);
630 if (RT_SUCCESS(rc))
631 {
632 rc = PDMDrvHlpAsyncCompletionTemplateCreate(pThis->pDrvIns, &pStorageBackend->pTemplate,
633 drvvdAsyncTaskCompleted, pStorageBackend, "AsyncTaskCompleted");
634 if (RT_SUCCESS(rc))
635 {
636 uint32_t fFlags = (fOpen & RTFILE_O_ACCESS_MASK) == RTFILE_O_READ
637 ? PDMACEP_FILE_FLAGS_READ_ONLY
638 : 0;
639 if (pThis->fShareable)
640 {
641 Assert((fOpen & RTFILE_O_DENY_MASK) == RTFILE_O_DENY_NONE);
642
643 fFlags |= PDMACEP_FILE_FLAGS_DONT_LOCK;
644 }
645 if (pThis->fAsyncIoWithHostCache)
646 fFlags |= PDMACEP_FILE_FLAGS_HOST_CACHE_ENABLED;
647
648 rc = PDMR3AsyncCompletionEpCreateForFile(&pStorageBackend->pEndpoint,
649 pszLocation, fFlags,
650 pStorageBackend->pTemplate);
651
652 if (RT_SUCCESS(rc))
653 {
654 if (pThis->pszBwGroup)
655 rc = PDMR3AsyncCompletionEpSetBwMgr(pStorageBackend->pEndpoint, pThis->pszBwGroup);
656
657 if (RT_SUCCESS(rc))
658 {
659 LogFlow(("drvvdAsyncIOOpen: Successfully opened '%s'; fOpen=%#x pStorage=%p\n",
660 pszLocation, fOpen, pStorageBackend));
661 *ppStorage = pStorageBackend;
662 return VINF_SUCCESS;
663 }
664
665 PDMR3AsyncCompletionEpClose(pStorageBackend->pEndpoint);
666 }
667
668 PDMR3AsyncCompletionTemplateDestroy(pStorageBackend->pTemplate);
669 }
670 RTSemEventDestroy(pStorageBackend->EventSem);
671 }
672 RTMemFree(pStorageBackend);
673 }
674 else
675 rc = VERR_NO_MEMORY;
676
677 return rc;
678}
679
680static DECLCALLBACK(int) drvvdAsyncIOClose(void *pvUser, void *pStorage)
681{
682 RT_NOREF(pvUser);
683 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
684
685 /*
686 * We don't unclaim any block devices on purpose here because they
687 * might get reopened shortly (switching to readonly during suspend)
688 *
689 * Block devices will get unclaimed during destruction of the driver.
690 */
691
692 PDMR3AsyncCompletionEpClose(pStorageBackend->pEndpoint);
693 PDMR3AsyncCompletionTemplateDestroy(pStorageBackend->pTemplate);
694 RTSemEventDestroy(pStorageBackend->EventSem);
695 RTMemFree(pStorageBackend);
696 return VINF_SUCCESS;;
697}
698
699static DECLCALLBACK(int) drvvdAsyncIOReadSync(void *pvUser, void *pStorage, uint64_t uOffset,
700 void *pvBuf, size_t cbRead, size_t *pcbRead)
701{
702 RT_NOREF(pvUser);
703 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
704 RTSGSEG DataSeg;
705 PPDMASYNCCOMPLETIONTASK pTask;
706
707 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
708 Assert(!fOld); NOREF(fOld);
709 DataSeg.cbSeg = cbRead;
710 DataSeg.pvSeg = pvBuf;
711
712 int rc = PDMR3AsyncCompletionEpRead(pStorageBackend->pEndpoint, uOffset, &DataSeg, 1, cbRead, NULL, &pTask);
713 if (RT_FAILURE(rc))
714 return rc;
715
716 if (rc == VINF_AIO_TASK_PENDING)
717 {
718 /* Wait */
719 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
720 AssertRC(rc);
721 }
722 else
723 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
724
725 if (pcbRead)
726 *pcbRead = cbRead;
727
728 return pStorageBackend->rcReqLast;
729}
730
731static DECLCALLBACK(int) drvvdAsyncIOWriteSync(void *pvUser, void *pStorage, uint64_t uOffset,
732 const void *pvBuf, size_t cbWrite, size_t *pcbWritten)
733{
734 RT_NOREF(pvUser);
735 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
736 RTSGSEG DataSeg;
737 PPDMASYNCCOMPLETIONTASK pTask;
738
739 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
740 Assert(!fOld); NOREF(fOld);
741 DataSeg.cbSeg = cbWrite;
742 DataSeg.pvSeg = (void *)pvBuf;
743
744 int rc = PDMR3AsyncCompletionEpWrite(pStorageBackend->pEndpoint, uOffset, &DataSeg, 1, cbWrite, NULL, &pTask);
745 if (RT_FAILURE(rc))
746 return rc;
747
748 if (rc == VINF_AIO_TASK_PENDING)
749 {
750 /* Wait */
751 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
752 AssertRC(rc);
753 }
754 else
755 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
756
757 if (pcbWritten)
758 *pcbWritten = cbWrite;
759
760 return pStorageBackend->rcReqLast;
761}
762
763static DECLCALLBACK(int) drvvdAsyncIOFlushSync(void *pvUser, void *pStorage)
764{
765 RT_NOREF(pvUser);
766 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
767 PPDMASYNCCOMPLETIONTASK pTask;
768
769 LogFlowFunc(("pvUser=%#p pStorage=%#p\n", pvUser, pStorage));
770
771 bool fOld = ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, true);
772 Assert(!fOld); NOREF(fOld);
773
774 int rc = PDMR3AsyncCompletionEpFlush(pStorageBackend->pEndpoint, NULL, &pTask);
775 if (RT_FAILURE(rc))
776 return rc;
777
778 if (rc == VINF_AIO_TASK_PENDING)
779 {
780 /* Wait */
781 LogFlowFunc(("Waiting for flush to complete\n"));
782 rc = RTSemEventWait(pStorageBackend->EventSem, RT_INDEFINITE_WAIT);
783 AssertRC(rc);
784 }
785 else
786 ASMAtomicXchgBool(&pStorageBackend->fSyncIoPending, false);
787
788 return pStorageBackend->rcReqLast;
789}
790
791static DECLCALLBACK(int) drvvdAsyncIOReadAsync(void *pvUser, void *pStorage, uint64_t uOffset,
792 PCRTSGSEG paSegments, size_t cSegments,
793 size_t cbRead, void *pvCompletion,
794 void **ppTask)
795{
796 RT_NOREF(pvUser);
797 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
798
799 int rc = PDMR3AsyncCompletionEpRead(pStorageBackend->pEndpoint, uOffset, paSegments, (unsigned)cSegments, cbRead,
800 pvCompletion, (PPPDMASYNCCOMPLETIONTASK)ppTask);
801 if (rc == VINF_AIO_TASK_PENDING)
802 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
803
804 return rc;
805}
806
807static DECLCALLBACK(int) drvvdAsyncIOWriteAsync(void *pvUser, void *pStorage, uint64_t uOffset,
808 PCRTSGSEG paSegments, size_t cSegments,
809 size_t cbWrite, void *pvCompletion,
810 void **ppTask)
811{
812 RT_NOREF(pvUser);
813 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
814
815 int rc = PDMR3AsyncCompletionEpWrite(pStorageBackend->pEndpoint, uOffset, paSegments, (unsigned)cSegments, cbWrite,
816 pvCompletion, (PPPDMASYNCCOMPLETIONTASK)ppTask);
817 if (rc == VINF_AIO_TASK_PENDING)
818 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
819
820 return rc;
821}
822
823static DECLCALLBACK(int) drvvdAsyncIOFlushAsync(void *pvUser, void *pStorage,
824 void *pvCompletion, void **ppTask)
825{
826 RT_NOREF(pvUser);
827 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
828
829 int rc = PDMR3AsyncCompletionEpFlush(pStorageBackend->pEndpoint, pvCompletion,
830 (PPPDMASYNCCOMPLETIONTASK)ppTask);
831 if (rc == VINF_AIO_TASK_PENDING)
832 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
833
834 return rc;
835}
836
837static DECLCALLBACK(int) drvvdAsyncIOGetSize(void *pvUser, void *pStorage, uint64_t *pcbSize)
838{
839 RT_NOREF(pvUser);
840 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
841
842 return PDMR3AsyncCompletionEpGetSize(pStorageBackend->pEndpoint, pcbSize);
843}
844
845static DECLCALLBACK(int) drvvdAsyncIOSetSize(void *pvUser, void *pStorage, uint64_t cbSize)
846{
847 RT_NOREF(pvUser);
848 PDRVVDSTORAGEBACKEND pStorageBackend = (PDRVVDSTORAGEBACKEND)pStorage;
849
850 return PDMR3AsyncCompletionEpSetSize(pStorageBackend->pEndpoint, cbSize);
851}
852
853static DECLCALLBACK(int) drvvdAsyncIOSetAllocationSize(void *pvUser, void *pvStorage, uint64_t cbSize, uint32_t fFlags)
854{
855 RT_NOREF(pvUser, pvStorage, cbSize, fFlags);
856 return VERR_NOT_SUPPORTED;
857}
858
859#endif /* VBOX_WITH_PDM_ASYNC_COMPLETION */
860
861
862/*********************************************************************************************************************************
863* VD Thread Synchronization interface implementation *
864*********************************************************************************************************************************/
865
866static DECLCALLBACK(int) drvvdThreadStartRead(void *pvUser)
867{
868 PVBOXDISK pThis = (PVBOXDISK)pvUser;
869
870 return RTSemRWRequestRead(pThis->MergeLock, RT_INDEFINITE_WAIT);
871}
872
873static DECLCALLBACK(int) drvvdThreadFinishRead(void *pvUser)
874{
875 PVBOXDISK pThis = (PVBOXDISK)pvUser;
876
877 return RTSemRWReleaseRead(pThis->MergeLock);
878}
879
880static DECLCALLBACK(int) drvvdThreadStartWrite(void *pvUser)
881{
882 PVBOXDISK pThis = (PVBOXDISK)pvUser;
883
884 return RTSemRWRequestWrite(pThis->MergeLock, RT_INDEFINITE_WAIT);
885}
886
887static DECLCALLBACK(int) drvvdThreadFinishWrite(void *pvUser)
888{
889 PVBOXDISK pThis = (PVBOXDISK)pvUser;
890
891 return RTSemRWReleaseWrite(pThis->MergeLock);
892}
893
894
895/*********************************************************************************************************************************
896* VD Configuration interface implementation *
897*********************************************************************************************************************************/
898
899static DECLCALLBACK(bool) drvvdCfgAreKeysValid(void *pvUser, const char *pszzValid)
900{
901 return CFGMR3AreValuesValid((PCFGMNODE)pvUser, pszzValid);
902}
903
904static DECLCALLBACK(int) drvvdCfgQuerySize(void *pvUser, const char *pszName, size_t *pcb)
905{
906 return CFGMR3QuerySize((PCFGMNODE)pvUser, pszName, pcb);
907}
908
909static DECLCALLBACK(int) drvvdCfgQuery(void *pvUser, const char *pszName, char *pszString, size_t cchString)
910{
911 return CFGMR3QueryString((PCFGMNODE)pvUser, pszName, pszString, cchString);
912}
913
914static DECLCALLBACK(int) drvvdCfgQueryBytes(void *pvUser, const char *pszName, void *ppvData, size_t cbData)
915{
916 return CFGMR3QueryBytes((PCFGMNODE)pvUser, pszName, ppvData, cbData);
917}
918
919
920/*******************************************************************************
921* VD Crypto interface implementation for the encryption support *
922*******************************************************************************/
923
924static DECLCALLBACK(int) drvvdCryptoKeyRetain(void *pvUser, const char *pszId, const uint8_t **ppbKey, size_t *pcbKey)
925{
926 PVBOXDISK pThis = (PVBOXDISK)pvUser;
927 int rc = VINF_SUCCESS;
928
929 AssertPtr(pThis->pIfSecKey);
930 if (pThis->pIfSecKey)
931 rc = pThis->pIfSecKey->pfnKeyRetain(pThis->pIfSecKey, pszId, ppbKey, pcbKey);
932 else
933 rc = VERR_NOT_SUPPORTED;
934
935 return rc;
936}
937
938static DECLCALLBACK(int) drvvdCryptoKeyRelease(void *pvUser, const char *pszId)
939{
940 PVBOXDISK pThis = (PVBOXDISK)pvUser;
941 int rc = VINF_SUCCESS;
942
943 AssertPtr(pThis->pIfSecKey);
944 if (pThis->pIfSecKey)
945 rc = pThis->pIfSecKey->pfnKeyRelease(pThis->pIfSecKey, pszId);
946 else
947 rc = VERR_NOT_SUPPORTED;
948
949 return rc;
950}
951
952static DECLCALLBACK(int) drvvdCryptoKeyStorePasswordRetain(void *pvUser, const char *pszId, const char **ppszPassword)
953{
954 PVBOXDISK pThis = (PVBOXDISK)pvUser;
955 int rc = VINF_SUCCESS;
956
957 AssertPtr(pThis->pIfSecKey);
958 if (pThis->pIfSecKey)
959 rc = pThis->pIfSecKey->pfnPasswordRetain(pThis->pIfSecKey, pszId, ppszPassword);
960 else
961 rc = VERR_NOT_SUPPORTED;
962
963 return rc;
964}
965
966static DECLCALLBACK(int) drvvdCryptoKeyStorePasswordRelease(void *pvUser, const char *pszId)
967{
968 PVBOXDISK pThis = (PVBOXDISK)pvUser;
969 int rc = VINF_SUCCESS;
970
971 AssertPtr(pThis->pIfSecKey);
972 if (pThis->pIfSecKey)
973 rc = pThis->pIfSecKey->pfnPasswordRelease(pThis->pIfSecKey, pszId);
974 else
975 rc = VERR_NOT_SUPPORTED;
976
977 return rc;
978}
979
980#ifdef VBOX_WITH_INIP
981
982
983/*********************************************************************************************************************************
984* VD TCP network stack interface implementation - INIP case *
985*********************************************************************************************************************************/
986
987/**
988 * vvl: this structure duplicate meaning of sockaddr,
989 * perhaps it'd be better to get rid of it.
990 */
991typedef union INIPSOCKADDRUNION
992{
993 struct sockaddr Addr;
994 struct sockaddr_in Ipv4;
995#if LWIP_IPV6
996 struct sockaddr_in6 Ipv6;
997#endif
998} INIPSOCKADDRUNION;
999
1000typedef struct INIPSOCKET
1001{
1002 int hSock;
1003} INIPSOCKET, *PINIPSOCKET;
1004
1005static DECLCALLBACK(int) drvvdINIPFlush(VDSOCKET Sock);
1006
1007/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
1008static DECLCALLBACK(int) drvvdINIPSocketCreate(uint32_t fFlags, PVDSOCKET pSock)
1009{
1010 PINIPSOCKET pSocketInt = NULL;
1011
1012 /*
1013 * The extended select method is not supported because it is impossible to wakeup
1014 * the thread.
1015 */
1016 if (fFlags & VD_INTERFACETCPNET_CONNECT_EXTENDED_SELECT)
1017 return VERR_NOT_SUPPORTED;
1018
1019 pSocketInt = (PINIPSOCKET)RTMemAllocZ(sizeof(INIPSOCKET));
1020 if (pSocketInt)
1021 {
1022 pSocketInt->hSock = INT32_MAX;
1023 *pSock = (VDSOCKET)pSocketInt;
1024 return VINF_SUCCESS;
1025 }
1026
1027 return VERR_NO_MEMORY;
1028}
1029
1030/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
1031static DECLCALLBACK(int) drvvdINIPSocketDestroy(VDSOCKET Sock)
1032{
1033 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1034
1035 RTMemFree(pSocketInt);
1036 return VINF_SUCCESS;
1037}
1038
1039/** @interface_method_impl{VDINTERFACETCPNET,pfnClientConnect} */
1040static DECLCALLBACK(int) drvvdINIPClientConnect(VDSOCKET Sock, const char *pszAddress, uint32_t uPort,
1041 RTMSINTERVAL cMillies)
1042{
1043 int rc = VINF_SUCCESS;
1044 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1045 int iInetFamily = PF_INET;
1046 struct in_addr ip;
1047#if LWIP_IPV6
1048 ip6_addr_t ip6;
1049 RT_ZERO(ip6);
1050#endif
1051
1052 NOREF(cMillies); /* LwIP doesn't support connect timeout. */
1053 RT_ZERO(ip); /* Shut up MSC. */
1054
1055 /* Check whether lwIP is set up in this VM instance. */
1056 if (!DevINIPConfigured())
1057 {
1058 LogRelFunc(("no IP stack\n"));
1059 return VERR_NET_HOST_UNREACHABLE;
1060 }
1061 /* Resolve hostname. As there is no standard resolver for lwIP yet,
1062 * just accept numeric IP addresses for now. */
1063#if LWIP_IPV6
1064 if (inet6_aton(pszAddress, &ip6))
1065 iInetFamily = PF_INET6;
1066 else /* concatination with if */
1067#endif
1068 if (!lwip_inet_aton(pszAddress, &ip))
1069 {
1070 LogRelFunc(("cannot resolve IP %s\n", pszAddress));
1071 return VERR_NET_HOST_UNREACHABLE;
1072 }
1073 /* Create socket and connect. */
1074 int iSock = lwip_socket(iInetFamily, SOCK_STREAM, 0);
1075 if (iSock != -1)
1076 {
1077 struct sockaddr *pSockAddr = NULL;
1078 struct sockaddr_in InAddr = {0};
1079#if LWIP_IPV6
1080 struct sockaddr_in6 In6Addr = {0};
1081#endif
1082 if (iInetFamily == PF_INET)
1083 {
1084 InAddr.sin_family = AF_INET;
1085 InAddr.sin_port = htons(uPort);
1086 InAddr.sin_addr = ip;
1087 InAddr.sin_len = sizeof(InAddr);
1088 pSockAddr = (struct sockaddr *)&InAddr;
1089 }
1090#if LWIP_IPV6
1091 else
1092 {
1093 In6Addr.sin6_family = AF_INET6;
1094 In6Addr.sin6_port = htons(uPort);
1095 memcpy(&In6Addr.sin6_addr, &ip6, sizeof(ip6));
1096 In6Addr.sin6_len = sizeof(In6Addr);
1097 pSockAddr = (struct sockaddr *)&In6Addr;
1098 }
1099#endif
1100 if ( pSockAddr
1101 && !lwip_connect(iSock, pSockAddr, pSockAddr->sa_len))
1102 {
1103 pSocketInt->hSock = iSock;
1104 return VINF_SUCCESS;
1105 }
1106 rc = VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1107 lwip_close(iSock);
1108 }
1109 else
1110 rc = VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1111 return rc;
1112}
1113
1114/** @interface_method_impl{VDINTERFACETCPNET,pfnClientClose} */
1115static DECLCALLBACK(int) drvvdINIPClientClose(VDSOCKET Sock)
1116{
1117 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1118
1119 lwip_close(pSocketInt->hSock);
1120 pSocketInt->hSock = INT32_MAX;
1121 return VINF_SUCCESS; /** @todo real solution needed */
1122}
1123
1124/** @interface_method_impl{VDINTERFACETCPNET,pfnIsClientConnected} */
1125static DECLCALLBACK(bool) drvvdINIPIsClientConnected(VDSOCKET Sock)
1126{
1127 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1128
1129 return pSocketInt->hSock != INT32_MAX;
1130}
1131
1132/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOne} */
1133static DECLCALLBACK(int) drvvdINIPSelectOne(VDSOCKET Sock, RTMSINTERVAL cMillies)
1134{
1135 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1136 fd_set fdsetR;
1137 FD_ZERO(&fdsetR);
1138 FD_SET((uintptr_t)pSocketInt->hSock, &fdsetR);
1139 fd_set fdsetE = fdsetR;
1140
1141 int rc;
1142 if (cMillies == RT_INDEFINITE_WAIT)
1143 rc = lwip_select(pSocketInt->hSock + 1, &fdsetR, NULL, &fdsetE, NULL);
1144 else
1145 {
1146 struct timeval timeout;
1147 timeout.tv_sec = cMillies / 1000;
1148 timeout.tv_usec = (cMillies % 1000) * 1000;
1149 rc = lwip_select(pSocketInt->hSock + 1, &fdsetR, NULL, &fdsetE, &timeout);
1150 }
1151 if (rc > 0)
1152 return VINF_SUCCESS;
1153 if (rc == 0)
1154 return VERR_TIMEOUT;
1155 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1156}
1157
1158/** @interface_method_impl{VDINTERFACETCPNET,pfnRead} */
1159static DECLCALLBACK(int) drvvdINIPRead(VDSOCKET Sock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1160{
1161 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1162
1163 /* Do params checking */
1164 if (!pvBuffer || !cbBuffer)
1165 {
1166 AssertMsgFailed(("Invalid params\n"));
1167 return VERR_INVALID_PARAMETER;
1168 }
1169
1170 /*
1171 * Read loop.
1172 * If pcbRead is NULL we have to fill the entire buffer!
1173 */
1174 size_t cbRead = 0;
1175 size_t cbToRead = cbBuffer;
1176 for (;;)
1177 {
1178 /** @todo this clipping here is just in case (the send function
1179 * needed it, so I added it here, too). Didn't investigate if this
1180 * really has issues. Better be safe than sorry. */
1181 ssize_t cbBytesRead = lwip_recv(pSocketInt->hSock, (char *)pvBuffer + cbRead,
1182 RT_MIN(cbToRead, 32768), 0);
1183 if (cbBytesRead < 0)
1184 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution */
1185 if (cbBytesRead == 0 && errno) /** @todo r=bird: lwip_recv will not touch errno on Windows. This may apply to other hosts as well */
1186 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution */
1187 if (pcbRead)
1188 {
1189 /* return partial data */
1190 *pcbRead = cbBytesRead;
1191 break;
1192 }
1193
1194 /* read more? */
1195 cbRead += cbBytesRead;
1196 if (cbRead == cbBuffer)
1197 break;
1198
1199 /* next */
1200 cbToRead = cbBuffer - cbRead;
1201 }
1202
1203 return VINF_SUCCESS;
1204}
1205
1206/** @interface_method_impl{VDINTERFACETCPNET,pfnWrite} */
1207static DECLCALLBACK(int) drvvdINIPWrite(VDSOCKET Sock, const void *pvBuffer, size_t cbBuffer)
1208{
1209 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1210
1211 do
1212 {
1213 /** @todo lwip send only supports up to 65535 bytes in a single
1214 * send (stupid limitation buried in the code), so make sure we
1215 * don't get any wraparounds. This should be moved to DevINIP
1216 * stack interface once that's implemented. */
1217 ssize_t cbWritten = lwip_send(pSocketInt->hSock, (void *)pvBuffer,
1218 RT_MIN(cbBuffer, 32768), 0);
1219 if (cbWritten < 0)
1220 return VERR_NET_CONNECTION_REFUSED; /** @todo real solution needed */
1221 AssertMsg(cbBuffer >= (size_t)cbWritten, ("Wrote more than we requested!!! cbWritten=%d cbBuffer=%d\n",
1222 cbWritten, cbBuffer));
1223 cbBuffer -= cbWritten;
1224 pvBuffer = (const char *)pvBuffer + cbWritten;
1225 } while (cbBuffer);
1226
1227 return VINF_SUCCESS;
1228}
1229
1230/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWrite} */
1231static DECLCALLBACK(int) drvvdINIPSgWrite(VDSOCKET Sock, PCRTSGBUF pSgBuf)
1232{
1233 int rc = VINF_SUCCESS;
1234
1235 /* This is an extremely crude emulation, however it's good enough
1236 * for our iSCSI code. INIP has no sendmsg(). */
1237 for (unsigned i = 0; i < pSgBuf->cSegs; i++)
1238 {
1239 rc = drvvdINIPWrite(Sock, pSgBuf->paSegs[i].pvSeg,
1240 pSgBuf->paSegs[i].cbSeg);
1241 if (RT_FAILURE(rc))
1242 break;
1243 }
1244 if (RT_SUCCESS(rc))
1245 drvvdINIPFlush(Sock);
1246
1247 return rc;
1248}
1249
1250/** @interface_method_impl{VDINTERFACETCPNET,pfnFlush} */
1251static DECLCALLBACK(int) drvvdINIPFlush(VDSOCKET Sock)
1252{
1253 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1254
1255 int fFlag = 1;
1256 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1257 (const char *)&fFlag, sizeof(fFlag));
1258 fFlag = 0;
1259 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1260 (const char *)&fFlag, sizeof(fFlag));
1261 return VINF_SUCCESS;
1262}
1263
1264/** @interface_method_impl{VDINTERFACETCPNET,pfnSetSendCoalescing} */
1265static DECLCALLBACK(int) drvvdINIPSetSendCoalescing(VDSOCKET Sock, bool fEnable)
1266{
1267 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1268
1269 int fFlag = fEnable ? 0 : 1;
1270 lwip_setsockopt(pSocketInt->hSock, IPPROTO_TCP, TCP_NODELAY,
1271 (const char *)&fFlag, sizeof(fFlag));
1272 return VINF_SUCCESS;
1273}
1274
1275/** @interface_method_impl{VDINTERFACETCPNET,pfnGetLocalAddress} */
1276static DECLCALLBACK(int) drvvdINIPGetLocalAddress(VDSOCKET Sock, PRTNETADDR pAddr)
1277{
1278 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1279 INIPSOCKADDRUNION u;
1280 socklen_t cbAddr = sizeof(u);
1281 RT_ZERO(u);
1282 if (!lwip_getsockname(pSocketInt->hSock, &u.Addr, &cbAddr))
1283 {
1284 /*
1285 * Convert the address.
1286 */
1287 if ( cbAddr == sizeof(struct sockaddr_in)
1288 && u.Addr.sa_family == AF_INET)
1289 {
1290 RT_ZERO(*pAddr);
1291 pAddr->enmType = RTNETADDRTYPE_IPV4;
1292 pAddr->uPort = RT_N2H_U16(u.Ipv4.sin_port);
1293 pAddr->uAddr.IPv4.u = u.Ipv4.sin_addr.s_addr;
1294 }
1295#if LWIP_IPV6
1296 else if ( cbAddr == sizeof(struct sockaddr_in6)
1297 && u.Addr.sa_family == AF_INET6)
1298 {
1299 RT_ZERO(*pAddr);
1300 pAddr->enmType = RTNETADDRTYPE_IPV6;
1301 pAddr->uPort = RT_N2H_U16(u.Ipv6.sin6_port);
1302 memcpy(&pAddr->uAddr.IPv6, &u.Ipv6.sin6_addr, sizeof(RTNETADDRIPV6));
1303 }
1304#endif
1305 else
1306 return VERR_NET_ADDRESS_FAMILY_NOT_SUPPORTED;
1307 return VINF_SUCCESS;
1308 }
1309 return VERR_NET_OPERATION_NOT_SUPPORTED;
1310}
1311
1312/** @interface_method_impl{VDINTERFACETCPNET,pfnGetPeerAddress} */
1313static DECLCALLBACK(int) drvvdINIPGetPeerAddress(VDSOCKET Sock, PRTNETADDR pAddr)
1314{
1315 PINIPSOCKET pSocketInt = (PINIPSOCKET)Sock;
1316 INIPSOCKADDRUNION u;
1317 socklen_t cbAddr = sizeof(u);
1318 RT_ZERO(u);
1319 if (!lwip_getpeername(pSocketInt->hSock, &u.Addr, &cbAddr))
1320 {
1321 /*
1322 * Convert the address.
1323 */
1324 if ( cbAddr == sizeof(struct sockaddr_in)
1325 && u.Addr.sa_family == AF_INET)
1326 {
1327 RT_ZERO(*pAddr);
1328 pAddr->enmType = RTNETADDRTYPE_IPV4;
1329 pAddr->uPort = RT_N2H_U16(u.Ipv4.sin_port);
1330 pAddr->uAddr.IPv4.u = u.Ipv4.sin_addr.s_addr;
1331 }
1332#if LWIP_IPV6
1333 else if ( cbAddr == sizeof(struct sockaddr_in6)
1334 && u.Addr.sa_family == AF_INET6)
1335 {
1336 RT_ZERO(*pAddr);
1337 pAddr->enmType = RTNETADDRTYPE_IPV6;
1338 pAddr->uPort = RT_N2H_U16(u.Ipv6.sin6_port);
1339 memcpy(&pAddr->uAddr.IPv6, &u.Ipv6.sin6_addr, sizeof(RTNETADDRIPV6));
1340 }
1341#endif
1342 else
1343 return VERR_NET_ADDRESS_FAMILY_NOT_SUPPORTED;
1344 return VINF_SUCCESS;
1345 }
1346 return VERR_NET_OPERATION_NOT_SUPPORTED;
1347}
1348
1349/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOneEx} */
1350static DECLCALLBACK(int) drvvdINIPSelectOneEx(VDSOCKET Sock, uint32_t fEvents, uint32_t *pfEvents, RTMSINTERVAL cMillies)
1351{
1352 RT_NOREF(Sock, fEvents, pfEvents, cMillies);
1353 AssertMsgFailed(("Not supported!\n"));
1354 return VERR_NOT_SUPPORTED;
1355}
1356
1357/** @interface_method_impl{VDINTERFACETCPNET,pfnPoke} */
1358static DECLCALLBACK(int) drvvdINIPPoke(VDSOCKET Sock)
1359{
1360 RT_NOREF(Sock);
1361 AssertMsgFailed(("Not supported!\n"));
1362 return VERR_NOT_SUPPORTED;
1363}
1364
1365#endif /* VBOX_WITH_INIP */
1366
1367
1368/*********************************************************************************************************************************
1369* VD TCP network stack interface implementation - Host TCP case *
1370*********************************************************************************************************************************/
1371
1372/**
1373 * Socket data.
1374 */
1375typedef struct VDSOCKETINT
1376{
1377 /** IPRT socket handle. */
1378 RTSOCKET hSocket;
1379 /** Pollset with the wakeup pipe and socket. */
1380 RTPOLLSET hPollSet;
1381 /** Pipe endpoint - read (in the pollset). */
1382 RTPIPE hPipeR;
1383 /** Pipe endpoint - write. */
1384 RTPIPE hPipeW;
1385 /** Flag whether the thread was woken up. */
1386 volatile bool fWokenUp;
1387 /** Flag whether the thread is waiting in the select call. */
1388 volatile bool fWaiting;
1389 /** Old event mask. */
1390 uint32_t fEventsOld;
1391} VDSOCKETINT, *PVDSOCKETINT;
1392
1393/** Pollset id of the socket. */
1394#define VDSOCKET_POLL_ID_SOCKET 0
1395/** Pollset id of the pipe. */
1396#define VDSOCKET_POLL_ID_PIPE 1
1397
1398/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketCreate} */
1399static DECLCALLBACK(int) drvvdTcpSocketCreate(uint32_t fFlags, PVDSOCKET phVdSock)
1400{
1401 int rc = VINF_SUCCESS;
1402 int rc2 = VINF_SUCCESS;
1403 PVDSOCKETINT pSockInt = NULL;
1404
1405 pSockInt = (PVDSOCKETINT)RTMemAllocZ(sizeof(VDSOCKETINT));
1406 if (!pSockInt)
1407 return VERR_NO_MEMORY;
1408
1409 pSockInt->hSocket = NIL_RTSOCKET;
1410 pSockInt->hPollSet = NIL_RTPOLLSET;
1411 pSockInt->hPipeR = NIL_RTPIPE;
1412 pSockInt->hPipeW = NIL_RTPIPE;
1413 pSockInt->fWokenUp = false;
1414 pSockInt->fWaiting = false;
1415
1416 if (fFlags & VD_INTERFACETCPNET_CONNECT_EXTENDED_SELECT)
1417 {
1418 /* Init pipe and pollset. */
1419 rc = RTPipeCreate(&pSockInt->hPipeR, &pSockInt->hPipeW, 0);
1420 if (RT_SUCCESS(rc))
1421 {
1422 rc = RTPollSetCreate(&pSockInt->hPollSet);
1423 if (RT_SUCCESS(rc))
1424 {
1425 rc = RTPollSetAddPipe(pSockInt->hPollSet, pSockInt->hPipeR,
1426 RTPOLL_EVT_READ, VDSOCKET_POLL_ID_PIPE);
1427 if (RT_SUCCESS(rc))
1428 {
1429 *phVdSock = pSockInt;
1430 return VINF_SUCCESS;
1431 }
1432
1433 RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_PIPE);
1434 rc2 = RTPollSetDestroy(pSockInt->hPollSet);
1435 AssertRC(rc2);
1436 }
1437
1438 rc2 = RTPipeClose(pSockInt->hPipeR);
1439 AssertRC(rc2);
1440 rc2 = RTPipeClose(pSockInt->hPipeW);
1441 AssertRC(rc2);
1442 }
1443 }
1444 else
1445 {
1446 *phVdSock = pSockInt;
1447 return VINF_SUCCESS;
1448 }
1449
1450 RTMemFree(pSockInt);
1451
1452 return rc;
1453}
1454
1455/** @interface_method_impl{VDINTERFACETCPNET,pfnSocketDestroy} */
1456static DECLCALLBACK(int) drvvdTcpSocketDestroy(VDSOCKET hVdSock)
1457{
1458 int rc = VINF_SUCCESS;
1459 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1460
1461 /* Destroy the pipe and pollset if necessary. */
1462 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1463 {
1464 if (pSockInt->hSocket != NIL_RTSOCKET)
1465 {
1466 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1467 Assert(RT_SUCCESS(rc) || rc == VERR_POLL_HANDLE_ID_NOT_FOUND);
1468 }
1469 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_PIPE);
1470 AssertRC(rc);
1471 rc = RTPollSetDestroy(pSockInt->hPollSet);
1472 AssertRC(rc);
1473 rc = RTPipeClose(pSockInt->hPipeR);
1474 AssertRC(rc);
1475 rc = RTPipeClose(pSockInt->hPipeW);
1476 AssertRC(rc);
1477 }
1478
1479 if (pSockInt->hSocket != NIL_RTSOCKET)
1480 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1481
1482 RTMemFree(pSockInt);
1483
1484 return rc;
1485}
1486
1487/** @interface_method_impl{VDINTERFACETCPNET,pfnClientConnect} */
1488static DECLCALLBACK(int) drvvdTcpClientConnect(VDSOCKET hVdSock, const char *pszAddress, uint32_t uPort,
1489 RTMSINTERVAL cMillies)
1490{
1491 int rc = VINF_SUCCESS;
1492 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1493
1494 rc = RTTcpClientConnectEx(pszAddress, uPort, &pSockInt->hSocket, cMillies, NULL);
1495 if (RT_SUCCESS(rc))
1496 {
1497 /* Add to the pollset if required. */
1498 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1499 {
1500 pSockInt->fEventsOld = RTPOLL_EVT_READ | RTPOLL_EVT_WRITE | RTPOLL_EVT_ERROR;
1501
1502 rc = RTPollSetAddSocket(pSockInt->hPollSet, pSockInt->hSocket,
1503 pSockInt->fEventsOld, VDSOCKET_POLL_ID_SOCKET);
1504 }
1505
1506 if (RT_SUCCESS(rc))
1507 return VINF_SUCCESS;
1508
1509 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1510 }
1511
1512 return rc;
1513}
1514
1515/** @interface_method_impl{VDINTERFACETCPNET,pfnClientClose} */
1516static DECLCALLBACK(int) drvvdTcpClientClose(VDSOCKET hVdSock)
1517{
1518 int rc = VINF_SUCCESS;
1519 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1520
1521 if (pSockInt->hPollSet != NIL_RTPOLLSET)
1522 {
1523 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1524 AssertRC(rc);
1525 }
1526
1527 rc = RTTcpClientCloseEx(pSockInt->hSocket, false /*fGracefulShutdown*/);
1528 pSockInt->hSocket = NIL_RTSOCKET;
1529
1530 return rc;
1531}
1532
1533/** @interface_method_impl{VDINTERFACETCPNET,pfnIsClientConnected} */
1534static DECLCALLBACK(bool) drvvdTcpIsClientConnected(VDSOCKET hVdSock)
1535{
1536 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1537
1538 return pSockInt->hSocket != NIL_RTSOCKET;
1539}
1540
1541/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOne} */
1542static DECLCALLBACK(int) drvvdTcpSelectOne(VDSOCKET hVdSock, RTMSINTERVAL cMillies)
1543{
1544 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1545
1546 return RTTcpSelectOne(pSockInt->hSocket, cMillies);
1547}
1548
1549/** @interface_method_impl{VDINTERFACETCPNET,pfnRead} */
1550static DECLCALLBACK(int) drvvdTcpRead(VDSOCKET hVdSock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1551{
1552 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1553
1554 return RTTcpRead(pSockInt->hSocket, pvBuffer, cbBuffer, pcbRead);
1555}
1556
1557/** @interface_method_impl{VDINTERFACETCPNET,pfnWrite} */
1558static DECLCALLBACK(int) drvvdTcpWrite(VDSOCKET hVdSock, const void *pvBuffer, size_t cbBuffer)
1559{
1560 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1561
1562 return RTTcpWrite(pSockInt->hSocket, pvBuffer, cbBuffer);
1563}
1564
1565/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWrite} */
1566static DECLCALLBACK(int) drvvdTcpSgWrite(VDSOCKET hVdSock, PCRTSGBUF pSgBuf)
1567{
1568 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1569
1570 return RTTcpSgWrite(pSockInt->hSocket, pSgBuf);
1571}
1572
1573/** @interface_method_impl{VDINTERFACETCPNET,pfnReadNB} */
1574static DECLCALLBACK(int) drvvdTcpReadNB(VDSOCKET hVdSock, void *pvBuffer, size_t cbBuffer, size_t *pcbRead)
1575{
1576 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1577
1578 return RTTcpReadNB(pSockInt->hSocket, pvBuffer, cbBuffer, pcbRead);
1579}
1580
1581/** @interface_method_impl{VDINTERFACETCPNET,pfnWriteNB} */
1582static DECLCALLBACK(int) drvvdTcpWriteNB(VDSOCKET hVdSock, const void *pvBuffer, size_t cbBuffer, size_t *pcbWritten)
1583{
1584 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1585
1586 return RTTcpWriteNB(pSockInt->hSocket, pvBuffer, cbBuffer, pcbWritten);
1587}
1588
1589/** @interface_method_impl{VDINTERFACETCPNET,pfnSgWriteNB} */
1590static DECLCALLBACK(int) drvvdTcpSgWriteNB(VDSOCKET hVdSock, PRTSGBUF pSgBuf, size_t *pcbWritten)
1591{
1592 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1593
1594 return RTTcpSgWriteNB(pSockInt->hSocket, pSgBuf, pcbWritten);
1595}
1596
1597/** @interface_method_impl{VDINTERFACETCPNET,pfnFlush} */
1598static DECLCALLBACK(int) drvvdTcpFlush(VDSOCKET hVdSock)
1599{
1600 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1601
1602 return RTTcpFlush(pSockInt->hSocket);
1603}
1604
1605/** @interface_method_impl{VDINTERFACETCPNET,pfnSetSendCoalescing} */
1606static DECLCALLBACK(int) drvvdTcpSetSendCoalescing(VDSOCKET hVdSock, bool fEnable)
1607{
1608 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1609
1610 return RTTcpSetSendCoalescing(pSockInt->hSocket, fEnable);
1611}
1612
1613/** @interface_method_impl{VDINTERFACETCPNET,pfnGetLocalAddress} */
1614static DECLCALLBACK(int) drvvdTcpGetLocalAddress(VDSOCKET hVdSock, PRTNETADDR pAddr)
1615{
1616 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1617
1618 return RTTcpGetLocalAddress(pSockInt->hSocket, pAddr);
1619}
1620
1621/** @interface_method_impl{VDINTERFACETCPNET,pfnGetPeerAddress} */
1622static DECLCALLBACK(int) drvvdTcpGetPeerAddress(VDSOCKET hVdSock, PRTNETADDR pAddr)
1623{
1624 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1625
1626 return RTTcpGetPeerAddress(pSockInt->hSocket, pAddr);
1627}
1628
1629static DECLCALLBACK(int) drvvdTcpSelectOneExPoll(VDSOCKET hVdSock, uint32_t fEvents,
1630 uint32_t *pfEvents, RTMSINTERVAL cMillies)
1631{
1632 int rc = VINF_SUCCESS;
1633 uint32_t id = 0;
1634 uint32_t fEventsRecv = 0;
1635 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1636
1637 *pfEvents = 0;
1638
1639 if ( pSockInt->fEventsOld != fEvents
1640 && pSockInt->hSocket != NIL_RTSOCKET)
1641 {
1642 uint32_t fPollEvents = 0;
1643
1644 if (fEvents & VD_INTERFACETCPNET_EVT_READ)
1645 fPollEvents |= RTPOLL_EVT_READ;
1646 if (fEvents & VD_INTERFACETCPNET_EVT_WRITE)
1647 fPollEvents |= RTPOLL_EVT_WRITE;
1648 if (fEvents & VD_INTERFACETCPNET_EVT_ERROR)
1649 fPollEvents |= RTPOLL_EVT_ERROR;
1650
1651 rc = RTPollSetEventsChange(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET, fPollEvents);
1652 if (RT_FAILURE(rc))
1653 return rc;
1654
1655 pSockInt->fEventsOld = fEvents;
1656 }
1657
1658 ASMAtomicXchgBool(&pSockInt->fWaiting, true);
1659 if (ASMAtomicXchgBool(&pSockInt->fWokenUp, false))
1660 {
1661 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1662 return VERR_INTERRUPTED;
1663 }
1664
1665 rc = RTPoll(pSockInt->hPollSet, cMillies, &fEventsRecv, &id);
1666 Assert(RT_SUCCESS(rc) || rc == VERR_TIMEOUT);
1667
1668 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1669
1670 if (RT_SUCCESS(rc))
1671 {
1672 if (id == VDSOCKET_POLL_ID_SOCKET)
1673 {
1674 fEventsRecv &= RTPOLL_EVT_VALID_MASK;
1675
1676 if (fEventsRecv & RTPOLL_EVT_READ)
1677 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1678 if (fEventsRecv & RTPOLL_EVT_WRITE)
1679 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1680 if (fEventsRecv & RTPOLL_EVT_ERROR)
1681 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1682 }
1683 else
1684 {
1685 size_t cbRead = 0;
1686 uint8_t abBuf[10];
1687 Assert(id == VDSOCKET_POLL_ID_PIPE);
1688 Assert((fEventsRecv & RTPOLL_EVT_VALID_MASK) == RTPOLL_EVT_READ);
1689
1690 /* We got interrupted, drain the pipe. */
1691 rc = RTPipeRead(pSockInt->hPipeR, abBuf, sizeof(abBuf), &cbRead);
1692 AssertRC(rc);
1693
1694 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1695
1696 rc = VERR_INTERRUPTED;
1697 }
1698 }
1699
1700 return rc;
1701}
1702
1703/** @interface_method_impl{VDINTERFACETCPNET,pfnSelectOneEx} */
1704static DECLCALLBACK(int) drvvdTcpSelectOneExNoPoll(VDSOCKET hVdSock, uint32_t fEvents, uint32_t *pfEvents, RTMSINTERVAL cMillies)
1705{
1706 RT_NOREF(cMillies); /** @todo timeouts */
1707 int rc = VINF_SUCCESS;
1708 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1709
1710 *pfEvents = 0;
1711
1712 ASMAtomicXchgBool(&pSockInt->fWaiting, true);
1713 if (ASMAtomicXchgBool(&pSockInt->fWokenUp, false))
1714 {
1715 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1716 return VERR_INTERRUPTED;
1717 }
1718
1719 if ( pSockInt->hSocket == NIL_RTSOCKET
1720 || !fEvents)
1721 {
1722 /*
1723 * Only the pipe is configured or the caller doesn't wait for a socket event,
1724 * wait until there is something to read from the pipe.
1725 */
1726 size_t cbRead = 0;
1727 char ch = 0;
1728 rc = RTPipeReadBlocking(pSockInt->hPipeR, &ch, 1, &cbRead);
1729 if (RT_SUCCESS(rc))
1730 {
1731 Assert(cbRead == 1);
1732 rc = VERR_INTERRUPTED;
1733 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1734 }
1735 }
1736 else
1737 {
1738 uint32_t fSelectEvents = 0;
1739
1740 if (fEvents & VD_INTERFACETCPNET_EVT_READ)
1741 fSelectEvents |= RTSOCKET_EVT_READ;
1742 if (fEvents & VD_INTERFACETCPNET_EVT_WRITE)
1743 fSelectEvents |= RTSOCKET_EVT_WRITE;
1744 if (fEvents & VD_INTERFACETCPNET_EVT_ERROR)
1745 fSelectEvents |= RTSOCKET_EVT_ERROR;
1746
1747 if (fEvents & VD_INTERFACETCPNET_HINT_INTERRUPT)
1748 {
1749 uint32_t fEventsRecv = 0;
1750
1751 /* Make sure the socket is not in the pollset. */
1752 rc = RTPollSetRemove(pSockInt->hPollSet, VDSOCKET_POLL_ID_SOCKET);
1753 Assert(RT_SUCCESS(rc) || rc == VERR_POLL_HANDLE_ID_NOT_FOUND);
1754
1755 for (;;)
1756 {
1757 uint32_t id = 0;
1758 rc = RTPoll(pSockInt->hPollSet, 5, &fEvents, &id);
1759 if (rc == VERR_TIMEOUT)
1760 {
1761 /* Check the socket. */
1762 rc = RTTcpSelectOneEx(pSockInt->hSocket, fSelectEvents, &fEventsRecv, 0);
1763 if (RT_SUCCESS(rc))
1764 {
1765 if (fEventsRecv & RTSOCKET_EVT_READ)
1766 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1767 if (fEventsRecv & RTSOCKET_EVT_WRITE)
1768 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1769 if (fEventsRecv & RTSOCKET_EVT_ERROR)
1770 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1771 break; /* Quit */
1772 }
1773 else if (rc != VERR_TIMEOUT)
1774 break;
1775 }
1776 else if (RT_SUCCESS(rc))
1777 {
1778 size_t cbRead = 0;
1779 uint8_t abBuf[10];
1780 Assert(id == VDSOCKET_POLL_ID_PIPE);
1781 Assert((fEventsRecv & RTPOLL_EVT_VALID_MASK) == RTPOLL_EVT_READ);
1782
1783 /* We got interrupted, drain the pipe. */
1784 rc = RTPipeRead(pSockInt->hPipeR, abBuf, sizeof(abBuf), &cbRead);
1785 AssertRC(rc);
1786
1787 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1788
1789 rc = VERR_INTERRUPTED;
1790 break;
1791 }
1792 else
1793 break;
1794 }
1795 }
1796 else /* The caller waits for a socket event. */
1797 {
1798 uint32_t fEventsRecv = 0;
1799
1800 /* Loop until we got woken up or a socket event occurred. */
1801 for (;;)
1802 {
1803 /** @todo find an adaptive wait algorithm based on the
1804 * number of wakeups in the past. */
1805 rc = RTTcpSelectOneEx(pSockInt->hSocket, fSelectEvents, &fEventsRecv, 5);
1806 if (rc == VERR_TIMEOUT)
1807 {
1808 /* Check if there is an event pending. */
1809 size_t cbRead = 0;
1810 char ch = 0;
1811 rc = RTPipeRead(pSockInt->hPipeR, &ch, 1, &cbRead);
1812 if (RT_SUCCESS(rc) && rc != VINF_TRY_AGAIN)
1813 {
1814 Assert(cbRead == 1);
1815 rc = VERR_INTERRUPTED;
1816 ASMAtomicXchgBool(&pSockInt->fWokenUp, false);
1817 break; /* Quit */
1818 }
1819 else
1820 Assert(rc == VINF_TRY_AGAIN);
1821 }
1822 else if (RT_SUCCESS(rc))
1823 {
1824 if (fEventsRecv & RTSOCKET_EVT_READ)
1825 *pfEvents |= VD_INTERFACETCPNET_EVT_READ;
1826 if (fEventsRecv & RTSOCKET_EVT_WRITE)
1827 *pfEvents |= VD_INTERFACETCPNET_EVT_WRITE;
1828 if (fEventsRecv & RTSOCKET_EVT_ERROR)
1829 *pfEvents |= VD_INTERFACETCPNET_EVT_ERROR;
1830 break; /* Quit */
1831 }
1832 else
1833 break;
1834 }
1835 }
1836 }
1837
1838 ASMAtomicXchgBool(&pSockInt->fWaiting, false);
1839
1840 return rc;
1841}
1842
1843/** @interface_method_impl{VDINTERFACETCPNET,pfnPoke} */
1844static DECLCALLBACK(int) drvvdTcpPoke(VDSOCKET hVdSock)
1845{
1846 int rc = VINF_SUCCESS;
1847 size_t cbWritten = 0;
1848 PVDSOCKETINT pSockInt = (PVDSOCKETINT)hVdSock;
1849
1850 ASMAtomicXchgBool(&pSockInt->fWokenUp, true);
1851
1852 if (ASMAtomicReadBool(&pSockInt->fWaiting))
1853 {
1854 rc = RTPipeWrite(pSockInt->hPipeW, "", 1, &cbWritten);
1855 Assert(RT_SUCCESS(rc) || cbWritten == 0);
1856 }
1857
1858 return VINF_SUCCESS;
1859}
1860
1861/**
1862 * Checks the prerequisites for encrypted I/O.
1863 *
1864 * @returns VBox status code.
1865 * @param pThis The VD driver instance data.
1866 * @param fSetError Flag whether to set a runtime error.
1867 */
1868static int drvvdKeyCheckPrereqs(PVBOXDISK pThis, bool fSetError)
1869{
1870 if ( pThis->pCfgCrypto
1871 && !pThis->pIfSecKey)
1872 {
1873 AssertPtr(pThis->pIfSecKeyHlp);
1874 pThis->pIfSecKeyHlp->pfnKeyMissingNotify(pThis->pIfSecKeyHlp);
1875
1876 if (fSetError)
1877 {
1878 int rc = PDMDrvHlpVMSetRuntimeError(pThis->pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DEKMISSING",
1879 N_("VD: The DEK for this disk is missing"));
1880 AssertRC(rc);
1881 }
1882 return VERR_VD_DEK_MISSING;
1883 }
1884
1885 return VINF_SUCCESS;
1886}
1887
1888
1889/*********************************************************************************************************************************
1890* Media interface methods *
1891*********************************************************************************************************************************/
1892
1893/** @interface_method_impl{PDMIMEDIA,pfnRead} */
1894static DECLCALLBACK(int) drvvdRead(PPDMIMEDIA pInterface,
1895 uint64_t off, void *pvBuf, size_t cbRead)
1896{
1897 int rc = VINF_SUCCESS;
1898
1899 LogFlowFunc(("off=%#llx pvBuf=%p cbRead=%d\n", off, pvBuf, cbRead));
1900 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
1901
1902 /*
1903 * Check the state.
1904 */
1905 if (!pThis->pDisk)
1906 {
1907 AssertMsgFailed(("Invalid state! Not mounted!\n"));
1908 return VERR_PDM_MEDIA_NOT_MOUNTED;
1909 }
1910
1911 rc = drvvdKeyCheckPrereqs(pThis, true /* fSetError */);
1912 if (RT_FAILURE(rc))
1913 return rc;
1914
1915 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
1916 STAM_REL_COUNTER_INC(&pThis->StatReqsRead);
1917
1918 if (!pThis->fBootAccelActive)
1919 rc = VDRead(pThis->pDisk, off, pvBuf, cbRead);
1920 else
1921 {
1922 /* Can we serve the request from the buffer? */
1923 if ( off >= pThis->offDisk
1924 && off - pThis->offDisk < pThis->cbDataValid)
1925 {
1926 size_t cbToCopy = RT_MIN(cbRead, pThis->offDisk + pThis->cbDataValid - off);
1927
1928 memcpy(pvBuf, pThis->pbData + (off - pThis->offDisk), cbToCopy);
1929 cbRead -= cbToCopy;
1930 off += cbToCopy;
1931 pvBuf = (char *)pvBuf + cbToCopy;
1932 }
1933
1934 if ( cbRead > 0
1935 && cbRead < pThis->cbBootAccelBuffer)
1936 {
1937 /* Increase request to the buffer size and read. */
1938 pThis->cbDataValid = RT_MIN(pThis->cbDisk - off, pThis->cbBootAccelBuffer);
1939 pThis->offDisk = off;
1940 rc = VDRead(pThis->pDisk, off, pThis->pbData, pThis->cbDataValid);
1941 if (RT_FAILURE(rc))
1942 pThis->cbDataValid = 0;
1943 else
1944 memcpy(pvBuf, pThis->pbData, cbRead);
1945 }
1946 else if (cbRead >= pThis->cbBootAccelBuffer)
1947 {
1948 pThis->fBootAccelActive = false; /* Deactiviate */
1949 }
1950 }
1951
1952 if (RT_SUCCESS(rc))
1953 {
1954 STAM_REL_COUNTER_INC(&pThis->StatReqsSucceeded);
1955 STAM_REL_COUNTER_ADD(&pThis->StatBytesRead, cbRead);
1956 Log2(("%s: off=%#llx pvBuf=%p cbRead=%d\n%.*Rhxd\n", __FUNCTION__,
1957 off, pvBuf, cbRead, cbRead, pvBuf));
1958 }
1959 else
1960 STAM_REL_COUNTER_INC(&pThis->StatReqsFailed);
1961
1962 LogFlowFunc(("returns %Rrc\n", rc));
1963 return rc;
1964}
1965
1966/** @interface_method_impl{PDMIMEDIA,pfnRead} */
1967static DECLCALLBACK(int) drvvdReadPcBios(PPDMIMEDIA pInterface,
1968 uint64_t off, void *pvBuf, size_t cbRead)
1969{
1970 int rc = VINF_SUCCESS;
1971
1972 LogFlowFunc(("off=%#llx pvBuf=%p cbRead=%d\n", off, pvBuf, cbRead));
1973 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
1974
1975 /*
1976 * Check the state.
1977 */
1978 if (!pThis->pDisk)
1979 {
1980 AssertMsgFailed(("Invalid state! Not mounted!\n"));
1981 return VERR_PDM_MEDIA_NOT_MOUNTED;
1982 }
1983
1984 if ( pThis->pCfgCrypto
1985 && !pThis->pIfSecKey)
1986 return VERR_VD_DEK_MISSING;
1987
1988 if (!pThis->fBootAccelActive)
1989 rc = VDRead(pThis->pDisk, off, pvBuf, cbRead);
1990 else
1991 {
1992 /* Can we serve the request from the buffer? */
1993 if ( off >= pThis->offDisk
1994 && off - pThis->offDisk < pThis->cbDataValid)
1995 {
1996 size_t cbToCopy = RT_MIN(cbRead, pThis->offDisk + pThis->cbDataValid - off);
1997
1998 memcpy(pvBuf, pThis->pbData + (off - pThis->offDisk), cbToCopy);
1999 cbRead -= cbToCopy;
2000 off += cbToCopy;
2001 pvBuf = (char *)pvBuf + cbToCopy;
2002 }
2003
2004 if ( cbRead > 0
2005 && cbRead < pThis->cbBootAccelBuffer)
2006 {
2007 /* Increase request to the buffer size and read. */
2008 pThis->cbDataValid = RT_MIN(pThis->cbDisk - off, pThis->cbBootAccelBuffer);
2009 pThis->offDisk = off;
2010 rc = VDRead(pThis->pDisk, off, pThis->pbData, pThis->cbDataValid);
2011 if (RT_FAILURE(rc))
2012 pThis->cbDataValid = 0;
2013 else
2014 memcpy(pvBuf, pThis->pbData, cbRead);
2015 }
2016 else if (cbRead >= pThis->cbBootAccelBuffer)
2017 {
2018 pThis->fBootAccelActive = false; /* Deactiviate */
2019 }
2020 }
2021
2022 if (RT_SUCCESS(rc))
2023 Log2(("%s: off=%#llx pvBuf=%p cbRead=%d\n%.*Rhxd\n", __FUNCTION__,
2024 off, pvBuf, cbRead, cbRead, pvBuf));
2025 LogFlowFunc(("returns %Rrc\n", rc));
2026 return rc;
2027}
2028
2029
2030/** @interface_method_impl{PDMIMEDIA,pfnWrite} */
2031static DECLCALLBACK(int) drvvdWrite(PPDMIMEDIA pInterface,
2032 uint64_t off, const void *pvBuf,
2033 size_t cbWrite)
2034{
2035 LogFlowFunc(("off=%#llx pvBuf=%p cbWrite=%d\n", off, pvBuf, cbWrite));
2036 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2037 Log2(("%s: off=%#llx pvBuf=%p cbWrite=%d\n%.*Rhxd\n", __FUNCTION__,
2038 off, pvBuf, cbWrite, cbWrite, pvBuf));
2039
2040 /*
2041 * Check the state.
2042 */
2043 if (!pThis->pDisk)
2044 {
2045 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2046 return VERR_PDM_MEDIA_NOT_MOUNTED;
2047 }
2048
2049 /* Set an FTM checkpoint as this operation changes the state permanently. */
2050 PDMDrvHlpFTSetCheckpoint(pThis->pDrvIns, FTMCHECKPOINTTYPE_STORAGE);
2051
2052 int rc = drvvdKeyCheckPrereqs(pThis, true /* fSetError */);
2053 if (RT_FAILURE(rc))
2054 return rc;
2055
2056 /* Invalidate any buffer if boot acceleration is enabled. */
2057 if (pThis->fBootAccelActive)
2058 {
2059 pThis->cbDataValid = 0;
2060 pThis->offDisk = 0;
2061 }
2062
2063 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
2064 STAM_REL_COUNTER_INC(&pThis->StatReqsWrite);
2065
2066 rc = VDWrite(pThis->pDisk, off, pvBuf, cbWrite);
2067#ifdef VBOX_PERIODIC_FLUSH
2068 if (pThis->cbFlushInterval)
2069 {
2070 pThis->cbDataWritten += (uint32_t)cbWrite;
2071 if (pThis->cbDataWritten > pThis->cbFlushInterval)
2072 {
2073 pThis->cbDataWritten = 0;
2074 VDFlush(pThis->pDisk);
2075 }
2076 }
2077#endif /* VBOX_PERIODIC_FLUSH */
2078
2079 if (RT_SUCCESS(rc))
2080 {
2081 STAM_REL_COUNTER_INC(&pThis->StatReqsSucceeded);
2082 STAM_REL_COUNTER_ADD(&pThis->StatBytesWritten, cbWrite);
2083 }
2084 else
2085 STAM_REL_COUNTER_INC(&pThis->StatReqsFailed);
2086
2087 LogFlowFunc(("returns %Rrc\n", rc));
2088 return rc;
2089}
2090
2091/** @interface_method_impl{PDMIMEDIA,pfnFlush} */
2092static DECLCALLBACK(int) drvvdFlush(PPDMIMEDIA pInterface)
2093{
2094 LogFlowFunc(("\n"));
2095 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2096
2097 /*
2098 * Check the state.
2099 */
2100 if (!pThis->pDisk)
2101 {
2102 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2103 return VERR_PDM_MEDIA_NOT_MOUNTED;
2104 }
2105
2106#ifdef VBOX_IGNORE_FLUSH
2107 if (pThis->fIgnoreFlush)
2108 return VINF_SUCCESS;
2109#endif /* VBOX_IGNORE_FLUSH */
2110
2111 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
2112 STAM_REL_COUNTER_INC(&pThis->StatReqsFlush);
2113
2114 int rc = VDFlush(pThis->pDisk);
2115 if (RT_SUCCESS(rc))
2116 STAM_REL_COUNTER_INC(&pThis->StatReqsSucceeded);
2117 else
2118 STAM_REL_COUNTER_INC(&pThis->StatReqsFailed);
2119
2120 LogFlowFunc(("returns %Rrc\n", rc));
2121 return rc;
2122}
2123
2124/** @interface_method_impl{PDMIMEDIA,pfnMerge} */
2125static DECLCALLBACK(int) drvvdMerge(PPDMIMEDIA pInterface,
2126 PFNSIMPLEPROGRESS pfnProgress,
2127 void *pvUser)
2128{
2129 LogFlowFunc(("\n"));
2130 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2131 int rc = VINF_SUCCESS;
2132
2133 /*
2134 * Check the state.
2135 */
2136 if (!pThis->pDisk)
2137 {
2138 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2139 return VERR_PDM_MEDIA_NOT_MOUNTED;
2140 }
2141
2142 /* Note: There is an unavoidable race between destruction and another
2143 * thread invoking this function. This is handled safely and gracefully by
2144 * atomically invalidating the lock handle in drvvdDestruct. */
2145 int rc2 = RTSemFastMutexRequest(pThis->MergeCompleteMutex);
2146 AssertRC(rc2);
2147 if (RT_SUCCESS(rc2) && pThis->fMergePending)
2148 {
2149 /* Take shortcut: PFNSIMPLEPROGRESS is exactly the same type as
2150 * PFNVDPROGRESS, so there's no need for a conversion function. */
2151 /** @todo maybe introduce a conversion which limits update frequency. */
2152 PVDINTERFACE pVDIfsOperation = NULL;
2153 VDINTERFACEPROGRESS VDIfProgress;
2154 VDIfProgress.pfnProgress = pfnProgress;
2155 rc2 = VDInterfaceAdd(&VDIfProgress.Core, "DrvVD_VDIProgress", VDINTERFACETYPE_PROGRESS,
2156 pvUser, sizeof(VDINTERFACEPROGRESS), &pVDIfsOperation);
2157 AssertRC(rc2);
2158 pThis->fMergePending = false;
2159 rc = VDMerge(pThis->pDisk, pThis->uMergeSource,
2160 pThis->uMergeTarget, pVDIfsOperation);
2161 }
2162 rc2 = RTSemFastMutexRelease(pThis->MergeCompleteMutex);
2163 AssertRC(rc2);
2164 LogFlowFunc(("returns %Rrc\n", rc));
2165 return rc;
2166}
2167
2168/** @interface_method_impl{PDMIMEDIA,pfnSetSecKeyIf} */
2169static DECLCALLBACK(int) drvvdSetSecKeyIf(PPDMIMEDIA pInterface, PPDMISECKEY pIfSecKey, PPDMISECKEYHLP pIfSecKeyHlp)
2170{
2171 LogFlowFunc(("\n"));
2172 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2173 int rc = VINF_SUCCESS;
2174
2175 if (pThis->pCfgCrypto)
2176 {
2177 PVDINTERFACE pVDIfFilter = NULL;
2178
2179 pThis->pIfSecKeyHlp = pIfSecKeyHlp;
2180
2181 if ( pThis->pIfSecKey
2182 && !pIfSecKey)
2183 {
2184 /* Unload the crypto filter first to make sure it doesn't access the keys anymore. */
2185 rc = VDFilterRemove(pThis->pDisk, VD_FILTER_FLAGS_DEFAULT);
2186 AssertRC(rc);
2187
2188 pThis->pIfSecKey = NULL;
2189 }
2190
2191 if ( pIfSecKey
2192 && RT_SUCCESS(rc))
2193 {
2194 pThis->pIfSecKey = pIfSecKey;
2195
2196 rc = VDInterfaceAdd(&pThis->VDIfCfg.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
2197 pThis->pCfgCrypto, sizeof(VDINTERFACECONFIG), &pVDIfFilter);
2198 AssertRC(rc);
2199
2200 rc = VDInterfaceAdd(&pThis->VDIfCrypto.Core, "DrvVD_Crypto", VDINTERFACETYPE_CRYPTO,
2201 pThis, sizeof(VDINTERFACECRYPTO), &pVDIfFilter);
2202 AssertRC(rc);
2203
2204 /* Load the crypt filter plugin. */
2205 rc = VDFilterAdd(pThis->pDisk, "CRYPT", VD_FILTER_FLAGS_DEFAULT, pVDIfFilter);
2206 if (RT_FAILURE(rc))
2207 pThis->pIfSecKey = NULL;
2208 }
2209 }
2210 else
2211 rc = VERR_NOT_SUPPORTED;
2212
2213 LogFlowFunc(("returns %Rrc\n", rc));
2214 return rc;
2215}
2216
2217/** @interface_method_impl{PDMIMEDIA,pfnGetSize} */
2218static DECLCALLBACK(uint64_t) drvvdGetSize(PPDMIMEDIA pInterface)
2219{
2220 LogFlowFunc(("\n"));
2221 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2222
2223 /*
2224 * Check the state.
2225 */
2226 if (!pThis->pDisk)
2227 return 0;
2228
2229 uint64_t cb = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
2230 LogFlowFunc(("returns %#llx (%llu)\n", cb, cb));
2231 return cb;
2232}
2233
2234/** @interface_method_impl{PDMIMEDIA,pfnGetSectorSize} */
2235static DECLCALLBACK(uint32_t) drvvdGetSectorSize(PPDMIMEDIA pInterface)
2236{
2237 LogFlowFunc(("\n"));
2238 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2239
2240 /*
2241 * Check the state.
2242 */
2243 if (!pThis->pDisk)
2244 return 0;
2245
2246 uint32_t cb = VDGetSectorSize(pThis->pDisk, VD_LAST_IMAGE);
2247 LogFlowFunc(("returns %u\n", cb));
2248 return cb;
2249}
2250
2251/** @interface_method_impl{PDMIMEDIA,pfnIsReadOnly} */
2252static DECLCALLBACK(bool) drvvdIsReadOnly(PPDMIMEDIA pInterface)
2253{
2254 LogFlowFunc(("\n"));
2255 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2256
2257 /*
2258 * Check the state.
2259 */
2260 if (!pThis->pDisk)
2261 return false;
2262
2263 bool f = VDIsReadOnly(pThis->pDisk);
2264 LogFlowFunc(("returns %d\n", f));
2265 return f;
2266}
2267
2268/** @interface_method_impl{PDMIMEDIA,pfnIsNonRotational} */
2269static DECLCALLBACK(bool) drvvdIsNonRotational(PPDMIMEDIA pInterface)
2270{
2271 LogFlowFunc(("\n"));
2272 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2273
2274 return pThis->fNonRotational;
2275}
2276
2277/** @interface_method_impl{PDMIMEDIA,pfnBiosGetPCHSGeometry} */
2278static DECLCALLBACK(int) drvvdBiosGetPCHSGeometry(PPDMIMEDIA pInterface,
2279 PPDMMEDIAGEOMETRY pPCHSGeometry)
2280{
2281 LogFlowFunc(("\n"));
2282 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2283 VDGEOMETRY geo;
2284
2285 /*
2286 * Check the state.
2287 */
2288 if (!pThis->pDisk)
2289 return VERR_PDM_MEDIA_NOT_MOUNTED;
2290
2291 /*
2292 * Use configured/cached values if present.
2293 */
2294 if ( pThis->PCHSGeometry.cCylinders > 0
2295 && pThis->PCHSGeometry.cHeads > 0
2296 && pThis->PCHSGeometry.cSectors > 0)
2297 {
2298 *pPCHSGeometry = pThis->PCHSGeometry;
2299 LogFlow(("%s: returns VINF_SUCCESS {%d,%d,%d}\n", __FUNCTION__, pThis->PCHSGeometry.cCylinders, pThis->PCHSGeometry.cHeads, pThis->PCHSGeometry.cSectors));
2300 return VINF_SUCCESS;
2301 }
2302
2303 int rc = VDGetPCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2304 if (RT_SUCCESS(rc))
2305 {
2306 pPCHSGeometry->cCylinders = geo.cCylinders;
2307 pPCHSGeometry->cHeads = geo.cHeads;
2308 pPCHSGeometry->cSectors = geo.cSectors;
2309 pThis->PCHSGeometry = *pPCHSGeometry;
2310 }
2311 else
2312 {
2313 LogFunc(("geometry not available.\n"));
2314 rc = VERR_PDM_GEOMETRY_NOT_SET;
2315 }
2316 LogFlowFunc(("returns %Rrc (CHS=%d/%d/%d)\n",
2317 rc, pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
2318 return rc;
2319}
2320
2321/** @interface_method_impl{PDMIMEDIA,pfnBiosSetPCHSGeometry} */
2322static DECLCALLBACK(int) drvvdBiosSetPCHSGeometry(PPDMIMEDIA pInterface,
2323 PCPDMMEDIAGEOMETRY pPCHSGeometry)
2324{
2325 LogFlowFunc(("CHS=%d/%d/%d\n",
2326 pPCHSGeometry->cCylinders, pPCHSGeometry->cHeads, pPCHSGeometry->cSectors));
2327 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2328 VDGEOMETRY geo;
2329
2330 /*
2331 * Check the state.
2332 */
2333 if (!pThis->pDisk)
2334 {
2335 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2336 return VERR_PDM_MEDIA_NOT_MOUNTED;
2337 }
2338
2339 geo.cCylinders = pPCHSGeometry->cCylinders;
2340 geo.cHeads = pPCHSGeometry->cHeads;
2341 geo.cSectors = pPCHSGeometry->cSectors;
2342 int rc = VDSetPCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2343 if (rc == VERR_VD_GEOMETRY_NOT_SET)
2344 rc = VERR_PDM_GEOMETRY_NOT_SET;
2345 if (RT_SUCCESS(rc))
2346 pThis->PCHSGeometry = *pPCHSGeometry;
2347 LogFlowFunc(("returns %Rrc\n", rc));
2348 return rc;
2349}
2350
2351/** @interface_method_impl{PDMIMEDIA,pfnBiosGetLCHSGeometry} */
2352static DECLCALLBACK(int) drvvdBiosGetLCHSGeometry(PPDMIMEDIA pInterface,
2353 PPDMMEDIAGEOMETRY pLCHSGeometry)
2354{
2355 LogFlowFunc(("\n"));
2356 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2357 VDGEOMETRY geo;
2358
2359 /*
2360 * Check the state.
2361 */
2362 if (!pThis->pDisk)
2363 return VERR_PDM_MEDIA_NOT_MOUNTED;
2364
2365 /*
2366 * Use configured/cached values if present.
2367 */
2368 if ( pThis->LCHSGeometry.cCylinders > 0
2369 && pThis->LCHSGeometry.cHeads > 0
2370 && pThis->LCHSGeometry.cSectors > 0)
2371 {
2372 *pLCHSGeometry = pThis->LCHSGeometry;
2373 LogFlow(("%s: returns VINF_SUCCESS {%d,%d,%d}\n", __FUNCTION__, pThis->LCHSGeometry.cCylinders, pThis->LCHSGeometry.cHeads, pThis->LCHSGeometry.cSectors));
2374 return VINF_SUCCESS;
2375 }
2376
2377 int rc = VDGetLCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2378 if (RT_SUCCESS(rc))
2379 {
2380 pLCHSGeometry->cCylinders = geo.cCylinders;
2381 pLCHSGeometry->cHeads = geo.cHeads;
2382 pLCHSGeometry->cSectors = geo.cSectors;
2383 pThis->LCHSGeometry = *pLCHSGeometry;
2384 }
2385 else
2386 {
2387 LogFunc(("geometry not available.\n"));
2388 rc = VERR_PDM_GEOMETRY_NOT_SET;
2389 }
2390 LogFlowFunc(("returns %Rrc (CHS=%d/%d/%d)\n",
2391 rc, pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
2392 return rc;
2393}
2394
2395/** @interface_method_impl{PDMIMEDIA,pfnBiosSetLCHSGeometry} */
2396static DECLCALLBACK(int) drvvdBiosSetLCHSGeometry(PPDMIMEDIA pInterface,
2397 PCPDMMEDIAGEOMETRY pLCHSGeometry)
2398{
2399 LogFlowFunc(("CHS=%d/%d/%d\n",
2400 pLCHSGeometry->cCylinders, pLCHSGeometry->cHeads, pLCHSGeometry->cSectors));
2401 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2402 VDGEOMETRY geo;
2403
2404 /*
2405 * Check the state.
2406 */
2407 if (!pThis->pDisk)
2408 {
2409 AssertMsgFailed(("Invalid state! Not mounted!\n"));
2410 return VERR_PDM_MEDIA_NOT_MOUNTED;
2411 }
2412
2413 geo.cCylinders = pLCHSGeometry->cCylinders;
2414 geo.cHeads = pLCHSGeometry->cHeads;
2415 geo.cSectors = pLCHSGeometry->cSectors;
2416 int rc = VDSetLCHSGeometry(pThis->pDisk, VD_LAST_IMAGE, &geo);
2417 if (rc == VERR_VD_GEOMETRY_NOT_SET)
2418 rc = VERR_PDM_GEOMETRY_NOT_SET;
2419 if (RT_SUCCESS(rc))
2420 pThis->LCHSGeometry = *pLCHSGeometry;
2421 LogFlowFunc(("returns %Rrc\n", rc));
2422 return rc;
2423}
2424
2425/** @interface_method_impl{PDMIMEDIA,pfnBiosIsVisible} */
2426static DECLCALLBACK(bool) drvvdBiosIsVisible(PPDMIMEDIA pInterface)
2427{
2428 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2429 LogFlow(("drvvdBiosIsVisible: returns %d\n", pThis->fBiosVisible));
2430 return pThis->fBiosVisible;
2431}
2432
2433/** @interface_method_impl{PDMIMEDIA,pfnGetType} */
2434static DECLCALLBACK(PDMMEDIATYPE) drvvdGetType(PPDMIMEDIA pInterface)
2435{
2436 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2437 LogFlow(("drvvdBiosIsVisible: returns %d\n", pThis->fBiosVisible));
2438 return pThis->enmType;
2439}
2440
2441/** @interface_method_impl{PDMIMEDIA,pfnGetUuid} */
2442static DECLCALLBACK(int) drvvdGetUuid(PPDMIMEDIA pInterface, PRTUUID pUuid)
2443{
2444 LogFlowFunc(("\n"));
2445 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2446
2447 /*
2448 * Copy the uuid.
2449 */
2450 *pUuid = pThis->Uuid;
2451 LogFlowFunc(("returns {%RTuuid}\n", pUuid));
2452 return VINF_SUCCESS;
2453}
2454
2455/** @interface_method_impl{PDMIMEDIA,pfnDiscard} */
2456static DECLCALLBACK(int) drvvdDiscard(PPDMIMEDIA pInterface, PCRTRANGE paRanges, unsigned cRanges)
2457{
2458 LogFlowFunc(("\n"));
2459 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2460
2461 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
2462 STAM_REL_COUNTER_INC(&pThis->StatReqsDiscard);
2463
2464 int rc = VDDiscardRanges(pThis->pDisk, paRanges, cRanges);
2465 if (RT_SUCCESS(rc))
2466 STAM_REL_COUNTER_INC(&pThis->StatReqsSucceeded);
2467 else
2468 STAM_REL_COUNTER_INC(&pThis->StatReqsFailed);
2469
2470 LogFlowFunc(("returns %Rrc\n", rc));
2471 return rc;
2472}
2473
2474/** @interface_method_impl{PDMIMEDIA,pfnGetRegionCount} */
2475static DECLCALLBACK(uint32_t) drvvdGetRegionCount(PPDMIMEDIA pInterface)
2476{
2477 LogFlowFunc(("\n"));
2478 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2479 uint32_t cRegions = 0;
2480
2481 if (pThis->pDisk)
2482 {
2483 if (!pThis->pRegionList)
2484 {
2485 int rc = VDQueryRegions(pThis->pDisk, VD_LAST_IMAGE, VD_REGION_LIST_F_LOC_SIZE_BLOCKS,
2486 &pThis->pRegionList);
2487 if (RT_SUCCESS(rc))
2488 cRegions = pThis->pRegionList->cRegions;
2489 }
2490 else
2491 cRegions = pThis->pRegionList->cRegions;
2492 }
2493
2494 LogFlowFunc(("returns %u\n", cRegions));
2495 return cRegions;
2496}
2497
2498/** @interface_method_impl{PDMIMEDIA,pfnQueryRegionProperties} */
2499static DECLCALLBACK(int) drvvdQueryRegionProperties(PPDMIMEDIA pInterface, uint32_t uRegion, uint64_t *pu64LbaStart,
2500 uint64_t *pcBlocks, uint64_t *pcbBlock,
2501 PVDREGIONDATAFORM penmDataForm)
2502{
2503 LogFlowFunc(("\n"));
2504 int rc = VINF_SUCCESS;
2505 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2506
2507 if ( pThis->pRegionList
2508 && uRegion < pThis->pRegionList->cRegions)
2509 {
2510 PCVDREGIONDESC pRegion = &pThis->pRegionList->aRegions[uRegion];
2511
2512 if (pu64LbaStart)
2513 *pu64LbaStart = pRegion->offRegion;
2514 if (pcBlocks)
2515 *pcBlocks = pRegion->cRegionBlocksOrBytes;
2516 if (pcbBlock)
2517 *pcbBlock = pRegion->cbBlock;
2518 if (penmDataForm)
2519 *penmDataForm = pRegion->enmDataForm;
2520 }
2521 else
2522 rc = VERR_NOT_FOUND;
2523
2524 LogFlowFunc(("returns %Rrc\n", rc));
2525 return rc;
2526}
2527
2528/** @interface_method_impl{PDMIMEDIA,pfnQueryRegionPropertiesForLba} */
2529static DECLCALLBACK(int) drvvdQueryRegionPropertiesForLba(PPDMIMEDIA pInterface, uint64_t u64LbaStart,
2530 uint32_t *puRegion, uint64_t *pcBlocks,
2531 uint64_t *pcbBlock, PVDREGIONDATAFORM penmDataForm)
2532{
2533 LogFlowFunc(("\n"));
2534 int rc = VINF_SUCCESS;
2535 PVBOXDISK pThis = PDMIMEDIA_2_VBOXDISK(pInterface);
2536
2537 if (!pThis->pRegionList)
2538 rc = VDQueryRegions(pThis->pDisk, VD_LAST_IMAGE, VD_REGION_LIST_F_LOC_SIZE_BLOCKS,
2539 &pThis->pRegionList);
2540
2541 if (RT_SUCCESS(rc))
2542 {
2543 rc = VERR_NOT_FOUND;
2544
2545 for (uint32_t i = 0; i < pThis->pRegionList->cRegions; i++)
2546 {
2547 PCVDREGIONDESC pRegion = &pThis->pRegionList->aRegions[i];
2548 if ( pRegion->offRegion <= u64LbaStart
2549 && pRegion->offRegion + pRegion->cRegionBlocksOrBytes > u64LbaStart)
2550 {
2551 uint64_t offRegion = u64LbaStart - pRegion->offRegion;
2552
2553 if (puRegion)
2554 *puRegion = i;
2555 if (pcBlocks)
2556 *pcBlocks = pRegion->cRegionBlocksOrBytes - offRegion;
2557 if (pcbBlock)
2558 *pcbBlock = pRegion->cbBlock;
2559 if (penmDataForm)
2560 *penmDataForm = pRegion->enmDataForm;
2561
2562 rc = VINF_SUCCESS;
2563 }
2564 }
2565 }
2566 else
2567 rc = VERR_NOT_FOUND;
2568
2569 LogFlowFunc(("returns %Rrc\n", rc));
2570 return rc;
2571}
2572
2573/* -=-=-=-=- IMount -=-=-=-=- */
2574
2575/** @interface_method_impl{PDMIMOUNT,pfnUnmount} */
2576static DECLCALLBACK(int) drvvdUnmount(PPDMIMOUNT pInterface, bool fForce, bool fEject)
2577{
2578 RT_NOREF(fEject);
2579 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2580
2581 /*
2582 * Validate state.
2583 */
2584 if (!pThis->pDisk)
2585 {
2586 Log(("drvvdUnmount: Not mounted\n"));
2587 return VERR_PDM_MEDIA_NOT_MOUNTED;
2588 }
2589 if (pThis->fLocked && !fForce)
2590 {
2591 Log(("drvvdUnmount: Locked\n"));
2592 return VERR_PDM_MEDIA_LOCKED;
2593 }
2594
2595 /* Media is no longer locked even if it was previously. */
2596 pThis->fLocked = false;
2597 drvvdPowerOffOrDestructOrUnmount(pThis->pDrvIns);
2598
2599 /*
2600 * Notify driver/device above us.
2601 */
2602 if (pThis->pDrvMountNotify)
2603 pThis->pDrvMountNotify->pfnUnmountNotify(pThis->pDrvMountNotify);
2604 Log(("drvblockUnmount: success\n"));
2605 return VINF_SUCCESS;
2606}
2607
2608
2609/** @interface_method_impl{PDMIMOUNT,pfnIsMounted} */
2610static DECLCALLBACK(bool) drvvdIsMounted(PPDMIMOUNT pInterface)
2611{
2612 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2613 return pThis->pDisk != NULL;
2614}
2615
2616/** @interface_method_impl{PDMIMOUNT,pfnLock} */
2617static DECLCALLBACK(int) drvvdLock(PPDMIMOUNT pInterface)
2618{
2619 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2620 Log(("drvblockLock: %d -> %d\n", pThis->fLocked, true));
2621 pThis->fLocked = true;
2622 return VINF_SUCCESS;
2623}
2624
2625/** @interface_method_impl{PDMIMOUNT,pfnUnlock} */
2626static DECLCALLBACK(int) drvvdUnlock(PPDMIMOUNT pInterface)
2627{
2628 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2629 Log(("drvblockUnlock: %d -> %d\n", pThis->fLocked, false));
2630 pThis->fLocked = false;
2631 return VINF_SUCCESS;
2632}
2633
2634/** @interface_method_impl{PDMIMOUNT,pfnIsLocked} */
2635static DECLCALLBACK(bool) drvvdIsLocked(PPDMIMOUNT pInterface)
2636{
2637 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMount);
2638 return pThis->fLocked;
2639}
2640
2641
2642static DECLCALLBACK(void) drvvdBlkCacheReqComplete(void *pvUser1, void *pvUser2, int rcReq)
2643{
2644 PVBOXDISK pThis = (PVBOXDISK)pvUser1;
2645
2646 AssertPtr(pThis->pBlkCache);
2647 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, (PPDMBLKCACHEIOXFER)pvUser2, rcReq);
2648}
2649
2650
2651/** @copydoc FNPDMBLKCACHEXFERCOMPLETEDRV */
2652static DECLCALLBACK(void) drvvdBlkCacheXferCompleteIoReq(PPDMDRVINS pDrvIns, void *pvUser, int rc)
2653{
2654 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2655
2656 drvvdMediaExIoReqCompleteWorker(pThis, (PPDMMEDIAEXIOREQINT)pvUser, rc, true /* fUpNotify */);
2657}
2658
2659/** @copydoc FNPDMBLKCACHEXFERENQUEUEDRV */
2660static DECLCALLBACK(int) drvvdBlkCacheXferEnqueue(PPDMDRVINS pDrvIns,
2661 PDMBLKCACHEXFERDIR enmXferDir,
2662 uint64_t off, size_t cbXfer,
2663 PCRTSGBUF pSgBuf, PPDMBLKCACHEIOXFER hIoXfer)
2664{
2665 int rc = VINF_SUCCESS;
2666 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2667
2668 Assert (!pThis->pCfgCrypto);
2669
2670 switch (enmXferDir)
2671 {
2672 case PDMBLKCACHEXFERDIR_READ:
2673 rc = VDAsyncRead(pThis->pDisk, off, cbXfer, pSgBuf, drvvdBlkCacheReqComplete,
2674 pThis, hIoXfer);
2675 break;
2676 case PDMBLKCACHEXFERDIR_WRITE:
2677 rc = VDAsyncWrite(pThis->pDisk, off, cbXfer, pSgBuf, drvvdBlkCacheReqComplete,
2678 pThis, hIoXfer);
2679 break;
2680 case PDMBLKCACHEXFERDIR_FLUSH:
2681 rc = VDAsyncFlush(pThis->pDisk, drvvdBlkCacheReqComplete, pThis, hIoXfer);
2682 break;
2683 default:
2684 AssertMsgFailed(("Invalid transfer type %d\n", enmXferDir));
2685 rc = VERR_INVALID_PARAMETER;
2686 }
2687
2688 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2689 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, VINF_SUCCESS);
2690 else if (RT_FAILURE(rc) && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2691 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, rc);
2692
2693 return VINF_SUCCESS;
2694}
2695
2696/** @copydoc FNPDMBLKCACHEXFERENQUEUEDISCARDDRV */
2697static DECLCALLBACK(int) drvvdBlkCacheXferEnqueueDiscard(PPDMDRVINS pDrvIns, PCRTRANGE paRanges,
2698 unsigned cRanges, PPDMBLKCACHEIOXFER hIoXfer)
2699{
2700 int rc = VINF_SUCCESS;
2701 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
2702
2703 rc = VDAsyncDiscardRanges(pThis->pDisk, paRanges, cRanges,
2704 drvvdBlkCacheReqComplete, pThis, hIoXfer);
2705
2706 if (rc == VINF_VD_ASYNC_IO_FINISHED)
2707 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, VINF_SUCCESS);
2708 else if (RT_FAILURE(rc) && rc != VERR_VD_ASYNC_IO_IN_PROGRESS)
2709 PDMR3BlkCacheIoXferComplete(pThis->pBlkCache, hIoXfer, rc);
2710
2711 return VINF_SUCCESS;
2712}
2713
2714
2715/*********************************************************************************************************************************
2716* Extended media interface methods *
2717*********************************************************************************************************************************/
2718
2719static void drvvdMediaExIoReqWarningDiskFull(PPDMDRVINS pDrvIns)
2720{
2721 int rc;
2722 LogRel(("VD#%u: Host disk full\n", pDrvIns->iInstance));
2723 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DISKFULL",
2724 N_("Host system reported disk full. VM execution is suspended. You can resume after freeing some space"));
2725 AssertRC(rc);
2726}
2727
2728static void drvvdMediaExIoReqWarningFileTooBig(PPDMDRVINS pDrvIns)
2729{
2730 int rc;
2731 LogRel(("VD#%u: File too big\n", pDrvIns->iInstance));
2732 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_FILETOOBIG",
2733 N_("Host system reported that the file size limit of the host file system has been exceeded. VM execution is suspended. You need to move your virtual hard disk to a filesystem which allows bigger files"));
2734 AssertRC(rc);
2735}
2736
2737static void drvvdMediaExIoReqWarningISCSI(PPDMDRVINS pDrvIns)
2738{
2739 int rc;
2740 LogRel(("VD#%u: iSCSI target unavailable\n", pDrvIns->iInstance));
2741 rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_ISCSIDOWN",
2742 N_("The iSCSI target has stopped responding. VM execution is suspended. You can resume when it is available again"));
2743 AssertRC(rc);
2744}
2745
2746static void drvvdMediaExIoReqWarningDekMissing(PPDMDRVINS pDrvIns)
2747{
2748 LogRel(("VD#%u: DEK is missing\n", pDrvIns->iInstance));
2749 int rc = PDMDrvHlpVMSetRuntimeError(pDrvIns, VMSETRTERR_FLAGS_SUSPEND | VMSETRTERR_FLAGS_NO_WAIT, "DrvVD_DEKMISSING",
2750 N_("VD: The DEK for this disk is missing"));
2751 AssertRC(rc);
2752}
2753
2754/**
2755 * Checks whether a given status code indicates a recoverable error
2756 * suspending the VM if it is.
2757 *
2758 * @returns Flag indicating whether the status code is a recoverable error
2759 * (full disk, broken network connection).
2760 * @param pThis VBox disk container instance data.
2761 * @param rc Status code to check.
2762 */
2763bool drvvdMediaExIoReqIsRedoSetWarning(PVBOXDISK pThis, int rc)
2764{
2765 if (rc == VERR_DISK_FULL)
2766 {
2767 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2768 drvvdMediaExIoReqWarningDiskFull(pThis->pDrvIns);
2769 return true;
2770 }
2771 if (rc == VERR_FILE_TOO_BIG)
2772 {
2773 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2774 drvvdMediaExIoReqWarningFileTooBig(pThis->pDrvIns);
2775 return true;
2776 }
2777 if (rc == VERR_BROKEN_PIPE || rc == VERR_NET_CONNECTION_REFUSED)
2778 {
2779 /* iSCSI connection abort (first error) or failure to reestablish
2780 * connection (second error). Pause VM. On resume we'll retry. */
2781 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2782 drvvdMediaExIoReqWarningISCSI(pThis->pDrvIns);
2783 return true;
2784 }
2785 if (rc == VERR_VD_DEK_MISSING)
2786 {
2787 /* Error message already set. */
2788 if (ASMAtomicCmpXchgBool(&pThis->fRedo, true, false))
2789 drvvdMediaExIoReqWarningDekMissing(pThis->pDrvIns);
2790 return true;
2791 }
2792
2793 return false;
2794}
2795
2796/**
2797 * Syncs the memory buffers between the I/O request allocator and the internal buffer.
2798 *
2799 * @returns VBox status code.
2800 * @param pThis VBox disk container instance data.
2801 * @param pIoReq I/O request to sync.
2802 * @param fToIoBuf Flag indicating the sync direction.
2803 * true to copy data from the allocators buffer to our internal buffer.
2804 * false for the other direction.
2805 */
2806DECLINLINE(int) drvvdMediaExIoReqBufSync(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fToIoBuf)
2807{
2808 int rc = VINF_SUCCESS;
2809
2810 Assert(pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE);
2811 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
2812
2813 if (!pIoReq->ReadWrite.fDirectBuf)
2814 {
2815 /* Make sure the buffer is reset. */
2816 RTSgBufReset(&pIoReq->ReadWrite.IoBuf.SgBuf);
2817
2818 size_t const offSrc = pIoReq->ReadWrite.cbReq - pIoReq->ReadWrite.cbReqLeft;
2819 Assert((uint32_t)offSrc == offSrc);
2820 if (fToIoBuf)
2821 rc = pThis->pDrvMediaExPort->pfnIoReqCopyToBuf(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0], (uint32_t)offSrc,
2822 &pIoReq->ReadWrite.IoBuf.SgBuf,
2823 RT_MIN(pIoReq->ReadWrite.cbIoBuf, pIoReq->ReadWrite.cbReqLeft));
2824 else
2825 rc = pThis->pDrvMediaExPort->pfnIoReqCopyFromBuf(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0], (uint32_t)offSrc,
2826 &pIoReq->ReadWrite.IoBuf.SgBuf,
2827 (uint32_t)RT_MIN(pIoReq->ReadWrite.cbIoBuf, pIoReq->ReadWrite.cbReqLeft));
2828
2829 RTSgBufReset(&pIoReq->ReadWrite.IoBuf.SgBuf);
2830 }
2831 return rc;
2832}
2833
2834/**
2835 * Hashes the I/O request ID to an index for the allocated I/O request bin.
2836 */
2837DECLINLINE(unsigned) drvvdMediaExIoReqIdHash(PDMMEDIAEXIOREQID uIoReqId)
2838{
2839 return uIoReqId % DRVVD_VDIOREQ_ALLOC_BINS; /** @todo Find something better? */
2840}
2841
2842/**
2843 * Inserts the given I/O request in to the list of allocated I/O requests.
2844 *
2845 * @returns VBox status code.
2846 * @param pThis VBox disk container instance data.
2847 * @param pIoReq I/O request to insert.
2848 */
2849static int drvvdMediaExIoReqInsert(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
2850{
2851 int rc = VINF_SUCCESS;
2852 unsigned idxBin = drvvdMediaExIoReqIdHash(pIoReq->uIoReqId);
2853
2854 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2855 if (RT_SUCCESS(rc))
2856 {
2857 /* Search for conflicting I/O request ID. */
2858 PPDMMEDIAEXIOREQINT pIt;
2859 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
2860 {
2861 if (RT_UNLIKELY( pIt->uIoReqId == pIoReq->uIoReqId
2862 && pIt->enmState != VDIOREQSTATE_CANCELED))
2863 {
2864 rc = VERR_PDM_MEDIAEX_IOREQID_CONFLICT;
2865 break;
2866 }
2867 }
2868 if (RT_SUCCESS(rc))
2869 RTListAppend(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, &pIoReq->NdAllocatedList);
2870 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2871 }
2872
2873 return rc;
2874}
2875
2876/**
2877 * Removes the given I/O request from the list of allocated I/O requests.
2878 *
2879 * @returns VBox status code.
2880 * @param pThis VBox disk container instance data.
2881 * @param pIoReq I/O request to insert.
2882 */
2883static int drvvdMediaExIoReqRemove(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
2884{
2885 int rc = VINF_SUCCESS;
2886 unsigned idxBin = drvvdMediaExIoReqIdHash(pIoReq->uIoReqId);
2887
2888 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2889 if (RT_SUCCESS(rc))
2890 {
2891 RTListNodeRemove(&pIoReq->NdAllocatedList);
2892 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
2893 }
2894
2895 return rc;
2896}
2897
2898/**
2899 * Retires a given I/O request marking it as complete and notiyfing the
2900 * device/driver above about the completion if requested.
2901 *
2902 * @returns VBox status code.
2903 * @param pThis VBox disk container instance data.
2904 * @param pIoReq I/O request to complete.
2905 * @param rcReq The status code the request completed with.
2906 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
2907 */
2908static void drvvdMediaExIoReqRetire(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify)
2909{
2910 LogFlowFunc(("pThis=%#p pIoReq=%#p rcReq=%Rrc fUpNotify=%RTbool\n",
2911 pThis, pIoReq, rcReq, fUpNotify));
2912
2913 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_COMPLETING, VDIOREQSTATE_ACTIVE);
2914 if (fXchg)
2915 ASMAtomicDecU32(&pThis->cIoReqsActive);
2916 else
2917 {
2918 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
2919 rcReq = VERR_PDM_MEDIAEX_IOREQ_CANCELED;
2920 }
2921
2922 ASMAtomicXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_COMPLETED);
2923 drvvdMediaExIoReqBufFree(pThis, pIoReq);
2924
2925 /*
2926 * Leave a release log entry if the request was active for more than 25 seconds
2927 * (30 seconds is the timeout of the guest).
2928 */
2929 uint64_t tsNow = RTTimeMilliTS();
2930 if (tsNow - pIoReq->tsSubmit >= 25 * 1000)
2931 {
2932 const char *pcszReq = NULL;
2933
2934 switch (pIoReq->enmType)
2935 {
2936 case PDMMEDIAEXIOREQTYPE_READ:
2937 pcszReq = "Read";
2938 break;
2939 case PDMMEDIAEXIOREQTYPE_WRITE:
2940 pcszReq = "Write";
2941 break;
2942 case PDMMEDIAEXIOREQTYPE_FLUSH:
2943 pcszReq = "Flush";
2944 break;
2945 case PDMMEDIAEXIOREQTYPE_DISCARD:
2946 pcszReq = "Discard";
2947 break;
2948 default:
2949 pcszReq = "<Invalid>";
2950 }
2951
2952 LogRel(("VD#%u: %s request was active for %llu seconds\n",
2953 pThis->pDrvIns->iInstance, pcszReq, (tsNow - pIoReq->tsSubmit) / 1000));
2954 }
2955
2956 if (RT_FAILURE(rcReq))
2957 {
2958 /* Log the error. */
2959 if (pThis->cErrors++ < DRVVD_MAX_LOG_REL_ERRORS)
2960 {
2961 if (rcReq == VERR_PDM_MEDIAEX_IOREQ_CANCELED)
2962 {
2963 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
2964 LogRel(("VD#%u: Aborted flush returned rc=%Rrc\n",
2965 pThis->pDrvIns->iInstance, rcReq));
2966 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
2967 LogRel(("VD#%u: Aborted discard returned rc=%Rrc\n",
2968 pThis->pDrvIns->iInstance, rcReq));
2969 else
2970 LogRel(("VD#%u: Aborted %s (%u bytes left) returned rc=%Rrc\n",
2971 pThis->pDrvIns->iInstance,
2972 pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
2973 ? "read"
2974 : "write",
2975 pIoReq->ReadWrite.cbReqLeft, rcReq));
2976 }
2977 else
2978 {
2979 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
2980 LogRel(("VD#%u: Flush returned rc=%Rrc\n",
2981 pThis->pDrvIns->iInstance, rcReq));
2982 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
2983 LogRel(("VD#%u: Discard returned rc=%Rrc\n",
2984 pThis->pDrvIns->iInstance, rcReq));
2985 else
2986 LogRel(("VD#%u: %s (%u bytes left) returned rc=%Rrc\n",
2987 pThis->pDrvIns->iInstance,
2988 pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
2989 ? "Read"
2990 : "Write",
2991 pIoReq->ReadWrite.cbReqLeft, rcReq));
2992 }
2993 }
2994
2995 STAM_REL_COUNTER_INC(&pThis->StatReqsFailed);
2996 }
2997 else
2998 {
2999 STAM_REL_COUNTER_INC(&pThis->StatReqsSucceeded);
3000
3001 switch (pIoReq->enmType)
3002 {
3003 case PDMMEDIAEXIOREQTYPE_READ:
3004 STAM_REL_COUNTER_ADD(&pThis->StatBytesRead, pIoReq->ReadWrite.cbReq);
3005 break;
3006 case PDMMEDIAEXIOREQTYPE_WRITE:
3007 STAM_REL_COUNTER_ADD(&pThis->StatBytesWritten, pIoReq->ReadWrite.cbReq);
3008 break;
3009 default:
3010 break;
3011 }
3012 }
3013
3014 if (fUpNotify)
3015 {
3016 int rc = pThis->pDrvMediaExPort->pfnIoReqCompleteNotify(pThis->pDrvMediaExPort,
3017 pIoReq, &pIoReq->abAlloc[0], rcReq);
3018 AssertRC(rc);
3019 }
3020
3021 LogFlowFunc(("returns\n"));
3022}
3023
3024/**
3025 * I/O request completion worker.
3026 *
3027 * @returns VBox status code.
3028 * @param pThis VBox disk container instance data.
3029 * @param pIoReq I/O request to complete.
3030 * @param rcReq The status code the request completed with.
3031 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
3032 */
3033static int drvvdMediaExIoReqCompleteWorker(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, int rcReq, bool fUpNotify)
3034{
3035 LogFlowFunc(("pThis=%#p pIoReq=%#p rcReq=%Rrc fUpNotify=%RTbool\n",
3036 pThis, pIoReq, rcReq, fUpNotify));
3037
3038 /*
3039 * For a read we need to sync the memory before continuing to process
3040 * the request further.
3041 */
3042 if ( RT_SUCCESS(rcReq)
3043 && pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
3044 rcReq = drvvdMediaExIoReqBufSync(pThis, pIoReq, false /* fToIoBuf */);
3045
3046 /*
3047 * When the request owner instructs us to handle recoverable errors like full disks
3048 * do it. Mark the request as suspended, notify the owner and put the request on the
3049 * redo list.
3050 */
3051 if ( RT_FAILURE(rcReq)
3052 && (pIoReq->fFlags & PDMIMEDIAEX_F_SUSPEND_ON_RECOVERABLE_ERR)
3053 && drvvdMediaExIoReqIsRedoSetWarning(pThis, rcReq))
3054 {
3055 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_SUSPENDED, VDIOREQSTATE_ACTIVE);
3056 if (fXchg)
3057 {
3058 /* Put on redo list and adjust active request counter. */
3059 RTCritSectEnter(&pThis->CritSectIoReqRedo);
3060 RTListAppend(&pThis->LstIoReqRedo, &pIoReq->NdLstWait);
3061 RTCritSectLeave(&pThis->CritSectIoReqRedo);
3062 ASMAtomicDecU32(&pThis->cIoReqsActive);
3063 pThis->pDrvMediaExPort->pfnIoReqStateChanged(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
3064 PDMMEDIAEXIOREQSTATE_SUSPENDED);
3065 rcReq = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3066 }
3067 else
3068 {
3069 /* Request was canceled inbetween, so don't care and notify the owner about the completed request. */
3070 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3071 drvvdMediaExIoReqRetire(pThis, pIoReq, rcReq, fUpNotify);
3072 }
3073 }
3074 else
3075 {
3076 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3077 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3078 {
3079 /* Adjust the remaining amount to transfer. */
3080 Assert(pIoReq->ReadWrite.cbIoBuf > 0 || rcReq == VERR_PDM_MEDIAEX_IOREQ_CANCELED);
3081
3082 size_t cbReqIo = RT_MIN(pIoReq->ReadWrite.cbReqLeft, pIoReq->ReadWrite.cbIoBuf);
3083 pIoReq->ReadWrite.offStart += cbReqIo;
3084 pIoReq->ReadWrite.cbReqLeft -= cbReqIo;
3085 }
3086
3087 if ( RT_FAILURE(rcReq)
3088 || !pIoReq->ReadWrite.cbReqLeft
3089 || ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ
3090 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE))
3091 drvvdMediaExIoReqRetire(pThis, pIoReq, rcReq, fUpNotify);
3092 else
3093 drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, fUpNotify);
3094 }
3095
3096 LogFlowFunc(("returns %Rrc\n", rcReq));
3097 return rcReq;
3098}
3099
3100
3101/**
3102 * Allocates a memory buffer suitable for I/O for the given request.
3103 *
3104 * @returns VBox status code.
3105 * @retval VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS if there is no I/O memory available to allocate and
3106 * the request was placed on a waiting list.
3107 * @param pThis VBox disk container instance data.
3108 * @param pIoReq I/O request to allocate memory for.
3109 * @param cb Size of the buffer.
3110 */
3111DECLINLINE(int) drvvdMediaExIoReqBufAlloc(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cb)
3112{
3113 int rc = VERR_NOT_SUPPORTED;
3114 LogFlowFunc(("pThis=%#p pIoReq=%#p cb=%zu\n", pThis, pIoReq, cb));
3115
3116/** @todo This does not work at all with encryption enabled because the encryption plugin
3117 * encrypts the data in place trashing guest memory and causing data corruption later on!
3118 *
3119 * DO NOT ENABLE UNLESS YOU WANT YOUR DATA SHREDDED!!!
3120 */
3121#if 0
3122 if ( cb == _4K
3123 && pThis->pDrvMediaExPort->pfnIoReqQueryBuf)
3124 {
3125 /* Try to get a direct pointer to the buffer first. */
3126 void *pvBuf = NULL;
3127 size_t cbBuf = 0;
3128
3129 STAM_COUNTER_INC(&pThis->StatQueryBufAttempts);
3130 rc = pThis->pDrvMediaExPort->pfnIoReqQueryBuf(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
3131 &pvBuf, &cbBuf);
3132 if (RT_SUCCESS(rc))
3133 {
3134 STAM_COUNTER_INC(&pThis->StatQueryBufSuccess);
3135 pIoReq->ReadWrite.cbIoBuf = cbBuf;
3136 pIoReq->ReadWrite.fDirectBuf = true;
3137 pIoReq->ReadWrite.Direct.Seg.pvSeg = pvBuf;
3138 pIoReq->ReadWrite.Direct.Seg.cbSeg = cbBuf;
3139 RTSgBufInit(&pIoReq->ReadWrite.Direct.SgBuf, &pIoReq->ReadWrite.Direct.Seg, 1);
3140 pIoReq->ReadWrite.pSgBuf = &pIoReq->ReadWrite.Direct.SgBuf;
3141 }
3142 }
3143#endif
3144
3145 if (RT_FAILURE(rc))
3146 {
3147 rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReq->ReadWrite.IoBuf, cb, &pIoReq->ReadWrite.cbIoBuf);
3148 if (rc == VERR_NO_MEMORY)
3149 {
3150 LogFlowFunc(("Could not allocate memory for request, deferring\n"));
3151 RTCritSectEnter(&pThis->CritSectIoReqsIoBufWait);
3152 RTListAppend(&pThis->LstIoReqIoBufWait, &pIoReq->NdLstWait);
3153 RTCritSectLeave(&pThis->CritSectIoReqsIoBufWait);
3154 ASMAtomicIncU32(&pThis->cIoReqsWaiting);
3155 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3156 }
3157 else
3158 {
3159 LogFlowFunc(("Allocated %zu bytes of memory\n", pIoReq->ReadWrite.cbIoBuf));
3160 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
3161 pIoReq->ReadWrite.fDirectBuf = false;
3162 pIoReq->ReadWrite.pSgBuf = &pIoReq->ReadWrite.IoBuf.SgBuf;
3163 }
3164 }
3165
3166 LogFlowFunc(("returns %Rrc\n", rc));
3167 return rc;
3168}
3169
3170/**
3171 * Wrapper around the various ways to read from the underlying medium (cache, async vs. sync).
3172 *
3173 * @returns VBox status code.
3174 * @param pThis VBox disk container instance data.
3175 * @param pIoReq I/O request to process.
3176 * @param cbReqIo Transfer size.
3177 * @param pcbReqIo Where to store the amount of transferred data.
3178 */
3179static int drvvdMediaExIoReqReadWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cbReqIo, size_t *pcbReqIo)
3180{
3181 int rc = VINF_SUCCESS;
3182
3183 LogFlowFunc(("pThis=%#p pIoReq=%#p cbReqIo=%zu pcbReqIo=%#p\n", pThis, pIoReq, cbReqIo, pcbReqIo));
3184
3185 Assert(cbReqIo > 0);
3186
3187 if ( pThis->fAsyncIOSupported
3188 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3189 {
3190 if (pThis->pBlkCache)
3191 {
3192 rc = PDMR3BlkCacheRead(pThis->pBlkCache, pIoReq->ReadWrite.offStart,
3193 pIoReq->ReadWrite.pSgBuf, cbReqIo, pIoReq);
3194 if (rc == VINF_SUCCESS)
3195 rc = VINF_VD_ASYNC_IO_FINISHED;
3196 else if (rc == VINF_AIO_TASK_PENDING)
3197 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3198 }
3199 else
3200 rc = VDAsyncRead(pThis->pDisk, pIoReq->ReadWrite.offStart, cbReqIo, pIoReq->ReadWrite.pSgBuf,
3201 drvvdMediaExIoReqComplete, pThis, pIoReq);
3202 }
3203 else
3204 {
3205 void *pvBuf = RTSgBufGetNextSegment(pIoReq->ReadWrite.pSgBuf, &cbReqIo);
3206
3207 Assert(cbReqIo > 0 && VALID_PTR(pvBuf));
3208 rc = VDRead(pThis->pDisk, pIoReq->ReadWrite.offStart, pvBuf, cbReqIo);
3209 if (RT_SUCCESS(rc))
3210 rc = VINF_VD_ASYNC_IO_FINISHED;
3211 }
3212
3213 *pcbReqIo = cbReqIo;
3214
3215 LogFlowFunc(("returns %Rrc *pcbReqIo=%zu\n", rc, *pcbReqIo));
3216 return rc;
3217}
3218
3219/**
3220 * Wrapper around the various ways to write to the underlying medium (cache, async vs. sync).
3221 *
3222 * @returns VBox status code.
3223 * @param pThis VBox disk container instance data.
3224 * @param pIoReq I/O request to process.
3225 * @param cbReqIo Transfer size.
3226 * @param pcbReqIo Where to store the amount of transferred data.
3227 */
3228static int drvvdMediaExIoReqWriteWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, size_t cbReqIo, size_t *pcbReqIo)
3229{
3230 int rc = VINF_SUCCESS;
3231
3232 Assert(cbReqIo > 0);
3233
3234 LogFlowFunc(("pThis=%#p pIoReq=%#p cbReqIo=%zu pcbReqIo=%#p\n", pThis, pIoReq, cbReqIo, pcbReqIo));
3235
3236 if ( pThis->fAsyncIOSupported
3237 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3238 {
3239 if (pThis->pBlkCache)
3240 {
3241 rc = PDMR3BlkCacheWrite(pThis->pBlkCache, pIoReq->ReadWrite.offStart,
3242 pIoReq->ReadWrite.pSgBuf, cbReqIo, pIoReq);
3243 if (rc == VINF_SUCCESS)
3244 rc = VINF_VD_ASYNC_IO_FINISHED;
3245 else if (rc == VINF_AIO_TASK_PENDING)
3246 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3247 }
3248 else
3249 rc = VDAsyncWrite(pThis->pDisk, pIoReq->ReadWrite.offStart, cbReqIo, pIoReq->ReadWrite.pSgBuf,
3250 drvvdMediaExIoReqComplete, pThis, pIoReq);
3251 }
3252 else
3253 {
3254 void *pvBuf = RTSgBufGetNextSegment(pIoReq->ReadWrite.pSgBuf, &cbReqIo);
3255
3256 Assert(cbReqIo > 0 && VALID_PTR(pvBuf));
3257 rc = VDWrite(pThis->pDisk, pIoReq->ReadWrite.offStart, pvBuf, cbReqIo);
3258 if (RT_SUCCESS(rc))
3259 rc = VINF_VD_ASYNC_IO_FINISHED;
3260 }
3261
3262 *pcbReqIo = cbReqIo;
3263
3264 LogFlowFunc(("returns %Rrc *pcbReqIo=%zu\n", rc, *pcbReqIo));
3265 return rc;
3266}
3267
3268/**
3269 * Wrapper around the various ways to flush all data to the underlying medium (cache, async vs. sync).
3270 *
3271 * @returns VBox status code.
3272 * @param pThis VBox disk container instance data.
3273 * @param pIoReq I/O request to process.
3274 */
3275static int drvvdMediaExIoReqFlushWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3276{
3277 int rc = VINF_SUCCESS;
3278
3279 LogFlowFunc(("pThis=%#p pIoReq=%#p\n", pThis, pIoReq));
3280
3281 if ( pThis->fAsyncIOSupported
3282 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3283 {
3284 if (pThis->pBlkCache)
3285 {
3286 rc = PDMR3BlkCacheFlush(pThis->pBlkCache, pIoReq);
3287 if (rc == VINF_SUCCESS)
3288 rc = VINF_VD_ASYNC_IO_FINISHED;
3289 else if (rc == VINF_AIO_TASK_PENDING)
3290 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3291 }
3292 else
3293 rc = VDAsyncFlush(pThis->pDisk, drvvdMediaExIoReqComplete, pThis, pIoReq);
3294 }
3295 else
3296 {
3297 rc = VDFlush(pThis->pDisk);
3298 if (RT_SUCCESS(rc))
3299 rc = VINF_VD_ASYNC_IO_FINISHED;
3300 }
3301
3302 LogFlowFunc(("returns %Rrc\n", rc));
3303 return rc;
3304}
3305
3306/**
3307 * Wrapper around the various ways to discard data blocks on the underlying medium (cache, async vs. sync).
3308 *
3309 * @returns VBox status code.
3310 * @param pThis VBox disk container instance data.
3311 * @param pIoReq I/O request to process.
3312 */
3313static int drvvdMediaExIoReqDiscardWrapper(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3314{
3315 int rc = VINF_SUCCESS;
3316
3317 LogFlowFunc(("pThis=%#p pIoReq=%#p\n", pThis, pIoReq));
3318
3319 if ( pThis->fAsyncIOSupported
3320 && !(pIoReq->fFlags & PDMIMEDIAEX_F_SYNC))
3321 {
3322 if (pThis->pBlkCache)
3323 {
3324 rc = PDMR3BlkCacheDiscard(pThis->pBlkCache, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges, pIoReq);
3325 if (rc == VINF_SUCCESS)
3326 rc = VINF_VD_ASYNC_IO_FINISHED;
3327 else if (rc == VINF_AIO_TASK_PENDING)
3328 rc = VERR_VD_ASYNC_IO_IN_PROGRESS;
3329 }
3330 else
3331 rc = VDAsyncDiscardRanges(pThis->pDisk, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges,
3332 drvvdMediaExIoReqComplete, pThis, pIoReq);
3333 }
3334 else
3335 {
3336 rc = VDDiscardRanges(pThis->pDisk, pIoReq->Discard.paRanges, pIoReq->Discard.cRanges);
3337 if (RT_SUCCESS(rc))
3338 rc = VINF_VD_ASYNC_IO_FINISHED;
3339 }
3340
3341 LogFlowFunc(("returns %Rrc\n", rc));
3342 return rc;
3343}
3344
3345/**
3346 * Processes a read/write request.
3347 *
3348 * @returns VBox status code.
3349 * @param pThis VBox disk container instance data.
3350 * @param pIoReq I/O request to process.
3351 * @param fUpNotify Flag whether to notify the driver/device above us about the completion.
3352 */
3353static int drvvdMediaExIoReqReadWriteProcess(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq, bool fUpNotify)
3354{
3355 int rc = VINF_SUCCESS;
3356
3357 LogFlowFunc(("pThis=%#p pIoReq=%#p fUpNotify=%RTbool\n", pThis, pIoReq, fUpNotify));
3358
3359 Assert(pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE);
3360
3361 rc = drvvdKeyCheckPrereqs(pThis, false /* fSetError */);
3362
3363 while ( pIoReq->ReadWrite.cbReqLeft
3364 && rc == VINF_SUCCESS)
3365 {
3366 Assert(pIoReq->ReadWrite.cbIoBuf > 0);
3367
3368 size_t cbReqIo = RT_MIN(pIoReq->ReadWrite.cbReqLeft, pIoReq->ReadWrite.cbIoBuf);
3369
3370 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
3371 rc = drvvdMediaExIoReqReadWrapper(pThis, pIoReq, cbReqIo, &cbReqIo);
3372 else
3373 {
3374 /* Sync memory buffer from the request initiator. */
3375 rc = drvvdMediaExIoReqBufSync(pThis, pIoReq, true /* fToIoBuf */);
3376 if (RT_SUCCESS(rc))
3377 rc = drvvdMediaExIoReqWriteWrapper(pThis, pIoReq, cbReqIo, &cbReqIo);
3378 }
3379
3380 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3381 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3382 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
3383 {
3384 /*
3385 * Don't sync the buffer or update the I/O state for the last chunk as it is done
3386 * already in the completion worker called below.
3387 */
3388 if (cbReqIo < pIoReq->ReadWrite.cbReqLeft)
3389 {
3390 if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ)
3391 rc = drvvdMediaExIoReqBufSync(pThis, pIoReq, false /* fToIoBuf */);
3392 else
3393 rc = VINF_SUCCESS;
3394 pIoReq->ReadWrite.offStart += cbReqIo;
3395 pIoReq->ReadWrite.cbReqLeft -= cbReqIo;
3396 }
3397 else
3398 {
3399 rc = VINF_SUCCESS;
3400 break;
3401 }
3402 }
3403 }
3404
3405 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
3406 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, fUpNotify);
3407
3408 LogFlowFunc(("returns %Rrc\n", rc));
3409 return rc;
3410}
3411
3412
3413/**
3414 * Frees a I/O memory buffer allocated previously.
3415 *
3416 * @returns nothing.
3417 * @param pThis VBox disk container instance data.
3418 * @param pIoReq I/O request for which to free memory.
3419 */
3420DECLINLINE(void) drvvdMediaExIoReqBufFree(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3421{
3422 LogFlowFunc(("pThis=%#p pIoReq=%#p{.cbIoBuf=%zu}\n", pThis, pIoReq, pIoReq->ReadWrite.cbIoBuf));
3423
3424 if ( ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3425 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3426 && !pIoReq->ReadWrite.fDirectBuf
3427 && pIoReq->ReadWrite.cbIoBuf > 0)
3428 {
3429 IOBUFMgrFreeBuf(&pIoReq->ReadWrite.IoBuf);
3430
3431 uint32_t cIoReqsWaiting = ASMAtomicXchgU32(&pThis->cIoReqsWaiting, 0);
3432 if (cIoReqsWaiting > 0)
3433 {
3434 RTLISTANCHOR LstIoReqProcess;
3435 RTLISTANCHOR LstIoReqCanceled;
3436 RTListInit(&LstIoReqProcess);
3437 RTListInit(&LstIoReqCanceled);
3438
3439 /* Try to process as many requests as possible. */
3440 RTCritSectEnter(&pThis->CritSectIoReqsIoBufWait);
3441 PPDMMEDIAEXIOREQINT pIoReqCur, pIoReqNext;
3442
3443 RTListForEachSafe(&pThis->LstIoReqIoBufWait, pIoReqCur, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
3444 {
3445 LogFlowFunc(("Found I/O request %#p on waiting list, trying to allocate buffer of size %zu bytes\n",
3446 pIoReqCur, pIoReqCur->ReadWrite.cbReq));
3447
3448 /* Allocate a suitable I/O buffer for this request. */
3449 int rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReqCur->ReadWrite.IoBuf, pIoReqCur->ReadWrite.cbReq,
3450 &pIoReqCur->ReadWrite.cbIoBuf);
3451 if (rc == VINF_SUCCESS)
3452 {
3453 Assert(pIoReqCur->ReadWrite.cbIoBuf > 0);
3454
3455 cIoReqsWaiting--;
3456 RTListNodeRemove(&pIoReqCur->NdLstWait);
3457
3458 pIoReqCur->ReadWrite.fDirectBuf = false;
3459 pIoReqCur->ReadWrite.pSgBuf = &pIoReqCur->ReadWrite.IoBuf.SgBuf;
3460
3461 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReqCur->enmState,
3462 VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3463 if (RT_UNLIKELY(!fXchg))
3464 {
3465 /* Must have been canceled inbetween. */
3466 Assert(pIoReqCur->enmState == VDIOREQSTATE_CANCELED);
3467
3468 /* Free the buffer here already again to let other requests get a chance to allocate the memory. */
3469 IOBUFMgrFreeBuf(&pIoReq->ReadWrite.IoBuf);
3470 pIoReqCur->ReadWrite.cbIoBuf = 0;
3471 RTListAppend(&LstIoReqCanceled, &pIoReqCur->NdLstWait);
3472 }
3473 else
3474 {
3475 ASMAtomicIncU32(&pThis->cIoReqsActive);
3476 RTListAppend(&LstIoReqProcess, &pIoReqCur->NdLstWait);
3477 }
3478 }
3479 else
3480 {
3481 Assert(rc == VERR_NO_MEMORY);
3482 break;
3483 }
3484 }
3485 RTCritSectLeave(&pThis->CritSectIoReqsIoBufWait);
3486
3487 ASMAtomicAddU32(&pThis->cIoReqsWaiting, cIoReqsWaiting);
3488
3489 /* Process the requests we could allocate memory for and the ones which got canceled outside the lock now. */
3490 RTListForEachSafe(&LstIoReqCanceled, pIoReqCur, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
3491 {
3492 RTListNodeRemove(&pIoReqCur->NdLstWait);
3493 drvvdMediaExIoReqCompleteWorker(pThis, pIoReqCur, VERR_PDM_MEDIAEX_IOREQ_CANCELED, true /* fUpNotify */);
3494 }
3495
3496 RTListForEachSafe(&LstIoReqProcess, pIoReqCur, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
3497 {
3498 RTListNodeRemove(&pIoReqCur->NdLstWait);
3499 drvvdMediaExIoReqReadWriteProcess(pThis, pIoReqCur, true /* fUpNotify */);
3500 }
3501 }
3502 }
3503
3504 LogFlowFunc(("returns\n"));
3505}
3506
3507
3508/**
3509 * Returns a string description of the given request state.
3510 *
3511 * @returns Pointer to the stringified state.
3512 * @param enmState The state.
3513 */
3514DECLINLINE(const char *) drvvdMediaExIoReqStateStringify(VDIOREQSTATE enmState)
3515{
3516#define STATE2STR(a_State) case VDIOREQSTATE_##a_State: return #a_State
3517 switch (enmState)
3518 {
3519 STATE2STR(INVALID);
3520 STATE2STR(FREE);
3521 STATE2STR(ALLOCATED);
3522 STATE2STR(ACTIVE);
3523 STATE2STR(SUSPENDED);
3524 STATE2STR(COMPLETING);
3525 STATE2STR(COMPLETED);
3526 STATE2STR(CANCELED);
3527 default:
3528 AssertMsgFailed(("Unknown state %u\n", enmState));
3529 return "UNKNOWN";
3530 }
3531#undef STATE2STR
3532}
3533
3534
3535/**
3536 * Returns a string description of the given request type.
3537 *
3538 * @returns Pointer to the stringified type.
3539 * @param enmType The request type.
3540 */
3541DECLINLINE(const char *) drvvdMediaExIoReqTypeStringify(PDMMEDIAEXIOREQTYPE enmType)
3542{
3543#define TYPE2STR(a_Type) case PDMMEDIAEXIOREQTYPE_##a_Type: return #a_Type
3544 switch (enmType)
3545 {
3546 TYPE2STR(INVALID);
3547 TYPE2STR(FLUSH);
3548 TYPE2STR(WRITE);
3549 TYPE2STR(READ);
3550 TYPE2STR(DISCARD);
3551 TYPE2STR(SCSI);
3552 default:
3553 AssertMsgFailed(("Unknown type %u\n", enmType));
3554 return "UNKNOWN";
3555 }
3556#undef TYPE2STR
3557}
3558
3559
3560/**
3561 * Dumps the interesting bits about the given I/O request to the release log.
3562 *
3563 * @returns nothing.
3564 * @param pThis VBox disk container instance data.
3565 * @param pIoReq The I/O request to dump.
3566 */
3567static void drvvdMediaExIoReqLogRel(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3568{
3569 uint64_t offStart = 0;
3570 size_t cbReq = 0;
3571 size_t cbLeft = 0;
3572 size_t cbBufSize = 0;
3573 uint64_t tsActive = RTTimeMilliTS() - pIoReq->tsSubmit;
3574
3575 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3576 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3577 {
3578 offStart = pIoReq->ReadWrite.offStart;
3579 cbReq = pIoReq->ReadWrite.cbReq;
3580 cbLeft = pIoReq->ReadWrite.cbReqLeft;
3581 cbBufSize = pIoReq->ReadWrite.cbIoBuf;
3582 }
3583
3584 LogRel(("VD#%u: Request{%#p}:\n"
3585 " Type=%s State=%s Id=%#llx SubmitTs=%llu {%llu} Flags=%#x\n"
3586 " Offset=%llu Size=%zu Left=%zu BufSize=%zu\n",
3587 pThis->pDrvIns->iInstance, pIoReq,
3588 drvvdMediaExIoReqTypeStringify(pIoReq->enmType),
3589 drvvdMediaExIoReqStateStringify(pIoReq->enmState),
3590 pIoReq->uIoReqId, pIoReq->tsSubmit, tsActive, pIoReq->fFlags,
3591 offStart, cbReq, cbLeft, cbBufSize));
3592}
3593
3594
3595/**
3596 * Returns whether the VM is in a running state.
3597 *
3598 * @returns Flag indicating whether the VM is currently in a running state.
3599 * @param pThis VBox disk container instance data.
3600 */
3601DECLINLINE(bool) drvvdMediaExIoReqIsVmRunning(PVBOXDISK pThis)
3602{
3603 VMSTATE enmVmState = PDMDrvHlpVMState(pThis->pDrvIns);
3604 if ( enmVmState == VMSTATE_RESUMING
3605 || enmVmState == VMSTATE_RUNNING
3606 || enmVmState == VMSTATE_RUNNING_LS
3607 || enmVmState == VMSTATE_RUNNING_FT
3608 || enmVmState == VMSTATE_RESETTING
3609 || enmVmState == VMSTATE_RESETTING_LS
3610 || enmVmState == VMSTATE_SOFT_RESETTING
3611 || enmVmState == VMSTATE_SOFT_RESETTING_LS
3612 || enmVmState == VMSTATE_SUSPENDING
3613 || enmVmState == VMSTATE_SUSPENDING_LS
3614 || enmVmState == VMSTATE_SUSPENDING_EXT_LS)
3615 return true;
3616
3617 return false;
3618}
3619
3620/**
3621 * @copydoc FNVDASYNCTRANSFERCOMPLETE
3622 */
3623static DECLCALLBACK(void) drvvdMediaExIoReqComplete(void *pvUser1, void *pvUser2, int rcReq)
3624{
3625 PVBOXDISK pThis = (PVBOXDISK)pvUser1;
3626 PPDMMEDIAEXIOREQINT pIoReq = (PPDMMEDIAEXIOREQINT)pvUser2;
3627
3628 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rcReq, true /* fUpNotify */);
3629}
3630
3631/**
3632 * Tries to cancel the given I/O request returning the result.
3633 *
3634 * @returns Flag whether the request was successfully canceled or whether it
3635 * already complete inbetween.
3636 * @param pThis VBox disk container instance data.
3637 * @param pIoReq The I/O request to cancel.
3638 */
3639static bool drvvdMediaExIoReqCancel(PVBOXDISK pThis, PPDMMEDIAEXIOREQINT pIoReq)
3640{
3641 bool fXchg = false;
3642 VDIOREQSTATE enmStateOld = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3643
3644 drvvdMediaExIoReqLogRel(pThis, pIoReq);
3645
3646 /*
3647 * We might have to try canceling the request multiple times if it transitioned from
3648 * ALLOCATED to ACTIVE or to SUSPENDED between reading the state and trying to change it.
3649 */
3650 while ( ( enmStateOld == VDIOREQSTATE_ALLOCATED
3651 || enmStateOld == VDIOREQSTATE_ACTIVE
3652 || enmStateOld == VDIOREQSTATE_SUSPENDED)
3653 && !fXchg)
3654 {
3655 fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_CANCELED, enmStateOld);
3656 if (fXchg)
3657 break;
3658
3659 enmStateOld = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3660 }
3661
3662 if (fXchg)
3663 ASMAtomicDecU32(&pThis->cIoReqsActive);
3664
3665 return fXchg;
3666}
3667
3668/**
3669 * @interface_method_impl{PDMIMEDIAEX,pfnQueryFeatures}
3670 */
3671static DECLCALLBACK(int) drvvdQueryFeatures(PPDMIMEDIAEX pInterface, uint32_t *pfFeatures)
3672{
3673 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3674
3675 AssertPtrReturn(pfFeatures, VERR_INVALID_POINTER);
3676
3677 uint32_t fFeatures = 0;
3678 if (pThis->fAsyncIOSupported)
3679 fFeatures |= PDMIMEDIAEX_FEATURE_F_ASYNC;
3680 if (pThis->IMedia.pfnDiscard)
3681 fFeatures |= PDMIMEDIAEX_FEATURE_F_DISCARD;
3682
3683 *pfFeatures = fFeatures;
3684
3685 return VINF_SUCCESS;
3686}
3687
3688
3689/**
3690 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqAllocSizeSet}
3691 */
3692static DECLCALLBACK(int) drvvdIoReqAllocSizeSet(PPDMIMEDIAEX pInterface, size_t cbIoReqAlloc)
3693{
3694 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3695 if (RT_UNLIKELY(pThis->hIoReqCache != NIL_RTMEMCACHE))
3696 return VERR_INVALID_STATE;
3697
3698 return RTMemCacheCreate(&pThis->hIoReqCache, sizeof(PDMMEDIAEXIOREQINT) + cbIoReqAlloc, 0, UINT32_MAX,
3699 NULL, NULL, NULL, 0);
3700}
3701
3702/**
3703 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqAlloc}
3704 */
3705static DECLCALLBACK(int) drvvdIoReqAlloc(PPDMIMEDIAEX pInterface, PPDMMEDIAEXIOREQ phIoReq, void **ppvIoReqAlloc,
3706 PDMMEDIAEXIOREQID uIoReqId, uint32_t fFlags)
3707{
3708 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3709
3710 AssertReturn(!(fFlags & ~PDMIMEDIAEX_F_VALID), VERR_INVALID_PARAMETER);
3711
3712 PPDMMEDIAEXIOREQINT pIoReq = (PPDMMEDIAEXIOREQINT)RTMemCacheAlloc(pThis->hIoReqCache);
3713
3714 if (RT_UNLIKELY(!pIoReq))
3715 return VERR_NO_MEMORY;
3716
3717 pIoReq->uIoReqId = uIoReqId;
3718 pIoReq->fFlags = fFlags;
3719 pIoReq->pDisk = pThis;
3720 pIoReq->enmState = VDIOREQSTATE_ALLOCATED;
3721 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_INVALID;
3722
3723 int rc = drvvdMediaExIoReqInsert(pThis, pIoReq);
3724 if (RT_SUCCESS(rc))
3725 {
3726 *phIoReq = pIoReq;
3727 *ppvIoReqAlloc = &pIoReq->abAlloc[0];
3728 }
3729 else
3730 RTMemCacheFree(pThis->hIoReqCache, pIoReq);
3731
3732 return rc;
3733}
3734
3735/**
3736 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqFree}
3737 */
3738static DECLCALLBACK(int) drvvdIoReqFree(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq)
3739{
3740 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3741 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3742
3743 if ( pIoReq->enmState != VDIOREQSTATE_COMPLETED
3744 && pIoReq->enmState != VDIOREQSTATE_ALLOCATED)
3745 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3746
3747 /* Remove from allocated list. */
3748 int rc = drvvdMediaExIoReqRemove(pThis, pIoReq);
3749 if (RT_FAILURE(rc))
3750 return rc;
3751
3752 /* Free any associated I/O memory. */
3753 drvvdMediaExIoReqBufFree(pThis, pIoReq);
3754
3755 /* For discard request discard the range array. */
3756 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD
3757 && pIoReq->Discard.paRanges)
3758 {
3759 RTMemFree(pIoReq->Discard.paRanges);
3760 pIoReq->Discard.paRanges = NULL;
3761 }
3762
3763 pIoReq->enmState = VDIOREQSTATE_FREE;
3764 RTMemCacheFree(pThis->hIoReqCache, pIoReq);
3765 return VINF_SUCCESS;
3766}
3767
3768/**
3769 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQueryResidual}
3770 */
3771static DECLCALLBACK(int) drvvdIoReqQueryResidual(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, size_t *pcbResidual)
3772{
3773 RT_NOREF1(pInterface);
3774
3775 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3776
3777 if (pIoReq->enmState != VDIOREQSTATE_COMPLETED)
3778 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3779
3780 if ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ
3781 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE
3782 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_FLUSH)
3783 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3784
3785 *pcbResidual = 0; /* No data left to transfer always. */
3786 return VINF_SUCCESS;
3787}
3788
3789/**
3790 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQueryXferSize}
3791 */
3792static DECLCALLBACK(int) drvvdIoReqQueryXferSize(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, size_t *pcbXfer)
3793{
3794 int rc = VINF_SUCCESS;
3795 RT_NOREF1(pInterface);
3796
3797 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3798
3799 if (pIoReq->enmState != VDIOREQSTATE_COMPLETED)
3800 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3801
3802 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
3803 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
3804 *pcbXfer = pIoReq->ReadWrite.cbReq;
3805 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
3806 *pcbXfer = 0;
3807 else
3808 rc = VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3809
3810 return rc;
3811}
3812
3813/**
3814 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqCancelAll}
3815 */
3816static DECLCALLBACK(int) drvvdIoReqCancelAll(PPDMIMEDIAEX pInterface)
3817{
3818 int rc = VINF_SUCCESS;
3819 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3820
3821 LogRel(("VD#%u: Cancelling all active requests\n", pThis->pDrvIns->iInstance));
3822
3823 for (unsigned idxBin = 0; idxBin < RT_ELEMENTS(pThis->aIoReqAllocBins); idxBin++)
3824 {
3825 rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3826 if (RT_SUCCESS(rc))
3827 {
3828 /* Search for I/O request with ID. */
3829 PPDMMEDIAEXIOREQINT pIt;
3830
3831 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
3832 {
3833 drvvdMediaExIoReqCancel(pThis, pIt);
3834 }
3835 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3836 }
3837 }
3838
3839 return rc;
3840}
3841
3842/**
3843 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqCancel}
3844 */
3845static DECLCALLBACK(int) drvvdIoReqCancel(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQID uIoReqId)
3846{
3847 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3848 unsigned idxBin = drvvdMediaExIoReqIdHash(uIoReqId);
3849
3850 LogRel(("VD#%u: Trying to cancel request %#llx\n", pThis->pDrvIns->iInstance, uIoReqId));
3851
3852 int rc = RTSemFastMutexRequest(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3853 if (RT_SUCCESS(rc))
3854 {
3855 /* Search for I/O request with ID. */
3856 PPDMMEDIAEXIOREQINT pIt;
3857 rc = VERR_PDM_MEDIAEX_IOREQID_NOT_FOUND;
3858
3859 RTListForEach(&pThis->aIoReqAllocBins[idxBin].LstIoReqAlloc, pIt, PDMMEDIAEXIOREQINT, NdAllocatedList)
3860 {
3861 if (pIt->uIoReqId == uIoReqId)
3862 {
3863 if (drvvdMediaExIoReqCancel(pThis, pIt))
3864 rc = VINF_SUCCESS;
3865
3866 break;
3867 }
3868 }
3869 RTSemFastMutexRelease(pThis->aIoReqAllocBins[idxBin].hMtxLstIoReqAlloc);
3870 }
3871
3872 return rc;
3873}
3874
3875/**
3876 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqRead}
3877 */
3878static DECLCALLBACK(int) drvvdIoReqRead(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint64_t off, size_t cbRead)
3879{
3880 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3881 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3882 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3883
3884 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3885 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3886
3887 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3888 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3889
3890 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
3891 STAM_REL_COUNTER_INC(&pThis->StatReqsRead);
3892
3893 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_READ;
3894 pIoReq->tsSubmit = RTTimeMilliTS();
3895 pIoReq->ReadWrite.offStart = off;
3896 pIoReq->ReadWrite.cbReq = cbRead;
3897 pIoReq->ReadWrite.cbReqLeft = cbRead;
3898 /* Allocate a suitable I/O buffer for this request. */
3899 int rc = drvvdMediaExIoReqBufAlloc(pThis, pIoReq, cbRead);
3900 if (rc == VINF_SUCCESS)
3901 {
3902 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3903 if (RT_UNLIKELY(!fXchg))
3904 {
3905 /* Must have been canceled inbetween. */
3906 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3907 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3908 }
3909 ASMAtomicIncU32(&pThis->cIoReqsActive);
3910
3911 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, false /* fUpNotify */);
3912 }
3913
3914 return rc;
3915}
3916
3917/**
3918 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqWrite}
3919 */
3920static DECLCALLBACK(int) drvvdIoReqWrite(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint64_t off, size_t cbWrite)
3921{
3922 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3923 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3924 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3925
3926 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3927 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3928
3929 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3930 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3931
3932 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
3933 STAM_REL_COUNTER_INC(&pThis->StatReqsWrite);
3934
3935 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_WRITE;
3936 pIoReq->tsSubmit = RTTimeMilliTS();
3937 pIoReq->ReadWrite.offStart = off;
3938 pIoReq->ReadWrite.cbReq = cbWrite;
3939 pIoReq->ReadWrite.cbReqLeft = cbWrite;
3940 /* Allocate a suitable I/O buffer for this request. */
3941 int rc = drvvdMediaExIoReqBufAlloc(pThis, pIoReq, cbWrite);
3942 if (rc == VINF_SUCCESS)
3943 {
3944 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3945 if (RT_UNLIKELY(!fXchg))
3946 {
3947 /* Must have been canceled inbetween. */
3948 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3949 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3950 }
3951 ASMAtomicIncU32(&pThis->cIoReqsActive);
3952
3953 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, false /* fUpNotify */);
3954 }
3955
3956 return rc;
3957}
3958
3959/**
3960 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqFlush}
3961 */
3962static DECLCALLBACK(int) drvvdIoReqFlush(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq)
3963{
3964 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
3965 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
3966 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
3967
3968 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
3969 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3970
3971 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
3972 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
3973
3974 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
3975 STAM_REL_COUNTER_INC(&pThis->StatReqsFlush);
3976
3977 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_FLUSH;
3978 pIoReq->tsSubmit = RTTimeMilliTS();
3979 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
3980 if (RT_UNLIKELY(!fXchg))
3981 {
3982 /* Must have been canceled inbetween. */
3983 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
3984 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
3985 }
3986
3987 ASMAtomicIncU32(&pThis->cIoReqsActive);
3988 int rc = drvvdMediaExIoReqFlushWrapper(pThis, pIoReq);
3989 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
3990 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
3991 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
3992 rc = VINF_SUCCESS;
3993
3994 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
3995 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, false /* fUpNotify */);
3996
3997 return rc;
3998}
3999
4000/**
4001 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqDiscard}
4002 */
4003static DECLCALLBACK(int) drvvdIoReqDiscard(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, unsigned cRangesMax)
4004{
4005 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4006 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
4007 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
4008
4009 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
4010 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
4011
4012 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
4013 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
4014
4015 STAM_REL_COUNTER_INC(&pThis->StatReqsSubmitted);
4016 STAM_REL_COUNTER_INC(&pThis->StatReqsDiscard);
4017
4018 /* Copy the ranges over now, this can be optimized in the future. */
4019 pIoReq->Discard.paRanges = (PRTRANGE)RTMemAllocZ(cRangesMax * sizeof(RTRANGE));
4020 if (RT_UNLIKELY(!pIoReq->Discard.paRanges))
4021 return VERR_NO_MEMORY;
4022
4023 int rc = pThis->pDrvMediaExPort->pfnIoReqQueryDiscardRanges(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
4024 0, cRangesMax, pIoReq->Discard.paRanges,
4025 &pIoReq->Discard.cRanges);
4026 if (RT_SUCCESS(rc))
4027 {
4028 pIoReq->enmType = PDMMEDIAEXIOREQTYPE_DISCARD;
4029 pIoReq->tsSubmit = RTTimeMilliTS();
4030 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_ALLOCATED);
4031 if (RT_UNLIKELY(!fXchg))
4032 {
4033 /* Must have been canceled inbetween. */
4034 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
4035 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
4036 }
4037
4038 ASMAtomicIncU32(&pThis->cIoReqsActive);
4039 rc = drvvdMediaExIoReqDiscardWrapper(pThis, pIoReq);
4040 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4041 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
4042 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
4043 rc = VINF_SUCCESS;
4044
4045 if (rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS)
4046 rc = drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, false /* fUpNotify */);
4047 }
4048
4049 return rc;
4050}
4051
4052/**
4053 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSendScsiCmd}
4054 */
4055static DECLCALLBACK(int) drvvdIoReqSendScsiCmd(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq, uint32_t uLun,
4056 const uint8_t *pbCdb, size_t cbCdb, PDMMEDIAEXIOREQSCSITXDIR enmTxDir,
4057 size_t cbBuf, uint8_t *pabSense, size_t cbSense, uint8_t *pu8ScsiSts,
4058 uint32_t cTimeoutMillies)
4059{
4060 RT_NOREF10(pInterface, uLun, pbCdb, cbCdb, enmTxDir, cbBuf, pabSense, cbSense, pu8ScsiSts, cTimeoutMillies);
4061 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
4062 VDIOREQSTATE enmState = (VDIOREQSTATE)ASMAtomicReadU32((volatile uint32_t *)&pIoReq->enmState);
4063
4064 if (RT_UNLIKELY(enmState == VDIOREQSTATE_CANCELED))
4065 return VERR_PDM_MEDIAEX_IOREQ_CANCELED;
4066
4067 if (RT_UNLIKELY(enmState != VDIOREQSTATE_ALLOCATED))
4068 return VERR_PDM_MEDIAEX_IOREQ_INVALID_STATE;
4069
4070 return VERR_NOT_SUPPORTED;
4071}
4072
4073/**
4074 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqGetActiveCount}
4075 */
4076static DECLCALLBACK(uint32_t) drvvdIoReqGetActiveCount(PPDMIMEDIAEX pInterface)
4077{
4078 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4079 return ASMAtomicReadU32(&pThis->cIoReqsActive);
4080}
4081
4082/**
4083 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqGetSuspendedCount}
4084 */
4085static DECLCALLBACK(uint32_t) drvvdIoReqGetSuspendedCount(PPDMIMEDIAEX pInterface)
4086{
4087 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4088
4089 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), 0);
4090
4091 uint32_t cIoReqSuspended = 0;
4092 PPDMMEDIAEXIOREQINT pIoReq;
4093 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4094 RTListForEach(&pThis->LstIoReqRedo, pIoReq, PDMMEDIAEXIOREQINT, NdLstWait)
4095 {
4096 cIoReqSuspended++;
4097 }
4098 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4099
4100 return cIoReqSuspended;
4101}
4102
4103/**
4104 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQuerySuspendedStart}
4105 */
4106static DECLCALLBACK(int) drvvdIoReqQuerySuspendedStart(PPDMIMEDIAEX pInterface, PPDMMEDIAEXIOREQ phIoReq,
4107 void **ppvIoReqAlloc)
4108{
4109 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4110
4111 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
4112 AssertReturn(!RTListIsEmpty(&pThis->LstIoReqRedo), VERR_NOT_FOUND);
4113
4114 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4115 PPDMMEDIAEXIOREQINT pIoReq = RTListGetFirst(&pThis->LstIoReqRedo, PDMMEDIAEXIOREQINT, NdLstWait);
4116 *phIoReq = pIoReq;
4117 *ppvIoReqAlloc = &pIoReq->abAlloc[0];
4118 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4119
4120 return VINF_SUCCESS;
4121}
4122
4123/**
4124 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqQuerySuspendedNext}
4125 */
4126static DECLCALLBACK(int) drvvdIoReqQuerySuspendedNext(PPDMIMEDIAEX pInterface, PDMMEDIAEXIOREQ hIoReq,
4127 PPDMMEDIAEXIOREQ phIoReqNext, void **ppvIoReqAllocNext)
4128{
4129 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4130 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
4131
4132 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
4133 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
4134 AssertReturn(!RTListNodeIsLast(&pThis->LstIoReqRedo, &pIoReq->NdLstWait), VERR_NOT_FOUND);
4135
4136 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4137 PPDMMEDIAEXIOREQINT pIoReqNext = RTListNodeGetNext(&pIoReq->NdLstWait, PDMMEDIAEXIOREQINT, NdLstWait);
4138 *phIoReqNext = pIoReqNext;
4139 *ppvIoReqAllocNext = &pIoReqNext->abAlloc[0];
4140 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4141
4142 return VINF_SUCCESS;
4143}
4144
4145/**
4146 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSuspendedSave}
4147 */
4148static DECLCALLBACK(int) drvvdIoReqSuspendedSave(PPDMIMEDIAEX pInterface, PSSMHANDLE pSSM, PDMMEDIAEXIOREQ hIoReq)
4149{
4150 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4151 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
4152
4153 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
4154 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
4155 AssertReturn(pIoReq->enmState == VDIOREQSTATE_SUSPENDED, VERR_INVALID_STATE);
4156
4157 SSMR3PutU32(pSSM, DRVVD_IOREQ_SAVED_STATE_VERSION);
4158 SSMR3PutU32(pSSM, (uint32_t)pIoReq->enmType);
4159 SSMR3PutU32(pSSM, pIoReq->uIoReqId);
4160 SSMR3PutU32(pSSM, pIoReq->fFlags);
4161 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
4162 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
4163 {
4164 SSMR3PutU64(pSSM, pIoReq->ReadWrite.offStart);
4165 SSMR3PutU64(pSSM, pIoReq->ReadWrite.cbReq);
4166 SSMR3PutU64(pSSM, pIoReq->ReadWrite.cbReqLeft);
4167 }
4168 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
4169 {
4170 SSMR3PutU32(pSSM, pIoReq->Discard.cRanges);
4171 for (unsigned i = 0; i < pIoReq->Discard.cRanges; i++)
4172 {
4173 SSMR3PutU64(pSSM, pIoReq->Discard.paRanges[i].offStart);
4174 SSMR3PutU64(pSSM, pIoReq->Discard.paRanges[i].cbRange);
4175 }
4176 }
4177
4178 return SSMR3PutU32(pSSM, UINT32_MAX); /* sanity/terminator */
4179}
4180
4181/**
4182 * @interface_method_impl{PDMIMEDIAEX,pfnIoReqSuspendedLoad}
4183 */
4184static DECLCALLBACK(int) drvvdIoReqSuspendedLoad(PPDMIMEDIAEX pInterface, PSSMHANDLE pSSM, PDMMEDIAEXIOREQ hIoReq)
4185{
4186 PVBOXDISK pThis = RT_FROM_MEMBER(pInterface, VBOXDISK, IMediaEx);
4187 PPDMMEDIAEXIOREQINT pIoReq = hIoReq;
4188
4189 AssertReturn(!drvvdMediaExIoReqIsVmRunning(pThis), VERR_INVALID_STATE);
4190 AssertPtrReturn(pIoReq, VERR_INVALID_HANDLE);
4191 AssertReturn(pIoReq->enmState == VDIOREQSTATE_ALLOCATED, VERR_INVALID_STATE);
4192
4193 uint32_t u32;
4194 uint64_t u64;
4195 int rc = VINF_SUCCESS;
4196 bool fPlaceOnRedoList = true;
4197
4198 SSMR3GetU32(pSSM, &u32);
4199 if (u32 <= DRVVD_IOREQ_SAVED_STATE_VERSION)
4200 {
4201 SSMR3GetU32(pSSM, &u32);
4202 AssertReturn( u32 == PDMMEDIAEXIOREQTYPE_WRITE
4203 || u32 == PDMMEDIAEXIOREQTYPE_READ
4204 || u32 == PDMMEDIAEXIOREQTYPE_DISCARD
4205 || u32 == PDMMEDIAEXIOREQTYPE_FLUSH,
4206 VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
4207 pIoReq->enmType = (PDMMEDIAEXIOREQTYPE)u32;
4208
4209 SSMR3GetU32(pSSM, &u32);
4210 AssertReturn(u32 == pIoReq->uIoReqId, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
4211
4212 SSMR3GetU32(pSSM, &u32);
4213 AssertReturn(u32 == pIoReq->fFlags, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
4214
4215 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
4216 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
4217 {
4218 SSMR3GetU64(pSSM, &pIoReq->ReadWrite.offStart);
4219 SSMR3GetU64(pSSM, &u64);
4220 pIoReq->ReadWrite.cbReq = (size_t)u64;
4221 SSMR3GetU64(pSSM, &u64);
4222 pIoReq->ReadWrite.cbReqLeft = (size_t)u64;
4223
4224 /*
4225 * Try to allocate enough I/O buffer, if this fails for some reason put it onto the
4226 * waiting list instead of the redo list.
4227 */
4228 pIoReq->ReadWrite.cbIoBuf = 0;
4229 rc = IOBUFMgrAllocBuf(pThis->hIoBufMgr, &pIoReq->ReadWrite.IoBuf, pIoReq->ReadWrite.cbReqLeft,
4230 &pIoReq->ReadWrite.cbIoBuf);
4231 if (rc == VERR_NO_MEMORY)
4232 {
4233 pIoReq->enmState = VDIOREQSTATE_ALLOCATED;
4234 ASMAtomicIncU32(&pThis->cIoReqsWaiting);
4235 RTListAppend(&pThis->LstIoReqIoBufWait, &pIoReq->NdLstWait);
4236 fPlaceOnRedoList = false;
4237 rc = VINF_SUCCESS;
4238 }
4239 else
4240 {
4241 pIoReq->ReadWrite.fDirectBuf = false;
4242 pIoReq->ReadWrite.pSgBuf = &pIoReq->ReadWrite.IoBuf.SgBuf;
4243 }
4244 }
4245 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
4246 {
4247 rc = SSMR3GetU32(pSSM, &pIoReq->Discard.cRanges);
4248 if (RT_SUCCESS(rc))
4249 {
4250 pIoReq->Discard.paRanges = (PRTRANGE)RTMemAllocZ(pIoReq->Discard.cRanges * sizeof(RTRANGE));
4251 if (RT_LIKELY(pIoReq->Discard.paRanges))
4252 {
4253 for (unsigned i = 0; i < pIoReq->Discard.cRanges; i++)
4254 {
4255 SSMR3GetU64(pSSM, &pIoReq->Discard.paRanges[i].offStart);
4256 SSMR3GetU64(pSSM, &u64);
4257 pIoReq->Discard.paRanges[i].cbRange = (size_t)u64;
4258 }
4259 }
4260 else
4261 rc = VERR_NO_MEMORY;
4262 }
4263 }
4264
4265 if (RT_SUCCESS(rc))
4266 rc = SSMR3GetU32(pSSM, &u32); /* sanity/terminator */
4267 if (RT_SUCCESS(rc))
4268 AssertReturn(u32 == UINT32_MAX, VERR_SSM_DATA_UNIT_FORMAT_CHANGED);
4269 if ( RT_SUCCESS(rc)
4270 && fPlaceOnRedoList)
4271 {
4272 /* Mark as suspended */
4273 pIoReq->enmState = VDIOREQSTATE_SUSPENDED;
4274
4275 /* Link into suspended list so it gets kicked off again when we resume. */
4276 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4277 RTListAppend(&pThis->LstIoReqRedo, &pIoReq->NdLstWait);
4278 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4279 }
4280 }
4281
4282 return rc;
4283}
4284
4285/**
4286 * Loads all configured plugins.
4287 *
4288 * @returns VBox status code.
4289 * @param pCfg CFGM node holding plugin list.
4290 */
4291static int drvvdLoadPlugins(PCFGMNODE pCfg)
4292{
4293 PCFGMNODE pCfgPlugins = CFGMR3GetChild(pCfg, "Plugins");
4294
4295 if (pCfgPlugins)
4296 {
4297 PCFGMNODE pPluginCur = CFGMR3GetFirstChild(pCfgPlugins);
4298 while (pPluginCur)
4299 {
4300 int rc = VINF_SUCCESS;
4301 char *pszPluginFilename = NULL;
4302 rc = CFGMR3QueryStringAlloc(pPluginCur, "Path", &pszPluginFilename);
4303 if (RT_SUCCESS(rc))
4304 rc = VDPluginLoadFromFilename(pszPluginFilename);
4305
4306 if (RT_FAILURE(rc))
4307 LogRel(("VD: Failed to load plugin '%s' with %Rrc, continuing\n", pszPluginFilename, rc));
4308
4309 pPluginCur = CFGMR3GetNextChild(pPluginCur);
4310 }
4311 }
4312
4313 return VINF_SUCCESS;
4314}
4315
4316
4317/**
4318 * Sets up the disk filter chain.
4319 *
4320 * @returns VBox status code.
4321 * @param pThis The disk instance.
4322 * @param pCfg CFGM node holding the filter parameters.
4323 */
4324static int drvvdSetupFilters(PVBOXDISK pThis, PCFGMNODE pCfg)
4325{
4326 int rc = VINF_SUCCESS;
4327 PCFGMNODE pCfgFilter = CFGMR3GetChild(pCfg, "Filters");
4328
4329 if (pCfgFilter)
4330 {
4331 PCFGMNODE pCfgFilterConfig = CFGMR3GetChild(pCfgFilter, "VDConfig");
4332 char *pszFilterName = NULL;
4333 VDINTERFACECONFIG VDIfConfig;
4334 PVDINTERFACE pVDIfsFilter = NULL;
4335
4336 rc = CFGMR3QueryStringAlloc(pCfgFilter, "FilterName", &pszFilterName);
4337 if (RT_SUCCESS(rc))
4338 {
4339 VDIfConfig.pfnAreKeysValid = drvvdCfgAreKeysValid;
4340 VDIfConfig.pfnQuerySize = drvvdCfgQuerySize;
4341 VDIfConfig.pfnQuery = drvvdCfgQuery;
4342 VDIfConfig.pfnQueryBytes = drvvdCfgQueryBytes;
4343 rc = VDInterfaceAdd(&VDIfConfig.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
4344 pCfgFilterConfig, sizeof(VDINTERFACECONFIG), &pVDIfsFilter);
4345 AssertRC(rc);
4346
4347 rc = VDFilterAdd(pThis->pDisk, pszFilterName, VD_FILTER_FLAGS_DEFAULT, pVDIfsFilter);
4348
4349 MMR3HeapFree(pszFilterName);
4350 }
4351 }
4352
4353 return rc;
4354}
4355
4356
4357/**
4358 * Translates a PDMMEDIATYPE value into a string.
4359 *
4360 * @returns Read only string.
4361 * @param enmType The type value.
4362 */
4363static const char *drvvdGetTypeName(PDMMEDIATYPE enmType)
4364{
4365 switch (enmType)
4366 {
4367 case PDMMEDIATYPE_ERROR: return "ERROR";
4368 case PDMMEDIATYPE_FLOPPY_360: return "FLOPPY_360";
4369 case PDMMEDIATYPE_FLOPPY_720: return "FLOPPY_720";
4370 case PDMMEDIATYPE_FLOPPY_1_20: return "FLOPPY_1_20";
4371 case PDMMEDIATYPE_FLOPPY_1_44: return "FLOPPY_1_44";
4372 case PDMMEDIATYPE_FLOPPY_2_88: return "FLOPPY_2_88";
4373 case PDMMEDIATYPE_FLOPPY_FAKE_15_6: return "FLOPPY_FAKE_15_6";
4374 case PDMMEDIATYPE_FLOPPY_FAKE_63_5: return "FLOPPY_FAKE_63_5";
4375 case PDMMEDIATYPE_CDROM: return "CDROM";
4376 case PDMMEDIATYPE_DVD: return "DVD";
4377 case PDMMEDIATYPE_HARD_DISK: return "HARD_DISK";
4378 default: return "Unknown";
4379 }
4380}
4381
4382/**
4383 * Returns the appropriate PDMMEDIATYPE for t he given string.
4384 *
4385 * @returns PDMMEDIATYPE
4386 * @param pszType The string representation of the media type.
4387 */
4388static PDMMEDIATYPE drvvdGetMediaTypeFromString(const char *pszType)
4389{
4390 PDMMEDIATYPE enmType = PDMMEDIATYPE_ERROR;
4391
4392 if (!strcmp(pszType, "HardDisk"))
4393 enmType = PDMMEDIATYPE_HARD_DISK;
4394 else if (!strcmp(pszType, "DVD"))
4395 enmType = PDMMEDIATYPE_DVD;
4396 else if (!strcmp(pszType, "CDROM"))
4397 enmType = PDMMEDIATYPE_CDROM;
4398 else if (!strcmp(pszType, "Floppy 2.88"))
4399 enmType = PDMMEDIATYPE_FLOPPY_2_88;
4400 else if (!strcmp(pszType, "Floppy 1.44"))
4401 enmType = PDMMEDIATYPE_FLOPPY_1_44;
4402 else if (!strcmp(pszType, "Floppy 1.20"))
4403 enmType = PDMMEDIATYPE_FLOPPY_1_20;
4404 else if (!strcmp(pszType, "Floppy 720"))
4405 enmType = PDMMEDIATYPE_FLOPPY_720;
4406 else if (!strcmp(pszType, "Floppy 360"))
4407 enmType = PDMMEDIATYPE_FLOPPY_360;
4408 else if (!strcmp(pszType, "Floppy 15.6"))
4409 enmType = PDMMEDIATYPE_FLOPPY_FAKE_15_6;
4410 else if (!strcmp(pszType, "Floppy 63.5"))
4411 enmType = PDMMEDIATYPE_FLOPPY_FAKE_63_5;
4412
4413 return enmType;
4414}
4415
4416/**
4417 * Converts PDMMEDIATYPE to the appropriate VDTYPE.
4418 *
4419 * @returns The VDTYPE.
4420 * @param enmType The PDMMEDIATYPE to convert from.
4421 */
4422static VDTYPE drvvdGetVDFromMediaType(PDMMEDIATYPE enmType)
4423{
4424 if (PDMMEDIATYPE_IS_FLOPPY(enmType))
4425 return VDTYPE_FLOPPY;
4426 else if (enmType == PDMMEDIATYPE_DVD || enmType == PDMMEDIATYPE_CDROM)
4427 return VDTYPE_OPTICAL_DISC;
4428 else if (enmType == PDMMEDIATYPE_HARD_DISK)
4429 return VDTYPE_HDD;
4430
4431 AssertMsgFailed(("Invalid media type %d{%s} given!\n", enmType, drvvdGetTypeName(enmType)));
4432 return VDTYPE_HDD;
4433}
4434
4435/**
4436 * Registers statistics associated with the given media driver.
4437 *
4438 * @returns VBox status code.
4439 * @param pThis The media driver instance.
4440 */
4441static int drvvdStatsRegister(PVBOXDISK pThis)
4442{
4443 PPDMDRVINS pDrvIns = pThis->pDrvIns;
4444 uint32_t iInstance, iLUN;
4445 const char *pcszController;
4446
4447 int rc = pThis->pDrvMediaPort->pfnQueryDeviceLocation(pThis->pDrvMediaPort, &pcszController,
4448 &iInstance, &iLUN);
4449 if (RT_SUCCESS(rc))
4450 {
4451 char *pszCtrlUpper = RTStrDup(pcszController);
4452 if (pszCtrlUpper)
4453 {
4454 RTStrToUpper(pszCtrlUpper);
4455
4456 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatQueryBufAttempts, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS,
4457 STAMUNIT_COUNT, "Number of attempts to query a direct buffer.",
4458 "/Devices/%s%u/Port%u/QueryBufAttempts", pszCtrlUpper, iInstance, iLUN);
4459 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatQueryBufSuccess, STAMTYPE_COUNTER, STAMVISIBILITY_ALWAYS,
4460 STAMUNIT_COUNT, "Number of succeeded attempts to query a direct buffer.",
4461 "/Devices/%s%u/Port%u/QueryBufSuccess", pszCtrlUpper, iInstance, iLUN);
4462
4463 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatBytesRead, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_BYTES,
4464 "Amount of data read.", "/Devices/%s%u/Port%u/ReadBytes", pszCtrlUpper, iInstance, iLUN);
4465 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatBytesWritten, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_BYTES,
4466 "Amount of data written.", "/Devices/%s%u/Port%u/WrittenBytes", pszCtrlUpper, iInstance, iLUN);
4467
4468 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsSubmitted, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4469 "Number of I/O requests submitted.", "/Devices/%s%u/Port%u/ReqsSubmitted", pszCtrlUpper, iInstance, iLUN);
4470 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsFailed, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4471 "Number of I/O requests failed.", "/Devices/%s%u/Port%u/ReqsFailed", pszCtrlUpper, iInstance, iLUN);
4472 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsSucceeded, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4473 "Number of I/O requests succeeded.", "/Devices/%s%u/Port%u/ReqsSucceeded", pszCtrlUpper, iInstance, iLUN);
4474 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsFlush, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4475 "Number of flush I/O requests submitted.", "/Devices/%s%u/Port%u/ReqsFlush", pszCtrlUpper, iInstance, iLUN);
4476 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsWrite, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4477 "Number of write I/O requests submitted.", "/Devices/%s%u/Port%u/ReqsWrite", pszCtrlUpper, iInstance, iLUN);
4478 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsRead, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4479 "Number of read I/O requests submitted.", "/Devices/%s%u/Port%u/ReqsRead", pszCtrlUpper, iInstance, iLUN);
4480 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsDiscard, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_COUNT,
4481 "Number of discard I/O requests submitted.", "/Devices/%s%u/Port%u/ReqsDiscard", pszCtrlUpper, iInstance, iLUN);
4482
4483 PDMDrvHlpSTAMRegisterF(pDrvIns, &pThis->StatReqsPerSec, STAMTYPE_COUNTER, STAMVISIBILITY_USED, STAMUNIT_OCCURENCES,
4484 "Number of processed I/O requests per second.", "/Devices/%s%u/Port%u/ReqsPerSec",
4485 pszCtrlUpper, iInstance, iLUN);
4486
4487 RTStrFree(pszCtrlUpper);
4488 }
4489 else
4490 rc = VERR_NO_STR_MEMORY;
4491 }
4492
4493 return rc;
4494}
4495
4496/**
4497 * Deregisters statistics associated with the given media driver.
4498 *
4499 * @returns nothing.
4500 * @param pThis The media driver instance.
4501 */
4502static void drvvdStatsDeregister(PVBOXDISK pThis)
4503{
4504 PPDMDRVINS pDrvIns = pThis->pDrvIns;
4505
4506 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatQueryBufAttempts);
4507 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatQueryBufSuccess);
4508
4509 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatBytesRead);
4510 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatBytesWritten);
4511 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsSubmitted);
4512 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsFailed);
4513 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsSucceeded);
4514 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsFlush);
4515 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsWrite);
4516 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsRead);
4517 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsDiscard);
4518 PDMDrvHlpSTAMDeregister(pDrvIns, &pThis->StatReqsPerSec);
4519}
4520
4521
4522/*********************************************************************************************************************************
4523* Base interface methods *
4524*********************************************************************************************************************************/
4525
4526/**
4527 * @interface_method_impl{PDMIBASE,pfnQueryInterface}
4528 */
4529static DECLCALLBACK(void *) drvvdQueryInterface(PPDMIBASE pInterface, const char *pszIID)
4530{
4531 PPDMDRVINS pDrvIns = PDMIBASE_2_PDMDRV(pInterface);
4532 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4533
4534 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIBASE, &pDrvIns->IBase);
4535 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMEDIA, &pThis->IMedia);
4536 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMOUNT, pThis->fMountable ? &pThis->IMount : NULL);
4537 PDMIBASE_RETURN_INTERFACE(pszIID, PDMIMEDIAEX, pThis->pDrvMediaExPort ? &pThis->IMediaEx : NULL);
4538 return NULL;
4539}
4540
4541
4542/*********************************************************************************************************************************
4543* Saved state notification methods *
4544*********************************************************************************************************************************/
4545
4546/**
4547 * Load done callback for re-opening the image writable during teleportation.
4548 *
4549 * This is called both for successful and failed load runs, we only care about
4550 * successful ones.
4551 *
4552 * @returns VBox status code.
4553 * @param pDrvIns The driver instance.
4554 * @param pSSM The saved state handle.
4555 */
4556static DECLCALLBACK(int) drvvdLoadDone(PPDMDRVINS pDrvIns, PSSMHANDLE pSSM)
4557{
4558 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4559 Assert(!pThis->fErrorUseRuntime);
4560
4561 /* Drop out if we don't have any work to do or if it's a failed load. */
4562 if ( !pThis->fTempReadOnly
4563 || RT_FAILURE(SSMR3HandleGetStatus(pSSM)))
4564 return VINF_SUCCESS;
4565
4566 int rc = drvvdSetWritable(pThis);
4567 if (RT_FAILURE(rc)) /** @todo does the bugger set any errors? */
4568 return SSMR3SetLoadError(pSSM, rc, RT_SRC_POS,
4569 N_("Failed to write lock the images"));
4570 return VINF_SUCCESS;
4571}
4572
4573
4574/*********************************************************************************************************************************
4575* Driver methods *
4576*********************************************************************************************************************************/
4577
4578/**
4579 * Worker for the power off or destruct callback.
4580 *
4581 * @returns nothing.
4582 * @param pDrvIns The driver instance.
4583 */
4584static void drvvdPowerOffOrDestructOrUnmount(PPDMDRVINS pDrvIns)
4585{
4586 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4587 LogFlowFunc(("\n"));
4588
4589 RTSEMFASTMUTEX mutex;
4590 ASMAtomicXchgHandle(&pThis->MergeCompleteMutex, NIL_RTSEMFASTMUTEX, &mutex);
4591 if (mutex != NIL_RTSEMFASTMUTEX)
4592 {
4593 /* Request the semaphore to wait until a potentially running merge
4594 * operation has been finished. */
4595 int rc = RTSemFastMutexRequest(mutex);
4596 AssertRC(rc);
4597 pThis->fMergePending = false;
4598 rc = RTSemFastMutexRelease(mutex);
4599 AssertRC(rc);
4600 rc = RTSemFastMutexDestroy(mutex);
4601 AssertRC(rc);
4602 }
4603
4604 if (RT_VALID_PTR(pThis->pBlkCache))
4605 {
4606 PDMR3BlkCacheRelease(pThis->pBlkCache);
4607 pThis->pBlkCache = NULL;
4608 }
4609
4610 if (RT_VALID_PTR(pThis->pRegionList))
4611 {
4612 VDRegionListFree(pThis->pRegionList);
4613 pThis->pRegionList = NULL;
4614 }
4615
4616 if (RT_VALID_PTR(pThis->pDisk))
4617 {
4618 VDDestroy(pThis->pDisk);
4619 pThis->pDisk = NULL;
4620 }
4621 drvvdFreeImages(pThis);
4622}
4623
4624/**
4625 * @copydoc FNPDMDRVPOWEROFF
4626 */
4627static DECLCALLBACK(void) drvvdPowerOff(PPDMDRVINS pDrvIns)
4628{
4629 PDMDRV_CHECK_VERSIONS_RETURN_VOID(pDrvIns);
4630 drvvdPowerOffOrDestructOrUnmount(pDrvIns);
4631}
4632
4633/**
4634 * @callback_method_impl{FNPDMDRVRESUME}
4635 *
4636 * VM resume notification that we use to undo what the temporary read-only image
4637 * mode set by drvvdSuspend.
4638 *
4639 * Also switch to runtime error mode if we're resuming after a state load
4640 * without having been powered on first.
4641 *
4642 * @todo The VMSetError vs VMSetRuntimeError mess must be fixed elsewhere,
4643 * we're making assumptions about Main behavior here!
4644 */
4645static DECLCALLBACK(void) drvvdResume(PPDMDRVINS pDrvIns)
4646{
4647 LogFlowFunc(("\n"));
4648 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4649
4650 drvvdSetWritable(pThis);
4651 pThis->fErrorUseRuntime = true;
4652
4653 if (pThis->pBlkCache)
4654 {
4655 int rc = PDMR3BlkCacheResume(pThis->pBlkCache);
4656 AssertRC(rc);
4657 }
4658
4659 if (pThis->pDrvMediaExPort)
4660 {
4661 /* Kick of any request we have to redo. */
4662 PPDMMEDIAEXIOREQINT pIoReq, pIoReqNext;
4663 RTCritSectEnter(&pThis->CritSectIoReqRedo);
4664 RTListForEachSafe(&pThis->LstIoReqRedo, pIoReq, pIoReqNext, PDMMEDIAEXIOREQINT, NdLstWait)
4665 {
4666 int rc = VINF_SUCCESS;
4667 bool fXchg = ASMAtomicCmpXchgU32((volatile uint32_t *)&pIoReq->enmState, VDIOREQSTATE_ACTIVE, VDIOREQSTATE_SUSPENDED);
4668
4669 RTListNodeRemove(&pIoReq->NdLstWait);
4670 ASMAtomicIncU32(&pThis->cIoReqsActive);
4671
4672 if (fXchg)
4673 {
4674 pThis->pDrvMediaExPort->pfnIoReqStateChanged(pThis->pDrvMediaExPort, pIoReq, &pIoReq->abAlloc[0],
4675 PDMMEDIAEXIOREQSTATE_ACTIVE);
4676 if ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_READ
4677 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_WRITE)
4678 rc = drvvdMediaExIoReqReadWriteProcess(pThis, pIoReq, true /* fUpNotify */);
4679 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH)
4680 {
4681 rc = drvvdMediaExIoReqFlushWrapper(pThis, pIoReq);
4682 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4683 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
4684 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
4685 rc = VINF_SUCCESS;
4686 }
4687 else if (pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD)
4688 {
4689 rc = drvvdMediaExIoReqDiscardWrapper(pThis, pIoReq);
4690 if (rc == VERR_VD_ASYNC_IO_IN_PROGRESS)
4691 rc = VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS;
4692 else if (rc == VINF_VD_ASYNC_IO_FINISHED)
4693 rc = VINF_SUCCESS;
4694 }
4695 else
4696 AssertMsgFailed(("Invalid request type %u\n", pIoReq->enmType));
4697
4698 /* The read write process will call the completion callback on its own. */
4699 if ( rc != VINF_PDM_MEDIAEX_IOREQ_IN_PROGRESS
4700 && ( pIoReq->enmType == PDMMEDIAEXIOREQTYPE_DISCARD
4701 || pIoReq->enmType == PDMMEDIAEXIOREQTYPE_FLUSH))
4702 {
4703 Assert( ( pIoReq->enmType != PDMMEDIAEXIOREQTYPE_WRITE
4704 && pIoReq->enmType != PDMMEDIAEXIOREQTYPE_READ)
4705 || !pIoReq->ReadWrite.cbReqLeft
4706 || RT_FAILURE(rc));
4707 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, rc, true /* fUpNotify */);
4708 }
4709
4710 }
4711 else
4712 {
4713 /* Request was canceled inbetween, so don't care and notify the owner about the completed request. */
4714 Assert(pIoReq->enmState == VDIOREQSTATE_CANCELED);
4715 drvvdMediaExIoReqCompleteWorker(pThis, pIoReq, VERR_PDM_MEDIAEX_IOREQ_CANCELED, true /* fUpNotify */);
4716 }
4717 }
4718 Assert(RTListIsEmpty(&pThis->LstIoReqRedo));
4719 RTCritSectLeave(&pThis->CritSectIoReqRedo);
4720 }
4721}
4722
4723/**
4724 * @callback_method_impl{FNPDMDRVSUSPEND}
4725 *
4726 * When the VM is being suspended, temporarily change to read-only image mode.
4727 *
4728 * This is important for several reasons:
4729 * -# It makes sure that there are no pending writes to the image. Most
4730 * backends implements this by closing and reopening the image in read-only
4731 * mode.
4732 * -# It allows Main to read the images during snapshotting without having
4733 * to account for concurrent writes.
4734 * -# This is essential for making teleportation targets sharing images work
4735 * right. Both with regards to caching and with regards to file sharing
4736 * locks (RTFILE_O_DENY_*). (See also drvvdLoadDone.)
4737 */
4738static DECLCALLBACK(void) drvvdSuspend(PPDMDRVINS pDrvIns)
4739{
4740 LogFlowFunc(("\n"));
4741 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4742
4743 if (pThis->pBlkCache)
4744 {
4745 int rc = PDMR3BlkCacheSuspend(pThis->pBlkCache);
4746 AssertRC(rc);
4747 }
4748
4749 drvvdSetReadonly(pThis);
4750}
4751
4752/**
4753 * @callback_method_impl{FNPDMDRVPOWERON}
4754 */
4755static DECLCALLBACK(void) drvvdPowerOn(PPDMDRVINS pDrvIns)
4756{
4757 LogFlowFunc(("\n"));
4758 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4759 drvvdSetWritable(pThis);
4760 pThis->fErrorUseRuntime = true;
4761}
4762
4763/**
4764 * @callback_method_impl{FNPDMDRVRESET}
4765 */
4766static DECLCALLBACK(void) drvvdReset(PPDMDRVINS pDrvIns)
4767{
4768 LogFlowFunc(("\n"));
4769 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4770
4771 if (pThis->pBlkCache)
4772 {
4773 int rc = PDMR3BlkCacheClear(pThis->pBlkCache);
4774 AssertRC(rc);
4775 }
4776
4777 if (pThis->fBootAccelEnabled)
4778 {
4779 pThis->fBootAccelActive = true;
4780 pThis->cbDataValid = 0;
4781 pThis->offDisk = 0;
4782 }
4783}
4784
4785/**
4786 * @callback_method_impl{FNPDMDRVDESTRUCT}
4787 */
4788static DECLCALLBACK(void) drvvdDestruct(PPDMDRVINS pDrvIns)
4789{
4790 PDMDRV_CHECK_VERSIONS_RETURN_VOID(pDrvIns);
4791 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4792 LogFlowFunc(("\n"));
4793
4794 /*
4795 * Make sure the block cache and disks are closed when this driver is
4796 * destroyed. This method will get called without calling the power off
4797 * callback first when we reconfigure the driver chain after a snapshot.
4798 */
4799 drvvdPowerOffOrDestructOrUnmount(pDrvIns);
4800 if (pThis->MergeLock != NIL_RTSEMRW)
4801 {
4802 int rc = RTSemRWDestroy(pThis->MergeLock);
4803 AssertRC(rc);
4804 pThis->MergeLock = NIL_RTSEMRW;
4805 }
4806 if (pThis->pbData)
4807 {
4808 RTMemFree(pThis->pbData);
4809 pThis->pbData = NULL;
4810 }
4811 if (pThis->pszBwGroup)
4812 {
4813 MMR3HeapFree(pThis->pszBwGroup);
4814 pThis->pszBwGroup = NULL;
4815 }
4816 if (pThis->hHbdMgr != NIL_HBDMGR)
4817 HBDMgrDestroy(pThis->hHbdMgr);
4818 if (pThis->hIoReqCache != NIL_RTMEMCACHE)
4819 RTMemCacheDestroy(pThis->hIoReqCache);
4820 if (pThis->hIoBufMgr != NIL_IOBUFMGR)
4821 IOBUFMgrDestroy(pThis->hIoBufMgr);
4822 if (RTCritSectIsInitialized(&pThis->CritSectIoReqsIoBufWait))
4823 RTCritSectDelete(&pThis->CritSectIoReqsIoBufWait);
4824 if (RTCritSectIsInitialized(&pThis->CritSectIoReqRedo))
4825 RTCritSectDelete(&pThis->CritSectIoReqRedo);
4826 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4827 if (pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc != NIL_RTSEMFASTMUTEX)
4828 RTSemFastMutexDestroy(pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc);
4829
4830 drvvdStatsDeregister(pThis);
4831}
4832
4833/**
4834 * @callback_method_impl{FNPDMDRVCONSTRUCT,
4835 * Construct a VBox disk media driver instance.}
4836 */
4837static DECLCALLBACK(int) drvvdConstruct(PPDMDRVINS pDrvIns, PCFGMNODE pCfg, uint32_t fFlags)
4838{
4839 RT_NOREF(fFlags);
4840 LogFlowFunc(("\n"));
4841 PDMDRV_CHECK_VERSIONS_RETURN(pDrvIns);
4842 PVBOXDISK pThis = PDMINS_2_DATA(pDrvIns, PVBOXDISK);
4843 int rc = VINF_SUCCESS;
4844 char *pszName = NULL; /* The path of the disk image file. */
4845 char *pszFormat = NULL; /* The format backed to use for this image. */
4846 char *pszCachePath = NULL; /* The path to the cache image. */
4847 char *pszCacheFormat = NULL; /* The format backend to use for the cache image. */
4848 bool fReadOnly = false; /* True if the media is read-only. */
4849 bool fMaybeReadOnly = false; /* True if the media may or may not be read-only. */
4850 bool fHonorZeroWrites = false; /* True if zero blocks should be written. */
4851
4852 /*
4853 * Init the static parts.
4854 */
4855 pDrvIns->IBase.pfnQueryInterface = drvvdQueryInterface;
4856 pThis->pDrvIns = pDrvIns;
4857 pThis->fTempReadOnly = false;
4858 pThis->pDisk = NULL;
4859 pThis->fAsyncIOSupported = false;
4860 pThis->fShareable = false;
4861 pThis->fMergePending = false;
4862 pThis->MergeCompleteMutex = NIL_RTSEMFASTMUTEX;
4863 pThis->MergeLock = NIL_RTSEMRW;
4864 pThis->uMergeSource = VD_LAST_IMAGE;
4865 pThis->uMergeTarget = VD_LAST_IMAGE;
4866 pThis->pCfgCrypto = NULL;
4867 pThis->pIfSecKey = NULL;
4868 pThis->hIoReqCache = NIL_RTMEMCACHE;
4869 pThis->hIoBufMgr = NIL_IOBUFMGR;
4870 pThis->pRegionList = NULL;
4871
4872 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4873 pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc = NIL_RTSEMFASTMUTEX;
4874
4875 /* IMedia */
4876 pThis->IMedia.pfnRead = drvvdRead;
4877 pThis->IMedia.pfnReadPcBios = drvvdReadPcBios;
4878 pThis->IMedia.pfnWrite = drvvdWrite;
4879 pThis->IMedia.pfnFlush = drvvdFlush;
4880 pThis->IMedia.pfnMerge = drvvdMerge;
4881 pThis->IMedia.pfnSetSecKeyIf = drvvdSetSecKeyIf;
4882 pThis->IMedia.pfnGetSize = drvvdGetSize;
4883 pThis->IMedia.pfnGetSectorSize = drvvdGetSectorSize;
4884 pThis->IMedia.pfnIsReadOnly = drvvdIsReadOnly;
4885 pThis->IMedia.pfnIsNonRotational = drvvdIsNonRotational;
4886 pThis->IMedia.pfnBiosGetPCHSGeometry = drvvdBiosGetPCHSGeometry;
4887 pThis->IMedia.pfnBiosSetPCHSGeometry = drvvdBiosSetPCHSGeometry;
4888 pThis->IMedia.pfnBiosGetLCHSGeometry = drvvdBiosGetLCHSGeometry;
4889 pThis->IMedia.pfnBiosSetLCHSGeometry = drvvdBiosSetLCHSGeometry;
4890 pThis->IMedia.pfnBiosIsVisible = drvvdBiosIsVisible;
4891 pThis->IMedia.pfnGetType = drvvdGetType;
4892 pThis->IMedia.pfnGetUuid = drvvdGetUuid;
4893 pThis->IMedia.pfnDiscard = drvvdDiscard;
4894 pThis->IMedia.pfnSendCmd = NULL;
4895 pThis->IMedia.pfnGetRegionCount = drvvdGetRegionCount;
4896 pThis->IMedia.pfnQueryRegionProperties = drvvdQueryRegionProperties;
4897 pThis->IMedia.pfnQueryRegionPropertiesForLba = drvvdQueryRegionPropertiesForLba;
4898
4899 /* IMount */
4900 pThis->IMount.pfnUnmount = drvvdUnmount;
4901 pThis->IMount.pfnIsMounted = drvvdIsMounted;
4902 pThis->IMount.pfnLock = drvvdLock;
4903 pThis->IMount.pfnUnlock = drvvdUnlock;
4904 pThis->IMount.pfnIsLocked = drvvdIsLocked;
4905
4906 /* IMediaEx */
4907 pThis->IMediaEx.pfnQueryFeatures = drvvdQueryFeatures;
4908 pThis->IMediaEx.pfnIoReqAllocSizeSet = drvvdIoReqAllocSizeSet;
4909 pThis->IMediaEx.pfnIoReqAlloc = drvvdIoReqAlloc;
4910 pThis->IMediaEx.pfnIoReqFree = drvvdIoReqFree;
4911 pThis->IMediaEx.pfnIoReqQueryResidual = drvvdIoReqQueryResidual;
4912 pThis->IMediaEx.pfnIoReqQueryXferSize = drvvdIoReqQueryXferSize;
4913 pThis->IMediaEx.pfnIoReqCancelAll = drvvdIoReqCancelAll;
4914 pThis->IMediaEx.pfnIoReqCancel = drvvdIoReqCancel;
4915 pThis->IMediaEx.pfnIoReqRead = drvvdIoReqRead;
4916 pThis->IMediaEx.pfnIoReqWrite = drvvdIoReqWrite;
4917 pThis->IMediaEx.pfnIoReqFlush = drvvdIoReqFlush;
4918 pThis->IMediaEx.pfnIoReqDiscard = drvvdIoReqDiscard;
4919 pThis->IMediaEx.pfnIoReqSendScsiCmd = drvvdIoReqSendScsiCmd;
4920 pThis->IMediaEx.pfnIoReqGetActiveCount = drvvdIoReqGetActiveCount;
4921 pThis->IMediaEx.pfnIoReqGetSuspendedCount = drvvdIoReqGetSuspendedCount;
4922 pThis->IMediaEx.pfnIoReqQuerySuspendedStart = drvvdIoReqQuerySuspendedStart;
4923 pThis->IMediaEx.pfnIoReqQuerySuspendedNext = drvvdIoReqQuerySuspendedNext;
4924 pThis->IMediaEx.pfnIoReqSuspendedSave = drvvdIoReqSuspendedSave;
4925 pThis->IMediaEx.pfnIoReqSuspendedLoad = drvvdIoReqSuspendedLoad;
4926
4927 /* Initialize supported VD interfaces. */
4928 pThis->pVDIfsDisk = NULL;
4929
4930 pThis->VDIfError.pfnError = drvvdErrorCallback;
4931 pThis->VDIfError.pfnMessage = NULL;
4932 rc = VDInterfaceAdd(&pThis->VDIfError.Core, "DrvVD_VDIError", VDINTERFACETYPE_ERROR,
4933 pDrvIns, sizeof(VDINTERFACEERROR), &pThis->pVDIfsDisk);
4934 AssertRC(rc);
4935
4936 /* List of images is empty now. */
4937 pThis->pImages = NULL;
4938
4939 pThis->pDrvMediaPort = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMEDIAPORT);
4940 if (!pThis->pDrvMediaPort)
4941 return PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_MISSING_INTERFACE_ABOVE,
4942 N_("No media port interface above"));
4943
4944 pThis->pDrvMountNotify = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMOUNTNOTIFY);
4945
4946 /*
4947 * Try to attach the optional extended media interface port above and initialize associated
4948 * structures if available.
4949 */
4950 pThis->pDrvMediaExPort = PDMIBASE_QUERY_INTERFACE(pDrvIns->pUpBase, PDMIMEDIAEXPORT);
4951 if (pThis->pDrvMediaExPort)
4952 {
4953 for (unsigned i = 0; i < RT_ELEMENTS(pThis->aIoReqAllocBins); i++)
4954 {
4955 rc = RTSemFastMutexCreate(&pThis->aIoReqAllocBins[i].hMtxLstIoReqAlloc);
4956 if (RT_FAILURE(rc))
4957 break;
4958 RTListInit(&pThis->aIoReqAllocBins[i].LstIoReqAlloc);
4959 }
4960
4961 if (RT_SUCCESS(rc))
4962 rc = RTCritSectInit(&pThis->CritSectIoReqsIoBufWait);
4963
4964 if (RT_SUCCESS(rc))
4965 rc = RTCritSectInit(&pThis->CritSectIoReqRedo);
4966
4967 if (RT_FAILURE(rc))
4968 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Creating Mutex failed"));
4969
4970 RTListInit(&pThis->LstIoReqIoBufWait);
4971 RTListInit(&pThis->LstIoReqRedo);
4972 }
4973
4974 /* Before we access any VD API load all given plugins. */
4975 rc = drvvdLoadPlugins(pCfg);
4976 if (RT_FAILURE(rc))
4977 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Loading VD plugins failed"));
4978
4979 /*
4980 * Validate configuration and find all parent images.
4981 * It's sort of up side down from the image dependency tree.
4982 */
4983 bool fHostIP = false;
4984 bool fUseNewIo = false;
4985 bool fUseBlockCache = false;
4986 bool fDiscard = false;
4987 bool fInformAboutZeroBlocks = false;
4988 bool fSkipConsistencyChecks = false;
4989 bool fEmptyDrive = false;
4990 unsigned iLevel = 0;
4991 PCFGMNODE pCurNode = pCfg;
4992 uint32_t cbIoBufMax = 0;
4993
4994 for (;;)
4995 {
4996 bool fValid;
4997
4998 if (pCurNode == pCfg)
4999 {
5000 /* Toplevel configuration additionally contains the global image
5001 * open flags. Some might be converted to per-image flags later. */
5002 fValid = CFGMR3AreValuesValid(pCurNode,
5003 "Format\0Path\0"
5004 "ReadOnly\0MaybeReadOnly\0TempReadOnly\0Shareable\0HonorZeroWrites\0"
5005 "HostIPStack\0UseNewIo\0BootAcceleration\0BootAccelerationBuffer\0"
5006 "SetupMerge\0MergeSource\0MergeTarget\0BwGroup\0Type\0BlockCache\0"
5007 "CachePath\0CacheFormat\0Discard\0InformAboutZeroBlocks\0"
5008 "SkipConsistencyChecks\0"
5009 "Locked\0BIOSVisible\0Cylinders\0Heads\0Sectors\0Mountable\0"
5010 "EmptyDrive\0IoBufMax\0NonRotationalMedium\0"
5011#if defined(VBOX_PERIODIC_FLUSH) || defined(VBOX_IGNORE_FLUSH)
5012 "FlushInterval\0IgnoreFlush\0IgnoreFlushAsync\0"
5013#endif /* !(VBOX_PERIODIC_FLUSH || VBOX_IGNORE_FLUSH) */
5014 );
5015 }
5016 else
5017 {
5018 /* All other image configurations only contain image name and
5019 * the format information. */
5020 fValid = CFGMR3AreValuesValid(pCurNode, "Format\0Path\0"
5021 "MergeSource\0MergeTarget\0");
5022 }
5023 if (!fValid)
5024 {
5025 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5026 RT_SRC_POS, N_("DrvVD: Configuration error: keys incorrect at level %d"), iLevel);
5027 break;
5028 }
5029
5030 if (pCurNode == pCfg)
5031 {
5032 rc = CFGMR3QueryBoolDef(pCurNode, "HostIPStack", &fHostIP, true);
5033 if (RT_FAILURE(rc))
5034 {
5035 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5036 N_("DrvVD: Configuration error: Querying \"HostIPStack\" as boolean failed"));
5037 break;
5038 }
5039
5040 rc = CFGMR3QueryBoolDef(pCurNode, "HonorZeroWrites", &fHonorZeroWrites, false);
5041 if (RT_FAILURE(rc))
5042 {
5043 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5044 N_("DrvVD: Configuration error: Querying \"HonorZeroWrites\" as boolean failed"));
5045 break;
5046 }
5047
5048 rc = CFGMR3QueryBoolDef(pCurNode, "ReadOnly", &fReadOnly, false);
5049 if (RT_FAILURE(rc))
5050 {
5051 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5052 N_("DrvVD: Configuration error: Querying \"ReadOnly\" as boolean failed"));
5053 break;
5054 }
5055
5056 rc = CFGMR3QueryBoolDef(pCurNode, "MaybeReadOnly", &fMaybeReadOnly, false);
5057 if (RT_FAILURE(rc))
5058 {
5059 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5060 N_("DrvVD: Configuration error: Querying \"MaybeReadOnly\" as boolean failed"));
5061 break;
5062 }
5063
5064 rc = CFGMR3QueryBoolDef(pCurNode, "TempReadOnly", &pThis->fTempReadOnly, false);
5065 if (RT_FAILURE(rc))
5066 {
5067 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5068 N_("DrvVD: Configuration error: Querying \"TempReadOnly\" as boolean failed"));
5069 break;
5070 }
5071 if (fReadOnly && pThis->fTempReadOnly)
5072 {
5073 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5074 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"TempReadOnly\" are set"));
5075 break;
5076 }
5077
5078 rc = CFGMR3QueryBoolDef(pCurNode, "Shareable", &pThis->fShareable, false);
5079 if (RT_FAILURE(rc))
5080 {
5081 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5082 N_("DrvVD: Configuration error: Querying \"Shareable\" as boolean failed"));
5083 break;
5084 }
5085
5086 rc = CFGMR3QueryBoolDef(pCurNode, "UseNewIo", &fUseNewIo, false);
5087 if (RT_FAILURE(rc))
5088 {
5089 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5090 N_("DrvVD: Configuration error: Querying \"UseNewIo\" as boolean failed"));
5091 break;
5092 }
5093 rc = CFGMR3QueryBoolDef(pCurNode, "SetupMerge", &pThis->fMergePending, false);
5094 if (RT_FAILURE(rc))
5095 {
5096 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5097 N_("DrvVD: Configuration error: Querying \"SetupMerge\" as boolean failed"));
5098 break;
5099 }
5100 if (fReadOnly && pThis->fMergePending)
5101 {
5102 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5103 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"MergePending\" are set"));
5104 break;
5105 }
5106 rc = CFGMR3QueryBoolDef(pCurNode, "BootAcceleration", &pThis->fBootAccelEnabled, false);
5107 if (RT_FAILURE(rc))
5108 {
5109 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5110 N_("DrvVD: Configuration error: Querying \"BootAcceleration\" as boolean failed"));
5111 break;
5112 }
5113 rc = CFGMR3QueryU32Def(pCurNode, "BootAccelerationBuffer", (uint32_t *)&pThis->cbBootAccelBuffer, 16 * _1K);
5114 if (RT_FAILURE(rc))
5115 {
5116 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5117 N_("DrvVD: Configuration error: Querying \"BootAccelerationBuffer\" as integer failed"));
5118 break;
5119 }
5120 rc = CFGMR3QueryBoolDef(pCurNode, "BlockCache", &fUseBlockCache, false);
5121 if (RT_FAILURE(rc))
5122 {
5123 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5124 N_("DrvVD: Configuration error: Querying \"BlockCache\" as boolean failed"));
5125 break;
5126 }
5127 rc = CFGMR3QueryStringAlloc(pCurNode, "BwGroup", &pThis->pszBwGroup);
5128 if (RT_FAILURE(rc) && rc != VERR_CFGM_VALUE_NOT_FOUND)
5129 {
5130 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5131 N_("DrvVD: Configuration error: Querying \"BwGroup\" as string failed"));
5132 break;
5133 }
5134 else
5135 rc = VINF_SUCCESS;
5136 rc = CFGMR3QueryBoolDef(pCurNode, "Discard", &fDiscard, false);
5137 if (RT_FAILURE(rc))
5138 {
5139 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5140 N_("DrvVD: Configuration error: Querying \"Discard\" as boolean failed"));
5141 break;
5142 }
5143 if (fReadOnly && fDiscard)
5144 {
5145 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5146 N_("DrvVD: Configuration error: Both \"ReadOnly\" and \"Discard\" are set"));
5147 break;
5148 }
5149 rc = CFGMR3QueryBoolDef(pCurNode, "InformAboutZeroBlocks", &fInformAboutZeroBlocks, false);
5150 if (RT_FAILURE(rc))
5151 {
5152 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5153 N_("DrvVD: Configuration error: Querying \"InformAboutZeroBlocks\" as boolean failed"));
5154 break;
5155 }
5156 rc = CFGMR3QueryBoolDef(pCurNode, "SkipConsistencyChecks", &fSkipConsistencyChecks, true);
5157 if (RT_FAILURE(rc))
5158 {
5159 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5160 N_("DrvVD: Configuration error: Querying \"SKipConsistencyChecks\" as boolean failed"));
5161 break;
5162 }
5163
5164 char *psz = NULL;
5165 rc = CFGMR3QueryStringAlloc(pCfg, "Type", &psz);
5166 if (RT_FAILURE(rc))
5167 return PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_BLOCK_NO_TYPE, N_("Failed to obtain the sub type"));
5168 pThis->enmType = drvvdGetMediaTypeFromString(psz);
5169 if (pThis->enmType == PDMMEDIATYPE_ERROR)
5170 {
5171 PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_BLOCK_UNKNOWN_TYPE, RT_SRC_POS,
5172 N_("Unknown type \"%s\""), psz);
5173 MMR3HeapFree(psz);
5174 return VERR_PDM_BLOCK_UNKNOWN_TYPE;
5175 }
5176 MMR3HeapFree(psz); psz = NULL;
5177
5178 rc = CFGMR3QueryStringAlloc(pCurNode, "CachePath", &pszCachePath);
5179 if (RT_FAILURE(rc) && rc != VERR_CFGM_VALUE_NOT_FOUND)
5180 {
5181 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5182 N_("DrvVD: Configuration error: Querying \"CachePath\" as string failed"));
5183 break;
5184 }
5185 else
5186 rc = VINF_SUCCESS;
5187
5188 if (pszCachePath)
5189 {
5190 rc = CFGMR3QueryStringAlloc(pCurNode, "CacheFormat", &pszCacheFormat);
5191 if (RT_FAILURE(rc))
5192 {
5193 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5194 N_("DrvVD: Configuration error: Querying \"CacheFormat\" as string failed"));
5195 break;
5196 }
5197 }
5198
5199 /* Mountable */
5200 rc = CFGMR3QueryBoolDef(pCfg, "Mountable", &pThis->fMountable, false);
5201 if (RT_FAILURE(rc))
5202 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Mountable\" from the config"));
5203
5204 /* Locked */
5205 rc = CFGMR3QueryBoolDef(pCfg, "Locked", &pThis->fLocked, false);
5206 if (RT_FAILURE(rc))
5207 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Locked\" from the config"));
5208
5209 /* BIOS visible */
5210 rc = CFGMR3QueryBoolDef(pCfg, "BIOSVisible", &pThis->fBiosVisible, true);
5211 if (RT_FAILURE(rc))
5212 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"BIOSVisible\" from the config"));
5213
5214 /* Cylinders */
5215 rc = CFGMR3QueryU32Def(pCfg, "Cylinders", &pThis->LCHSGeometry.cCylinders, 0);
5216 if (RT_FAILURE(rc))
5217 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Cylinders\" from the config"));
5218
5219 /* Heads */
5220 rc = CFGMR3QueryU32Def(pCfg, "Heads", &pThis->LCHSGeometry.cHeads, 0);
5221 if (RT_FAILURE(rc))
5222 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Heads\" from the config"));
5223
5224 /* Sectors */
5225 rc = CFGMR3QueryU32Def(pCfg, "Sectors", &pThis->LCHSGeometry.cSectors, 0);
5226 if (RT_FAILURE(rc))
5227 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Sectors\" from the config"));
5228
5229 /* Uuid */
5230 rc = CFGMR3QueryStringAlloc(pCfg, "Uuid", &psz);
5231 if (rc == VERR_CFGM_VALUE_NOT_FOUND)
5232 RTUuidClear(&pThis->Uuid);
5233 else if (RT_SUCCESS(rc))
5234 {
5235 rc = RTUuidFromStr(&pThis->Uuid, psz);
5236 if (RT_FAILURE(rc))
5237 {
5238 PDMDrvHlpVMSetError(pDrvIns, rc, RT_SRC_POS, N_("Uuid from string failed on \"%s\""), psz);
5239 MMR3HeapFree(psz);
5240 return rc;
5241 }
5242 MMR3HeapFree(psz); psz = NULL;
5243 }
5244 else
5245 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"Uuid\" from the config"));
5246
5247#ifdef VBOX_PERIODIC_FLUSH
5248 rc = CFGMR3QueryU32Def(pCfg, "FlushInterval", &pThis->cbFlushInterval, 0);
5249 if (RT_FAILURE(rc))
5250 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"FlushInterval\" from the config"));
5251#endif /* VBOX_PERIODIC_FLUSH */
5252
5253#ifdef VBOX_IGNORE_FLUSH
5254 rc = CFGMR3QueryBoolDef(pCfg, "IgnoreFlush", &pThis->fIgnoreFlush, true);
5255 if (RT_FAILURE(rc))
5256 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IgnoreFlush\" from the config"));
5257
5258 if (pThis->fIgnoreFlush)
5259 LogRel(("DrvVD: Flushes will be ignored\n"));
5260 else
5261 LogRel(("DrvVD: Flushes will be passed to the disk\n"));
5262
5263 rc = CFGMR3QueryBoolDef(pCfg, "IgnoreFlushAsync", &pThis->fIgnoreFlushAsync, false);
5264 if (RT_FAILURE(rc))
5265 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IgnoreFlushAsync\" from the config"));
5266
5267 if (pThis->fIgnoreFlushAsync)
5268 LogRel(("DrvVD: Async flushes will be ignored\n"));
5269 else
5270 LogRel(("DrvVD: Async flushes will be passed to the disk\n"));
5271#endif /* VBOX_IGNORE_FLUSH */
5272
5273 rc = CFGMR3QueryBoolDef(pCurNode, "EmptyDrive", &fEmptyDrive, false);
5274 if (RT_FAILURE(rc))
5275 {
5276 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5277 N_("DrvVD: Configuration error: Querying \"EmptyDrive\" as boolean failed"));
5278 break;
5279 }
5280
5281 rc = CFGMR3QueryU32Def(pCfg, "IoBufMax", &cbIoBufMax, 5 * _1M);
5282 if (RT_FAILURE(rc))
5283 return PDMDRV_SET_ERROR(pDrvIns, rc, N_("Failed to query \"IoBufMax\" from the config"));
5284
5285 rc = CFGMR3QueryBoolDef(pCfg, "NonRotationalMedium", &pThis->fNonRotational, false);
5286 if (RT_FAILURE(rc))
5287 return PDMDRV_SET_ERROR(pDrvIns, rc,
5288 N_("DrvVD configuration error: Querying \"NonRotationalMedium\" as boolean failed"));
5289 }
5290
5291 PCFGMNODE pParent = CFGMR3GetChild(pCurNode, "Parent");
5292 if (!pParent)
5293 break;
5294 pCurNode = pParent;
5295 iLevel++;
5296 }
5297
5298 if (pThis->pDrvMediaExPort)
5299 rc = IOBUFMgrCreate(&pThis->hIoBufMgr, cbIoBufMax, pThis->pCfgCrypto ? IOBUFMGR_F_REQUIRE_NOT_PAGABLE : IOBUFMGR_F_DEFAULT);
5300
5301 if ( !fEmptyDrive
5302 && RT_SUCCESS(rc))
5303 {
5304 /*
5305 * Create the image container and the necessary interfaces.
5306 */
5307 if (RT_SUCCESS(rc))
5308 {
5309 /*
5310 * The image has a bandwidth group but the host cache is enabled.
5311 * Use the async I/O framework but tell it to enable the host cache.
5312 */
5313 if (!fUseNewIo && pThis->pszBwGroup)
5314 {
5315 pThis->fAsyncIoWithHostCache = true;
5316 fUseNewIo = true;
5317 }
5318
5319 /** @todo quick hack to work around problems in the async I/O
5320 * implementation (rw semaphore thread ownership problem)
5321 * while a merge is running. Remove once this is fixed. */
5322 if (pThis->fMergePending)
5323 fUseNewIo = false;
5324
5325 if (RT_SUCCESS(rc) && pThis->fMergePending)
5326 {
5327 rc = RTSemFastMutexCreate(&pThis->MergeCompleteMutex);
5328 if (RT_SUCCESS(rc))
5329 rc = RTSemRWCreate(&pThis->MergeLock);
5330 if (RT_SUCCESS(rc))
5331 {
5332 pThis->VDIfThreadSync.pfnStartRead = drvvdThreadStartRead;
5333 pThis->VDIfThreadSync.pfnFinishRead = drvvdThreadFinishRead;
5334 pThis->VDIfThreadSync.pfnStartWrite = drvvdThreadStartWrite;
5335 pThis->VDIfThreadSync.pfnFinishWrite = drvvdThreadFinishWrite;
5336
5337 rc = VDInterfaceAdd(&pThis->VDIfThreadSync.Core, "DrvVD_ThreadSync", VDINTERFACETYPE_THREADSYNC,
5338 pThis, sizeof(VDINTERFACETHREADSYNC), &pThis->pVDIfsDisk);
5339 }
5340 else
5341 {
5342 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5343 N_("DrvVD: Failed to create semaphores for \"MergePending\""));
5344 }
5345 }
5346
5347 if (RT_SUCCESS(rc))
5348 {
5349 rc = VDCreate(pThis->pVDIfsDisk, drvvdGetVDFromMediaType(pThis->enmType), &pThis->pDisk);
5350 /* Error message is already set correctly. */
5351 }
5352 }
5353
5354 if (pThis->pDrvMediaExPort && fUseNewIo)
5355 pThis->fAsyncIOSupported = true;
5356
5357 uint64_t tsStart = RTTimeNanoTS();
5358
5359 unsigned iImageIdx = 0;
5360 while (pCurNode && RT_SUCCESS(rc))
5361 {
5362 /* Allocate per-image data. */
5363 PVBOXIMAGE pImage = drvvdNewImage(pThis);
5364 if (!pImage)
5365 {
5366 rc = VERR_NO_MEMORY;
5367 break;
5368 }
5369
5370 /*
5371 * Read the image configuration.
5372 */
5373 rc = CFGMR3QueryStringAlloc(pCurNode, "Path", &pszName);
5374 if (RT_FAILURE(rc))
5375 {
5376 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5377 N_("DrvVD: Configuration error: Querying \"Path\" as string failed"));
5378 break;
5379 }
5380
5381 rc = CFGMR3QueryStringAlloc(pCurNode, "Format", &pszFormat);
5382 if (RT_FAILURE(rc))
5383 {
5384 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5385 N_("DrvVD: Configuration error: Querying \"Format\" as string failed"));
5386 break;
5387 }
5388
5389 bool fMergeSource;
5390 rc = CFGMR3QueryBoolDef(pCurNode, "MergeSource", &fMergeSource, false);
5391 if (RT_FAILURE(rc))
5392 {
5393 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5394 N_("DrvVD: Configuration error: Querying \"MergeSource\" as boolean failed"));
5395 break;
5396 }
5397 if (fMergeSource)
5398 {
5399 if (pThis->uMergeSource == VD_LAST_IMAGE)
5400 pThis->uMergeSource = iImageIdx;
5401 else
5402 {
5403 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5404 N_("DrvVD: Configuration error: Multiple \"MergeSource\" occurrences"));
5405 break;
5406 }
5407 }
5408
5409 bool fMergeTarget;
5410 rc = CFGMR3QueryBoolDef(pCurNode, "MergeTarget", &fMergeTarget, false);
5411 if (RT_FAILURE(rc))
5412 {
5413 rc = PDMDRV_SET_ERROR(pDrvIns, rc,
5414 N_("DrvVD: Configuration error: Querying \"MergeTarget\" as boolean failed"));
5415 break;
5416 }
5417 if (fMergeTarget)
5418 {
5419 if (pThis->uMergeTarget == VD_LAST_IMAGE)
5420 pThis->uMergeTarget = iImageIdx;
5421 else
5422 {
5423 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5424 N_("DrvVD: Configuration error: Multiple \"MergeTarget\" occurrences"));
5425 break;
5426 }
5427 }
5428
5429 PCFGMNODE pCfgVDConfig = CFGMR3GetChild(pCurNode, "VDConfig");
5430 pImage->VDIfConfig.pfnAreKeysValid = drvvdCfgAreKeysValid;
5431 pImage->VDIfConfig.pfnQuerySize = drvvdCfgQuerySize;
5432 pImage->VDIfConfig.pfnQuery = drvvdCfgQuery;
5433 pImage->VDIfConfig.pfnQueryBytes = NULL;
5434 rc = VDInterfaceAdd(&pImage->VDIfConfig.Core, "DrvVD_Config", VDINTERFACETYPE_CONFIG,
5435 pCfgVDConfig, sizeof(VDINTERFACECONFIG), &pImage->pVDIfsImage);
5436 AssertRC(rc);
5437
5438 /* Check VDConfig for encryption config. */
5439 if (pCfgVDConfig)
5440 pThis->pCfgCrypto = CFGMR3GetChild(pCfgVDConfig, "CRYPT");
5441
5442 if (pThis->pCfgCrypto)
5443 {
5444 /* Setup VDConfig interface for disk encryption support. */
5445 pThis->VDIfCfg.pfnAreKeysValid = drvvdCfgAreKeysValid;
5446 pThis->VDIfCfg.pfnQuerySize = drvvdCfgQuerySize;
5447 pThis->VDIfCfg.pfnQuery = drvvdCfgQuery;
5448 pThis->VDIfCfg.pfnQueryBytes = NULL;
5449
5450 pThis->VDIfCrypto.pfnKeyRetain = drvvdCryptoKeyRetain;
5451 pThis->VDIfCrypto.pfnKeyRelease = drvvdCryptoKeyRelease;
5452 pThis->VDIfCrypto.pfnKeyStorePasswordRetain = drvvdCryptoKeyStorePasswordRetain;
5453 pThis->VDIfCrypto.pfnKeyStorePasswordRelease = drvvdCryptoKeyStorePasswordRelease;
5454 }
5455
5456 /* Unconditionally insert the TCPNET interface, don't bother to check
5457 * if an image really needs it. Will be ignored. Since the TCPNET
5458 * interface is per image we could make this more flexible in the
5459 * future if we want to. */
5460 /* Construct TCPNET callback table depending on the config. This is
5461 * done unconditionally, as uninterested backends will ignore it. */
5462 if (fHostIP)
5463 {
5464 pImage->VDIfTcpNet.pfnSocketCreate = drvvdTcpSocketCreate;
5465 pImage->VDIfTcpNet.pfnSocketDestroy = drvvdTcpSocketDestroy;
5466 pImage->VDIfTcpNet.pfnClientConnect = drvvdTcpClientConnect;
5467 pImage->VDIfTcpNet.pfnIsClientConnected = drvvdTcpIsClientConnected;
5468 pImage->VDIfTcpNet.pfnClientClose = drvvdTcpClientClose;
5469 pImage->VDIfTcpNet.pfnSelectOne = drvvdTcpSelectOne;
5470 pImage->VDIfTcpNet.pfnRead = drvvdTcpRead;
5471 pImage->VDIfTcpNet.pfnWrite = drvvdTcpWrite;
5472 pImage->VDIfTcpNet.pfnSgWrite = drvvdTcpSgWrite;
5473 pImage->VDIfTcpNet.pfnReadNB = drvvdTcpReadNB;
5474 pImage->VDIfTcpNet.pfnWriteNB = drvvdTcpWriteNB;
5475 pImage->VDIfTcpNet.pfnSgWriteNB = drvvdTcpSgWriteNB;
5476 pImage->VDIfTcpNet.pfnFlush = drvvdTcpFlush;
5477 pImage->VDIfTcpNet.pfnSetSendCoalescing = drvvdTcpSetSendCoalescing;
5478 pImage->VDIfTcpNet.pfnGetLocalAddress = drvvdTcpGetLocalAddress;
5479 pImage->VDIfTcpNet.pfnGetPeerAddress = drvvdTcpGetPeerAddress;
5480
5481 /*
5482 * There is a 15ms delay between receiving the data and marking the socket
5483 * as readable on Windows XP which hurts async I/O performance of
5484 * TCP backends badly. Provide a different select method without
5485 * using poll on XP.
5486 * This is only used on XP because it is not as efficient as the one using poll
5487 * and all other Windows versions are working fine.
5488 */
5489 char szOS[64];
5490 memset(szOS, 0, sizeof(szOS));
5491 rc = RTSystemQueryOSInfo(RTSYSOSINFO_PRODUCT, &szOS[0], sizeof(szOS));
5492
5493 if (RT_SUCCESS(rc) && !strncmp(szOS, "Windows XP", 10))
5494 {
5495 LogRel(("VD: Detected Windows XP, disabled poll based waiting for TCP\n"));
5496 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdTcpSelectOneExNoPoll;
5497 }
5498 else
5499 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdTcpSelectOneExPoll;
5500
5501 pImage->VDIfTcpNet.pfnPoke = drvvdTcpPoke;
5502 }
5503 else
5504 {
5505#ifndef VBOX_WITH_INIP
5506 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5507 RT_SRC_POS, N_("DrvVD: Configuration error: TCP over Internal Networking not compiled in"));
5508#else /* VBOX_WITH_INIP */
5509 pImage->VDIfTcpNet.pfnSocketCreate = drvvdINIPSocketCreate;
5510 pImage->VDIfTcpNet.pfnSocketDestroy = drvvdINIPSocketDestroy;
5511 pImage->VDIfTcpNet.pfnClientConnect = drvvdINIPClientConnect;
5512 pImage->VDIfTcpNet.pfnClientClose = drvvdINIPClientClose;
5513 pImage->VDIfTcpNet.pfnIsClientConnected = drvvdINIPIsClientConnected;
5514 pImage->VDIfTcpNet.pfnSelectOne = drvvdINIPSelectOne;
5515 pImage->VDIfTcpNet.pfnRead = drvvdINIPRead;
5516 pImage->VDIfTcpNet.pfnWrite = drvvdINIPWrite;
5517 pImage->VDIfTcpNet.pfnSgWrite = drvvdINIPSgWrite;
5518 pImage->VDIfTcpNet.pfnFlush = drvvdINIPFlush;
5519 pImage->VDIfTcpNet.pfnSetSendCoalescing = drvvdINIPSetSendCoalescing;
5520 pImage->VDIfTcpNet.pfnGetLocalAddress = drvvdINIPGetLocalAddress;
5521 pImage->VDIfTcpNet.pfnGetPeerAddress = drvvdINIPGetPeerAddress;
5522 pImage->VDIfTcpNet.pfnSelectOneEx = drvvdINIPSelectOneEx;
5523 pImage->VDIfTcpNet.pfnPoke = drvvdINIPPoke;
5524#endif /* VBOX_WITH_INIP */
5525 }
5526 rc = VDInterfaceAdd(&pImage->VDIfTcpNet.Core, "DrvVD_TCPNET",
5527 VDINTERFACETYPE_TCPNET, NULL,
5528 sizeof(VDINTERFACETCPNET), &pImage->pVDIfsImage);
5529 AssertRC(rc);
5530
5531 /* Insert the custom I/O interface only if we're told to use new IO.
5532 * Since the I/O interface is per image we could make this more
5533 * flexible in the future if we want to. */
5534 if (fUseNewIo)
5535 {
5536#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
5537 pImage->VDIfIo.pfnOpen = drvvdAsyncIOOpen;
5538 pImage->VDIfIo.pfnClose = drvvdAsyncIOClose;
5539 pImage->VDIfIo.pfnGetSize = drvvdAsyncIOGetSize;
5540 pImage->VDIfIo.pfnSetSize = drvvdAsyncIOSetSize;
5541 pImage->VDIfIo.pfnSetAllocationSize = drvvdAsyncIOSetAllocationSize;
5542 pImage->VDIfIo.pfnReadSync = drvvdAsyncIOReadSync;
5543 pImage->VDIfIo.pfnWriteSync = drvvdAsyncIOWriteSync;
5544 pImage->VDIfIo.pfnFlushSync = drvvdAsyncIOFlushSync;
5545 pImage->VDIfIo.pfnReadAsync = drvvdAsyncIOReadAsync;
5546 pImage->VDIfIo.pfnWriteAsync = drvvdAsyncIOWriteAsync;
5547 pImage->VDIfIo.pfnFlushAsync = drvvdAsyncIOFlushAsync;
5548#else /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5549 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5550 RT_SRC_POS, N_("DrvVD: Configuration error: Async Completion Framework not compiled in"));
5551#endif /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5552 if (RT_SUCCESS(rc))
5553 rc = VDInterfaceAdd(&pImage->VDIfIo.Core, "DrvVD_IO", VDINTERFACETYPE_IO,
5554 pThis, sizeof(VDINTERFACEIO), &pImage->pVDIfsImage);
5555 AssertRC(rc);
5556 }
5557
5558 /*
5559 * Open the image.
5560 */
5561 unsigned uOpenFlags;
5562 if (fReadOnly || pThis->fTempReadOnly || iLevel != 0)
5563 uOpenFlags = VD_OPEN_FLAGS_READONLY;
5564 else
5565 uOpenFlags = VD_OPEN_FLAGS_NORMAL;
5566 if (fHonorZeroWrites)
5567 uOpenFlags |= VD_OPEN_FLAGS_HONOR_ZEROES;
5568 if (pThis->fAsyncIOSupported)
5569 uOpenFlags |= VD_OPEN_FLAGS_ASYNC_IO;
5570 if (pThis->fShareable)
5571 uOpenFlags |= VD_OPEN_FLAGS_SHAREABLE;
5572 if (fDiscard && iLevel == 0)
5573 uOpenFlags |= VD_OPEN_FLAGS_DISCARD;
5574 if (fInformAboutZeroBlocks)
5575 uOpenFlags |= VD_OPEN_FLAGS_INFORM_ABOUT_ZERO_BLOCKS;
5576 if ( (uOpenFlags & VD_OPEN_FLAGS_READONLY)
5577 && fSkipConsistencyChecks)
5578 uOpenFlags |= VD_OPEN_FLAGS_SKIP_CONSISTENCY_CHECKS;
5579
5580 /* Try to open backend in async I/O mode first. */
5581 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5582 if (rc == VERR_NOT_SUPPORTED)
5583 {
5584 pThis->fAsyncIOSupported = false;
5585 uOpenFlags &= ~VD_OPEN_FLAGS_ASYNC_IO;
5586 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5587 }
5588
5589 if (rc == VERR_VD_DISCARD_NOT_SUPPORTED)
5590 {
5591 fDiscard = false;
5592 uOpenFlags &= ~VD_OPEN_FLAGS_DISCARD;
5593 rc = VDOpen(pThis->pDisk, pszFormat, pszName, uOpenFlags, pImage->pVDIfsImage);
5594 }
5595
5596 if (!fDiscard)
5597 {
5598 pThis->IMedia.pfnDiscard = NULL;
5599 pThis->IMediaEx.pfnIoReqDiscard = NULL;
5600 }
5601
5602 if (RT_SUCCESS(rc))
5603 {
5604 LogFunc(("%d - Opened '%s' in %s mode\n",
5605 iLevel, pszName,
5606 VDIsReadOnly(pThis->pDisk) ? "read-only" : "read-write"));
5607 if ( VDIsReadOnly(pThis->pDisk)
5608 && !fReadOnly
5609 && !fMaybeReadOnly
5610 && !pThis->fTempReadOnly
5611 && iLevel == 0)
5612 {
5613 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_VD_IMAGE_READ_ONLY, RT_SRC_POS,
5614 N_("Failed to open image '%s' for writing due to wrong permissions"),
5615 pszName);
5616 break;
5617 }
5618 }
5619 else
5620 {
5621 rc = PDMDrvHlpVMSetError(pDrvIns, rc, RT_SRC_POS,
5622 N_("Failed to open image '%s' in %s mode"), pszName,
5623 (uOpenFlags & VD_OPEN_FLAGS_READONLY) ? "read-only" : "read-write");
5624 break;
5625 }
5626
5627 MMR3HeapFree(pszName);
5628 pszName = NULL;
5629 MMR3HeapFree(pszFormat);
5630 pszFormat = NULL;
5631
5632 /* next */
5633 iLevel--;
5634 iImageIdx++;
5635 pCurNode = CFGMR3GetParent(pCurNode);
5636 }
5637
5638 LogRel(("VD: Opening the disk took %lld ns\n", RTTimeNanoTS() - tsStart));
5639
5640 /* Open the cache image if set. */
5641 if ( RT_SUCCESS(rc)
5642 && RT_VALID_PTR(pszCachePath))
5643 {
5644 /* Insert the custom I/O interface only if we're told to use new IO.
5645 * Since the I/O interface is per image we could make this more
5646 * flexible in the future if we want to. */
5647 if (fUseNewIo)
5648 {
5649#ifdef VBOX_WITH_PDM_ASYNC_COMPLETION
5650 pThis->VDIfIoCache.pfnOpen = drvvdAsyncIOOpen;
5651 pThis->VDIfIoCache.pfnClose = drvvdAsyncIOClose;
5652 pThis->VDIfIoCache.pfnGetSize = drvvdAsyncIOGetSize;
5653 pThis->VDIfIoCache.pfnSetSize = drvvdAsyncIOSetSize;
5654 pThis->VDIfIoCache.pfnReadSync = drvvdAsyncIOReadSync;
5655 pThis->VDIfIoCache.pfnWriteSync = drvvdAsyncIOWriteSync;
5656 pThis->VDIfIoCache.pfnFlushSync = drvvdAsyncIOFlushSync;
5657 pThis->VDIfIoCache.pfnReadAsync = drvvdAsyncIOReadAsync;
5658 pThis->VDIfIoCache.pfnWriteAsync = drvvdAsyncIOWriteAsync;
5659 pThis->VDIfIoCache.pfnFlushAsync = drvvdAsyncIOFlushAsync;
5660#else /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5661 rc = PDMDrvHlpVMSetError(pDrvIns, VERR_PDM_DRVINS_UNKNOWN_CFG_VALUES,
5662 RT_SRC_POS, N_("DrvVD: Configuration error: Async Completion Framework not compiled in"));
5663#endif /* !VBOX_WITH_PDM_ASYNC_COMPLETION */
5664 if (RT_SUCCESS(rc))
5665 rc = VDInterfaceAdd(&pThis->VDIfIoCache.Core, "DrvVD_IO", VDINTERFACETYPE_IO,
5666 pThis, sizeof(VDINTERFACEIO), &pThis->pVDIfsCache);
5667 AssertRC(rc);
5668 }
5669
5670 rc = VDCacheOpen(pThis->pDisk, pszCacheFormat, pszCachePath, VD_OPEN_FLAGS_NORMAL, pThis->pVDIfsCache);
5671 if (RT_FAILURE(rc))
5672 rc = PDMDRV_SET_ERROR(pDrvIns, rc, N_("DrvVD: Could not open cache image"));
5673 }
5674
5675 if (RT_VALID_PTR(pszCachePath))
5676 MMR3HeapFree(pszCachePath);
5677 if (RT_VALID_PTR(pszCacheFormat))
5678 MMR3HeapFree(pszCacheFormat);
5679
5680 if ( RT_SUCCESS(rc)
5681 && pThis->fMergePending
5682 && ( pThis->uMergeSource == VD_LAST_IMAGE
5683 || pThis->uMergeTarget == VD_LAST_IMAGE))
5684 {
5685 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5686 N_("DrvVD: Configuration error: Inconsistent image merge data"));
5687 }
5688
5689 /* Create the block cache if enabled. */
5690 if ( fUseBlockCache
5691 && !pThis->fShareable
5692 && !fDiscard
5693 && !pThis->pCfgCrypto /* Disk encryption disables the block cache for security reasons */
5694 && RT_SUCCESS(rc))
5695 {
5696 /*
5697 * We need a unique ID for the block cache (to identify the owner of data
5698 * blocks in a saved state). UUIDs are not really suitable because
5699 * there are image formats which don't support them. Furthermore it is
5700 * possible that a new diff image was attached after a saved state
5701 * which changes the UUID.
5702 * However the device "name + device instance + LUN" triple the disk is
5703 * attached to is always constant for saved states.
5704 */
5705 char *pszId = NULL;
5706 uint32_t iInstance, iLUN;
5707 const char *pcszController;
5708
5709 rc = pThis->pDrvMediaPort->pfnQueryDeviceLocation(pThis->pDrvMediaPort, &pcszController,
5710 &iInstance, &iLUN);
5711 if (RT_FAILURE(rc))
5712 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5713 N_("DrvVD: Configuration error: Could not query device data"));
5714 else
5715 {
5716 int cbStr = RTStrAPrintf(&pszId, "%s-%d-%d", pcszController, iInstance, iLUN);
5717
5718 if (cbStr > 0)
5719 {
5720 rc = PDMDrvHlpBlkCacheRetain(pDrvIns, &pThis->pBlkCache,
5721 drvvdBlkCacheXferCompleteIoReq,
5722 drvvdBlkCacheXferEnqueue,
5723 drvvdBlkCacheXferEnqueueDiscard,
5724 pszId);
5725 if (rc == VERR_NOT_SUPPORTED)
5726 {
5727 LogRel(("VD: Block cache is not supported\n"));
5728 rc = VINF_SUCCESS;
5729 }
5730 else
5731 AssertRC(rc);
5732
5733 RTStrFree(pszId);
5734 }
5735 else
5736 rc = PDMDRV_SET_ERROR(pDrvIns, VERR_PDM_DRIVER_INVALID_PROPERTIES,
5737 N_("DrvVD: Out of memory when creating block cache"));
5738 }
5739 }
5740
5741 if (RT_SUCCESS(rc))
5742 rc = drvvdSetupFilters(pThis, pCfg);
5743
5744 /*
5745 * Register a load-done callback so we can undo TempReadOnly config before
5746 * we get to drvvdResume. Automatically deregistered upon destruction.
5747 */
5748 if (RT_SUCCESS(rc))
5749 rc = PDMDrvHlpSSMRegisterEx(pDrvIns, 0 /* version */, 0 /* cbGuess */,
5750 NULL /*pfnLivePrep*/, NULL /*pfnLiveExec*/, NULL /*pfnLiveVote*/,
5751 NULL /*pfnSavePrep*/, NULL /*pfnSaveExec*/, NULL /*pfnSaveDone*/,
5752 NULL /*pfnDonePrep*/, NULL /*pfnLoadExec*/, drvvdLoadDone);
5753
5754 /* Setup the boot acceleration stuff if enabled. */
5755 if (RT_SUCCESS(rc) && pThis->fBootAccelEnabled)
5756 {
5757 pThis->cbDisk = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
5758 Assert(pThis->cbDisk > 0);
5759 pThis->pbData = (uint8_t *)RTMemAllocZ(pThis->cbBootAccelBuffer);
5760 if (pThis->pbData)
5761 {
5762 pThis->fBootAccelActive = true;
5763 pThis->offDisk = 0;
5764 pThis->cbDataValid = 0;
5765 LogRel(("VD: Boot acceleration enabled\n"));
5766 }
5767 else
5768 LogRel(("VD: Boot acceleration, out of memory, disabled\n"));
5769 }
5770
5771 if ( RTUuidIsNull(&pThis->Uuid)
5772 && pThis->enmType == PDMMEDIATYPE_HARD_DISK)
5773 VDGetUuid(pThis->pDisk, 0, &pThis->Uuid);
5774
5775 /*
5776 * Automatically upgrade the floppy drive if the specified one is too
5777 * small to represent the whole boot time image. (We cannot do this later
5778 * since the BIOS (and others) gets the info via CMOS.)
5779 *
5780 * This trick should make 2.88 images as well as the fake 15.6 and 63.5 MB
5781 * images despite the hardcoded default 1.44 drive.
5782 */
5783 if ( PDMMEDIATYPE_IS_FLOPPY(pThis->enmType)
5784 && pThis->pDisk)
5785 {
5786 uint64_t const cbFloppyImg = VDGetSize(pThis->pDisk, VD_LAST_IMAGE);
5787 PDMMEDIATYPE const enmCfgType = pThis->enmType;
5788 switch (enmCfgType)
5789 {
5790 default:
5791 AssertFailed();
5792 RT_FALL_THRU();
5793 case PDMMEDIATYPE_FLOPPY_360:
5794 if (cbFloppyImg > 40 * 2 * 9 * 512)
5795 pThis->enmType = PDMMEDIATYPE_FLOPPY_720;
5796 RT_FALL_THRU();
5797 case PDMMEDIATYPE_FLOPPY_720:
5798 if (cbFloppyImg > 80 * 2 * 14 * 512)
5799 pThis->enmType = PDMMEDIATYPE_FLOPPY_1_20;
5800 RT_FALL_THRU();
5801 case PDMMEDIATYPE_FLOPPY_1_20:
5802 if (cbFloppyImg > 80 * 2 * 20 * 512)
5803 pThis->enmType = PDMMEDIATYPE_FLOPPY_1_44;
5804 RT_FALL_THRU();
5805 case PDMMEDIATYPE_FLOPPY_1_44:
5806 if (cbFloppyImg > 80 * 2 * 24 * 512)
5807 pThis->enmType = PDMMEDIATYPE_FLOPPY_2_88;
5808 RT_FALL_THRU();
5809 case PDMMEDIATYPE_FLOPPY_2_88:
5810 if (cbFloppyImg > 80 * 2 * 48 * 512)
5811 pThis->enmType = PDMMEDIATYPE_FLOPPY_FAKE_15_6;
5812 RT_FALL_THRU();
5813 case PDMMEDIATYPE_FLOPPY_FAKE_15_6:
5814 if (cbFloppyImg > 255 * 2 * 63 * 512)
5815 pThis->enmType = PDMMEDIATYPE_FLOPPY_FAKE_63_5;
5816 RT_FALL_THRU();
5817 case PDMMEDIATYPE_FLOPPY_FAKE_63_5:
5818 if (cbFloppyImg > 255 * 2 * 255 * 512)
5819 LogRel(("Warning: Floppy image is larger that 63.5 MB! (%llu bytes)\n", cbFloppyImg));
5820 break;
5821 }
5822 if (pThis->enmType != enmCfgType)
5823 LogRel(("DrvVD: Automatically upgraded floppy drive from %s to %s to better support the %u byte image\n",
5824 drvvdGetTypeName(enmCfgType), drvvdGetTypeName(pThis->enmType), cbFloppyImg));
5825 }
5826 } /* !fEmptyDrive */
5827
5828 if (RT_SUCCESS(rc))
5829 drvvdStatsRegister(pThis);
5830
5831 if (RT_FAILURE(rc))
5832 {
5833 if (RT_VALID_PTR(pszName))
5834 MMR3HeapFree(pszName);
5835 if (RT_VALID_PTR(pszFormat))
5836 MMR3HeapFree(pszFormat);
5837 /* drvvdDestruct does the rest. */
5838 }
5839
5840 LogFlowFunc(("returns %Rrc\n", rc));
5841 return rc;
5842}
5843
5844/**
5845 * VBox disk container media driver registration record.
5846 */
5847const PDMDRVREG g_DrvVD =
5848{
5849 /* u32Version */
5850 PDM_DRVREG_VERSION,
5851 /* szName */
5852 "VD",
5853 /* szRCMod */
5854 "",
5855 /* szR0Mod */
5856 "",
5857 /* pszDescription */
5858 "Generic VBox disk media driver.",
5859 /* fFlags */
5860 PDM_DRVREG_FLAGS_HOST_BITS_DEFAULT,
5861 /* fClass. */
5862 PDM_DRVREG_CLASS_MEDIA,
5863 /* cMaxInstances */
5864 ~0U,
5865 /* cbInstance */
5866 sizeof(VBOXDISK),
5867 /* pfnConstruct */
5868 drvvdConstruct,
5869 /* pfnDestruct */
5870 drvvdDestruct,
5871 /* pfnRelocate */
5872 NULL,
5873 /* pfnIOCtl */
5874 NULL,
5875 /* pfnPowerOn */
5876 drvvdPowerOn,
5877 /* pfnReset */
5878 drvvdReset,
5879 /* pfnSuspend */
5880 drvvdSuspend,
5881 /* pfnResume */
5882 drvvdResume,
5883 /* pfnAttach */
5884 NULL,
5885 /* pfnDetach */
5886 NULL,
5887 /* pfnPowerOff */
5888 drvvdPowerOff,
5889 /* pfnSoftReset */
5890 NULL,
5891 /* u32EndVersion */
5892 PDM_DRVREG_VERSION
5893};
5894
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette