VirtualBox

source: vbox/trunk/src/VBox/Runtime/r3/win/fileaio-win.cpp@ 25240

Last change on this file since 25240 was 21494, checked in by vboxsync, 15 years ago

Runtime/fileaio-win: Fix a possible race

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 17.0 KB
Line 
1/* $Id: fileaio-win.cpp 21494 2009-07-10 20:11:26Z vboxsync $ */
2/** @file
3 * IPRT - File async I/O, native implementation for the Windows host platform.
4 */
5
6/*
7 * Copyright (C) 2006-2007 Sun Microsystems, Inc.
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 *
26 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa
27 * Clara, CA 95054 USA or visit http://www.sun.com if you need
28 * additional information or have any questions.
29 */
30
31
32/*******************************************************************************
33* Header Files *
34*******************************************************************************/
35#define LOG_GROUP RTLOGGROUP_DIR
36
37#include <iprt/asm.h>
38#include <iprt/file.h>
39#include <iprt/mem.h>
40#include <iprt/assert.h>
41#include <iprt/string.h>
42#include <iprt/err.h>
43#include <iprt/log.h>
44#include "internal/fileaio.h"
45
46#include <Windows.h>
47
48/*******************************************************************************
49* Structures and Typedefs *
50*******************************************************************************/
51
/**
 * Direction of the data transfer described by a request.
 */
typedef enum TRANSFERDIRECTION
{
    /** Invalid direction; also the value found in a zero-initialised request. */
    TRANSFERDIRECTION_INVALID    = 0,
    /** The request reads from the file. */
    TRANSFERDIRECTION_READ       = 1,
    /** The request writes to the file. */
    TRANSFERDIRECTION_WRITE      = 2,
    /** The usual 32-bit hack. */
    TRANSFERDIRECTION_32BIT_HACK = 0x7fffffff
} TRANSFERDIRECTION;
65
66/**
67 * Async I/O completion context state.
68 */
69typedef struct RTFILEAIOCTXINTERNAL
70{
71 /** handle to I/O completion port. */
72 HANDLE hIoCompletionPort;
73 /** Current number of requests pending. */
74 volatile int32_t cRequests;
75 /** Flag whether the thread was woken up. */
76 volatile bool fWokenUp;
77 /** Flag whether the thread is currently waiting. */
78 volatile bool fWaiting;
79 /** Magic value (RTFILEAIOCTX_MAGIC). */
80 uint32_t u32Magic;
81} RTFILEAIOCTXINTERNAL;
82/** Pointer to an internal context structure. */
83typedef RTFILEAIOCTXINTERNAL *PRTFILEAIOCTXINTERNAL;
84
85/**
86 * Async I/O request state.
87 */
88typedef struct RTFILEAIOREQINTERNAL
89{
90 /** Overlapped structure. */
91 OVERLAPPED Overlapped;
92 /** Current state the request is in. */
93 RTFILEAIOREQSTATE enmState;
94 /** The file handle. */
95 HANDLE hFile;
96 /** Kind of transfer Read/Write. */
97 TRANSFERDIRECTION enmTransferDirection;
98 /** Number of bytes to transfer. */
99 size_t cbTransfer;
100 /** Pointer to the buffer. */
101 void *pvBuf;
102 /** Opaque user data. */
103 void *pvUser;
104 /** Flag whether the request completed. */
105 bool fCompleted;
106 /** Number of bytes transfered successfully. */
107 size_t cbTransfered;
108 /** Error code of the completed request. */
109 int Rc;
110 /** Completion context we are assigned to. */
111 PRTFILEAIOCTXINTERNAL pCtxInt;
112 /** Magic value (RTFILEAIOREQ_MAGIC). */
113 uint32_t u32Magic;
114} RTFILEAIOREQINTERNAL;
115/** Pointer to an internal request structure. */
116typedef RTFILEAIOREQINTERNAL *PRTFILEAIOREQINTERNAL;
117
118/*******************************************************************************
119* Defined Constants And Macros *
120*******************************************************************************/
/** Completion key posted to the completion port to wake up a waiting thread. */
#define AIO_CONTEXT_WAKEUP_EVENT 1
/** Converts a pointer to the embedded OVERLAPPED member back into a pointer to
 *  the internal request structure that contains it. */
#define OVERLAPPED_2_RTFILEAIOREQINTERNAL(pOverlapped) \
    ( (PRTFILEAIOREQINTERNAL)((uintptr_t)(pOverlapped) - RT_OFFSETOF(RTFILEAIOREQINTERNAL, Overlapped)) )
125
126RTR3DECL(int) RTFileAioGetLimits(PRTFILEAIOLIMITS pAioLimits)
127{
128 int rcBSD = 0;
129 AssertPtrReturn(pAioLimits, VERR_INVALID_POINTER);
130
131 /* No limits known. */
132 pAioLimits->cReqsOutstandingMax = RTFILEAIO_UNLIMITED_REQS;
133 pAioLimits->cbBufferAlignment = 0;
134
135 return VINF_SUCCESS;
136}
137
138RTR3DECL(int) RTFileAioReqCreate(PRTFILEAIOREQ phReq)
139{
140 AssertPtrReturn(phReq, VERR_INVALID_POINTER);
141
142 PRTFILEAIOREQINTERNAL pReqInt = (PRTFILEAIOREQINTERNAL)RTMemAllocZ(sizeof(RTFILEAIOREQINTERNAL));
143 if (RT_UNLIKELY(!pReqInt))
144 return VERR_NO_MEMORY;
145
146 pReqInt->pCtxInt = NULL;
147 pReqInt->fCompleted = false;
148 pReqInt->u32Magic = RTFILEAIOREQ_MAGIC;
149 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
150
151 *phReq = (RTFILEAIOREQ)pReqInt;
152
153 return VINF_SUCCESS;
154}
155
156RTDECL(int) RTFileAioReqDestroy(RTFILEAIOREQ hReq)
157{
158 /*
159 * Validate the handle and ignore nil.
160 */
161 if (hReq == NIL_RTFILEAIOREQ)
162 return VINF_SUCCESS;
163 PRTFILEAIOREQINTERNAL pReqInt = hReq;
164 RTFILEAIOREQ_VALID_RETURN(pReqInt);
165 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
166
167 /*
168 * Trash the magic and free it.
169 */
170 ASMAtomicUoWriteU32(&pReqInt->u32Magic, ~RTFILEAIOREQ_MAGIC);
171 RTMemFree(pReqInt);
172 return VINF_SUCCESS;
173}
174
175/**
176 * Worker setting up the request.
177 */
178DECLINLINE(int) rtFileAioReqPrepareTransfer(RTFILEAIOREQ hReq, RTFILE hFile,
179 TRANSFERDIRECTION enmTransferDirection,
180 RTFOFF off, void *pvBuf, size_t cbTransfer,
181 void *pvUser)
182{
183 /*
184 * Validate the input.
185 */
186 PRTFILEAIOREQINTERNAL pReqInt = hReq;
187 RTFILEAIOREQ_VALID_RETURN(pReqInt);
188 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
189 Assert(hFile != NIL_RTFILE);
190 AssertPtr(pvBuf);
191 Assert(off >= 0);
192 Assert(cbTransfer > 0);
193
194 pReqInt->enmTransferDirection = enmTransferDirection;
195 pReqInt->hFile = (HANDLE)hFile;
196 pReqInt->Overlapped.Offset = (DWORD)(off & 0xffffffff);
197 pReqInt->Overlapped.OffsetHigh = (DWORD)(off >> 32);
198 pReqInt->cbTransfer = cbTransfer;
199 pReqInt->pvBuf = pvBuf;
200 pReqInt->pvUser = pvUser;
201 pReqInt->fCompleted = false;
202
203 return VINF_SUCCESS;
204}
205
206RTDECL(int) RTFileAioReqPrepareRead(RTFILEAIOREQ hReq, RTFILE hFile, RTFOFF off,
207 void *pvBuf, size_t cbRead, void *pvUser)
208{
209 return rtFileAioReqPrepareTransfer(hReq, hFile, TRANSFERDIRECTION_READ,
210 off, pvBuf, cbRead, pvUser);
211}
212
213RTDECL(int) RTFileAioReqPrepareWrite(RTFILEAIOREQ hReq, RTFILE hFile, RTFOFF off,
214 void *pvBuf, size_t cbWrite, void *pvUser)
215{
216 return rtFileAioReqPrepareTransfer(hReq, hFile, TRANSFERDIRECTION_WRITE,
217 off, pvBuf, cbWrite, pvUser);
218}
219
220RTDECL(int) RTFileAioReqPrepareFlush(RTFILEAIOREQ hReq, RTFILE hFile, void *pvUser)
221{
222 PRTFILEAIOREQINTERNAL pReqInt = hReq;
223 RTFILEAIOREQ_VALID_RETURN(pReqInt);
224 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
225 AssertReturn(hFile != NIL_RTFILE, VERR_INVALID_HANDLE);
226
227 /** @todo: Flushing is not available */
228#if 0
229 return rtFileAsyncPrepareTransfer(pRequest, File, TRANSFERDIRECTION_FLUSH,
230 0, NULL, 0, pvUser);
231#endif
232 return VERR_NOT_IMPLEMENTED;
233}
234
235RTDECL(void *) RTFileAioReqGetUser(RTFILEAIOREQ hReq)
236{
237 PRTFILEAIOREQINTERNAL pReqInt = hReq;
238 RTFILEAIOREQ_VALID_RETURN_RC(pReqInt, NULL);
239
240 return pReqInt->pvUser;
241}
242
243RTDECL(int) RTFileAioReqCancel(RTFILEAIOREQ hReq)
244{
245 PRTFILEAIOREQINTERNAL pReqInt = hReq;
246 RTFILEAIOREQ_VALID_RETURN(pReqInt);
247 RTFILEAIOREQ_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_NOT_SUBMITTED);
248
249 /**
250 * @todo r=aeichner It is not possible to cancel specific
251 * requests on Windows before Vista.
252 * CancelIo cancels all requests for a file issued by the
253 * calling thread and CancelIoEx which does what we need
254 * is only available from Vista and up.
255 * The solution is to return VERR_FILE_AIO_IN_PROGRESS
256 * if the request didn't completed yet (checked above).
257 * Shouldn't be a big issue because a request is normally
258 * only canceled if it exceeds a timeout which is quite huge.
259 */
260 return VERR_FILE_AIO_COMPLETED;
261}
262
263RTDECL(int) RTFileAioReqGetRC(RTFILEAIOREQ hReq, size_t *pcbTransfered)
264{
265 int rc = VINF_SUCCESS;
266 PRTFILEAIOREQINTERNAL pReqInt = hReq;
267 RTFILEAIOREQ_VALID_RETURN(pReqInt);
268 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
269 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, PREPARED, VERR_FILE_AIO_NOT_SUBMITTED);
270
271 rc = pReqInt->Rc;
272 if (pcbTransfered && RT_SUCCESS(rc))
273 *pcbTransfered = pReqInt->cbTransfered;
274
275 return rc;
276}
277
278RTDECL(int) RTFileAioCtxCreate(PRTFILEAIOCTX phAioCtx, uint32_t cAioReqsMax)
279{
280 PRTFILEAIOCTXINTERNAL pCtxInt;
281 AssertPtrReturn(phAioCtx, VERR_INVALID_POINTER);
282
283 pCtxInt = (PRTFILEAIOCTXINTERNAL)RTMemAllocZ(sizeof(RTFILEAIOCTXINTERNAL));
284 if (RT_UNLIKELY(!pCtxInt))
285 return VERR_NO_MEMORY;
286
287 pCtxInt->hIoCompletionPort = CreateIoCompletionPort(INVALID_HANDLE_VALUE,
288 NULL,
289 0,
290 0);
291 if (RT_UNLIKELY(!pCtxInt->hIoCompletionPort))
292 {
293 RTMemFree(pCtxInt);
294 return VERR_NO_MEMORY;
295 }
296
297 pCtxInt->u32Magic = RTFILEAIOCTX_MAGIC;
298
299 *phAioCtx = (RTFILEAIOCTX)pCtxInt;
300
301 return VINF_SUCCESS;
302}
303
304RTDECL(int) RTFileAioCtxDestroy(RTFILEAIOCTX hAioCtx)
305{
306 /* Validate the handle and ignore nil. */
307 if (hAioCtx == NIL_RTFILEAIOCTX)
308 return VINF_SUCCESS;
309 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
310 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
311
312 /* Cannot destroy a busy context. */
313 if (RT_UNLIKELY(pCtxInt->cRequests))
314 return VERR_FILE_AIO_BUSY;
315
316 CloseHandle(pCtxInt->hIoCompletionPort);
317 ASMAtomicUoWriteU32(&pCtxInt->u32Magic, RTFILEAIOCTX_MAGIC_DEAD);
318 RTMemFree(pCtxInt);
319
320 return VINF_SUCCESS;
321}
322
323RTDECL(int) RTFileAioCtxAssociateWithFile(RTFILEAIOCTX hAioCtx, RTFILE hFile)
324{
325 int rc = VINF_SUCCESS;
326 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
327 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
328
329 HANDLE hTemp = CreateIoCompletionPort((HANDLE)hFile, pCtxInt->hIoCompletionPort, 0, 1);
330 if (hTemp != pCtxInt->hIoCompletionPort)
331 rc = RTErrConvertFromWin32(GetLastError());
332
333 return rc;
334}
335
336RTDECL(uint32_t) RTFileAioCtxGetMaxReqCount(RTFILEAIOCTX hAioCtx)
337{
338 return RTFILEAIO_UNLIMITED_REQS;
339}
340
341RTDECL(int) RTFileAioCtxSubmit(RTFILEAIOCTX hAioCtx, PRTFILEAIOREQ pahReqs, size_t cReqs)
342{
343 /*
344 * Parameter validation.
345 */
346 int rc = VINF_SUCCESS;
347 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
348 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
349 AssertReturn(cReqs > 0, VERR_INVALID_PARAMETER);
350 AssertPtrReturn(pahReqs, VERR_INVALID_POINTER);
351 int i;
352
353 for (i = 0; i < cReqs; i++)
354 {
355 PRTFILEAIOREQINTERNAL pReqInt = pahReqs[i];
356 BOOL fSucceeded;
357
358 if (pReqInt->enmTransferDirection == TRANSFERDIRECTION_READ)
359 {
360 fSucceeded = ReadFile(pReqInt->hFile, pReqInt->pvBuf,
361 pReqInt->cbTransfer, NULL,
362 &pReqInt->Overlapped);
363 }
364 else if (pReqInt->enmTransferDirection == TRANSFERDIRECTION_WRITE)
365 {
366 fSucceeded = WriteFile(pReqInt->hFile, pReqInt->pvBuf,
367 pReqInt->cbTransfer, NULL,
368 &pReqInt->Overlapped);
369 }
370 else
371 AssertMsgFailed(("Invalid transfer direction\n"));
372
373 if (RT_UNLIKELY(!fSucceeded && GetLastError() != ERROR_IO_PENDING))
374 {
375 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
376 rc = RTErrConvertFromWin32(GetLastError());
377 pReqInt->Rc = rc;
378 break;
379 }
380 RTFILEAIOREQ_SET_STATE(pReqInt, SUBMITTED);
381 }
382
383 ASMAtomicAddS32(&pCtxInt->cRequests, i);
384
385 return rc;
386}
387
388RTDECL(int) RTFileAioCtxWait(RTFILEAIOCTX hAioCtx, size_t cMinReqs, unsigned cMillisTimeout,
389 PRTFILEAIOREQ pahReqs, size_t cReqs, uint32_t *pcReqs)
390{
391 /*
392 * Validate the parameters, making sure to always set pcReqs.
393 */
394 AssertPtrReturn(pcReqs, VERR_INVALID_POINTER);
395 *pcReqs = 0; /* always set */
396 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
397 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
398 AssertPtrReturn(pahReqs, VERR_INVALID_POINTER);
399 AssertReturn(cReqs != 0, VERR_INVALID_PARAMETER);
400 AssertReturn(cReqs >= cMinReqs, VERR_OUT_OF_RANGE);
401
402 /*
403 * Can't wait if there are no requests around.
404 */
405 if (RT_UNLIKELY(ASMAtomicUoReadS32(&pCtxInt->cRequests) == 0))
406 return VERR_FILE_AIO_NO_REQUEST;
407
408 /* Wait for at least one. */
409 if (!cMinReqs)
410 cMinReqs = 1;
411
412 /*
413 * Loop until we're woken up, hit an error (incl timeout), or
414 * have collected the desired number of requests.
415 */
416 int rc = VINF_SUCCESS;
417 int cRequestsCompleted = 0;
418 while ( !pCtxInt->fWokenUp
419 && (cMinReqs > 0))
420 {
421 uint64_t StartNanoTS = 0;
422 DWORD dwTimeout = cMillisTimeout == RT_INDEFINITE_WAIT ? INFINITE : cMillisTimeout;
423 DWORD cbTransfered;
424 LPOVERLAPPED pOverlapped;
425 ULONG_PTR lCompletionKey;
426 BOOL fSucceeded;
427
428 if (cMillisTimeout != RT_INDEFINITE_WAIT)
429 StartNanoTS = RTTimeNanoTS();
430
431 ASMAtomicXchgBool(&pCtxInt->fWaiting, true);
432 fSucceeded = GetQueuedCompletionStatus(pCtxInt->hIoCompletionPort,
433 &cbTransfered,
434 &lCompletionKey,
435 &pOverlapped,
436 dwTimeout);
437 ASMAtomicXchgBool(&pCtxInt->fWaiting, false);
438 if (!fSucceeded)
439 {
440 /* Includes VERR_TIMEOUT */
441 rc = RTErrConvertFromWin32(GetLastError());
442 break;
443 }
444
445 /* Check if we got woken up. */
446 if (lCompletionKey == AIO_CONTEXT_WAKEUP_EVENT)
447 break;
448 else
449 {
450 /* A request completed. */
451 PRTFILEAIOREQINTERNAL pReqInt = OVERLAPPED_2_RTFILEAIOREQINTERNAL(pOverlapped);
452 AssertPtr(pReqInt);
453 Assert(pReqInt->u32Magic == RTFILEAIOREQ_MAGIC);
454
455 /* Mark the request as finished. */
456 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
457
458 /* completion status. */
459 DWORD cbTransfered;
460 fSucceeded = GetOverlappedResult(pReqInt->hFile,
461 &pReqInt->Overlapped,
462 &cbTransfered,
463 FALSE);
464 pReqInt->cbTransfered = cbTransfered;
465 pReqInt->Rc = VINF_SUCCESS;
466
467 pahReqs[cRequestsCompleted++] = (RTFILEAIOREQ)pReqInt;
468
469 /* Update counter. */
470 cMinReqs --;
471
472 if (cMillisTimeout != RT_INDEFINITE_WAIT)
473 {
474 /* Recalculate timeout. */
475 uint64_t NanoTS = RTTimeNanoTS();
476 uint64_t cMilliesElapsed = (NanoTS - StartNanoTS) / 1000000;
477 cMillisTimeout -= cMilliesElapsed;
478 }
479 }
480 }
481
482 /*
483 * Update the context state and set the return value.
484 */
485 *pcReqs = cRequestsCompleted;
486 ASMAtomicSubS32(&pCtxInt->cRequests, cRequestsCompleted);
487
488 /*
489 * Clear the wakeup flag and set rc.
490 */
491 bool fWokenUp = ASMAtomicXchgBool(&pCtxInt->fWokenUp, false);
492
493 if ( fWokenUp
494 && RT_SUCCESS(rc))
495 rc = VERR_INTERRUPTED;
496
497 return rc;
498}
499
500RTDECL(int) RTFileAioCtxWakeup(RTFILEAIOCTX hAioCtx)
501{
502 int rc = VINF_SUCCESS;
503 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
504 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
505
506 bool fWokenUp = ASMAtomicXchgBool(&pCtxInt->fWokenUp, true);
507 bool fWaiting = ASMAtomicReadBool(&pCtxInt->fWaiting);
508
509 if ( !fWokenUp
510 && fWaiting)
511 {
512 BOOL fSucceeded = PostQueuedCompletionStatus(pCtxInt->hIoCompletionPort,
513 0, AIO_CONTEXT_WAKEUP_EVENT,
514 NULL);
515
516 if (!fSucceeded)
517 rc = RTErrConvertFromWin32(GetLastError());
518 }
519
520 return rc;
521}
522
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette