VirtualBox

source: vbox/trunk/src/VBox/Runtime/r3/solaris/fileaio-solaris.cpp@ 48647

Last change on this file since 48647 was 45678, checked in by vboxsync, 12 years ago

Runtime/aio: Add flags parameter to RTFileAioCtxCreate

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 17.9 KB
Line 
1/* $Id: fileaio-solaris.cpp 45678 2013-04-23 11:28:41Z vboxsync $ */
2/** @file
3 * IPRT - File async I/O, native implementation for the Solaris host platform.
4 */
5
6/*
7 * Copyright (C) 2006-2012 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27/*******************************************************************************
28* Header Files *
29*******************************************************************************/
30#define LOG_GROUP RTLOGGROUP_FILE
31#include <iprt/asm.h>
32#include <iprt/file.h>
33#include <iprt/mem.h>
34#include <iprt/assert.h>
35#include <iprt/string.h>
36#include <iprt/err.h>
37#include <iprt/log.h>
38#include "internal/fileaio.h"
39
40#include <port.h>
41#include <aio.h>
42#include <errno.h>
43#include <unistd.h>
44
45
46/*******************************************************************************
47* Structures and Typedefs *
48*******************************************************************************/
49/**
50 * Async I/O completion context state.
51 */
52typedef struct RTFILEAIOCTXINTERNAL
53{
54 /** Handle to the port. */
55 int iPort;
56 /** Current number of requests active on this context. */
57 volatile int32_t cRequests;
58 /** Flags given during creation. */
59 uint32_t fFlags;
60 /** Magic value (RTFILEAIOCTX_MAGIC). */
61 uint32_t u32Magic;
62} RTFILEAIOCTXINTERNAL;
63/** Pointer to an internal context structure. */
64typedef RTFILEAIOCTXINTERNAL *PRTFILEAIOCTXINTERNAL;
65
66/**
67 * Async I/O request state.
68 */
69typedef struct RTFILEAIOREQINTERNAL
70{
71 /** The aio control block. Must be the FIRST
72 * element. */
73 struct aiocb AioCB;
74 /** Current state the request is in. */
75 RTFILEAIOREQSTATE enmState;
76 /** Flag whether this is a flush request. */
77 bool fFlush;
78 /** Port notifier object to associate a request to a port. */
79 port_notify_t PortNotifier;
80 /** Opaque user data. */
81 void *pvUser;
82 /** Completion context we are assigned to. */
83 PRTFILEAIOCTXINTERNAL pCtxInt;
84 /** Magic value (RTFILEAIOREQ_MAGIC). */
85 uint32_t u32Magic;
86} RTFILEAIOREQINTERNAL;
87/** Pointer to an internal request structure. */
88typedef RTFILEAIOREQINTERNAL *PRTFILEAIOREQINTERNAL;
89
90
91/*******************************************************************************
92* Defined Constants And Macros *
93*******************************************************************************/
94/** The max number of events to get in one call. */
95#define AIO_MAXIMUM_REQUESTS_PER_CONTEXT 64
96/** Id for the wakeup event. */
97#define AIO_CONTEXT_WAKEUP_EVENT 1
98
99RTR3DECL(int) RTFileAioGetLimits(PRTFILEAIOLIMITS pAioLimits)
100{
101 int rcBSD = 0;
102 AssertPtrReturn(pAioLimits, VERR_INVALID_POINTER);
103
104 /* No limits known. */
105 pAioLimits->cReqsOutstandingMax = RTFILEAIO_UNLIMITED_REQS;
106 pAioLimits->cbBufferAlignment = 0;
107
108 return VINF_SUCCESS;
109}
110
111RTR3DECL(int) RTFileAioReqCreate(PRTFILEAIOREQ phReq)
112{
113 AssertPtrReturn(phReq, VERR_INVALID_POINTER);
114
115 PRTFILEAIOREQINTERNAL pReqInt = (PRTFILEAIOREQINTERNAL)RTMemAllocZ(sizeof(RTFILEAIOREQINTERNAL));
116 if (RT_UNLIKELY(!pReqInt))
117 return VERR_NO_MEMORY;
118
119 /* Ininitialize static parts. */
120 pReqInt->AioCB.aio_sigevent.sigev_notify = SIGEV_PORT;
121 pReqInt->AioCB.aio_sigevent.sigev_value.sival_ptr = &pReqInt->PortNotifier;
122 pReqInt->PortNotifier.portnfy_user = pReqInt;
123 pReqInt->pCtxInt = NULL;
124 pReqInt->u32Magic = RTFILEAIOREQ_MAGIC;
125 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
126
127 *phReq = (RTFILEAIOREQ)pReqInt;
128
129 return VINF_SUCCESS;
130}
131
132RTDECL(int) RTFileAioReqDestroy(RTFILEAIOREQ hReq)
133{
134 /*
135 * Validate the handle and ignore nil.
136 */
137 if (hReq == NIL_RTFILEAIOREQ)
138 return VINF_SUCCESS;
139 PRTFILEAIOREQINTERNAL pReqInt = hReq;
140 RTFILEAIOREQ_VALID_RETURN(pReqInt);
141 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
142
143 /*
144 * Trash the magic and free it.
145 */
146 ASMAtomicUoWriteU32(&pReqInt->u32Magic, ~RTFILEAIOREQ_MAGIC);
147 RTMemFree(pReqInt);
148 return VINF_SUCCESS;
149}
150
151/**
152 * Worker setting up the request.
153 */
154DECLINLINE(int) rtFileAioReqPrepareTransfer(RTFILEAIOREQ hReq, RTFILE hFile,
155 unsigned uTransferDirection,
156 RTFOFF off, void *pvBuf, size_t cbTransfer,
157 void *pvUser)
158{
159 /*
160 * Validate the input.
161 */
162 PRTFILEAIOREQINTERNAL pReqInt = hReq;
163 RTFILEAIOREQ_VALID_RETURN(pReqInt);
164 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
165 Assert(hFile != NIL_RTFILE);
166 AssertPtr(pvBuf);
167 Assert(off >= 0);
168 Assert(cbTransfer > 0);
169
170 pReqInt->AioCB.aio_lio_opcode = uTransferDirection;
171 pReqInt->AioCB.aio_fildes = RTFileToNative(hFile);
172 pReqInt->AioCB.aio_offset = off;
173 pReqInt->AioCB.aio_nbytes = cbTransfer;
174 pReqInt->AioCB.aio_buf = pvBuf;
175 pReqInt->fFlush = false;
176 pReqInt->pvUser = pvUser;
177 pReqInt->pCtxInt = NULL;
178 RTFILEAIOREQ_SET_STATE(pReqInt, PREPARED);
179
180 return VINF_SUCCESS;
181}
182
183RTDECL(int) RTFileAioReqPrepareRead(RTFILEAIOREQ hReq, RTFILE hFile, RTFOFF off,
184 void *pvBuf, size_t cbRead, void *pvUser)
185{
186 return rtFileAioReqPrepareTransfer(hReq, hFile, LIO_READ,
187 off, pvBuf, cbRead, pvUser);
188}
189
190RTDECL(int) RTFileAioReqPrepareWrite(RTFILEAIOREQ hReq, RTFILE hFile, RTFOFF off,
191 void const *pvBuf, size_t cbWrite, void *pvUser)
192{
193 return rtFileAioReqPrepareTransfer(hReq, hFile, LIO_WRITE,
194 off, (void *)pvBuf, cbWrite, pvUser);
195}
196
197RTDECL(int) RTFileAioReqPrepareFlush(RTFILEAIOREQ hReq, RTFILE hFile, void *pvUser)
198{
199 PRTFILEAIOREQINTERNAL pReqInt = (PRTFILEAIOREQINTERNAL)hReq;
200
201 RTFILEAIOREQ_VALID_RETURN(pReqInt);
202 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
203 Assert(hFile != NIL_RTFILE);
204
205 pReqInt->fFlush = true;
206 pReqInt->AioCB.aio_fildes = RTFileToNative(hFile);
207 pReqInt->AioCB.aio_offset = 0;
208 pReqInt->AioCB.aio_nbytes = 0;
209 pReqInt->AioCB.aio_buf = NULL;
210 pReqInt->pvUser = pvUser;
211 RTFILEAIOREQ_SET_STATE(pReqInt, PREPARED);
212
213 return VINF_SUCCESS;
214}
215
216RTDECL(void *) RTFileAioReqGetUser(RTFILEAIOREQ hReq)
217{
218 PRTFILEAIOREQINTERNAL pReqInt = hReq;
219 RTFILEAIOREQ_VALID_RETURN_RC(pReqInt, NULL);
220
221 return pReqInt->pvUser;
222}
223
224RTDECL(int) RTFileAioReqCancel(RTFILEAIOREQ hReq)
225{
226 PRTFILEAIOREQINTERNAL pReqInt = hReq;
227 RTFILEAIOREQ_VALID_RETURN(pReqInt);
228 RTFILEAIOREQ_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_NOT_SUBMITTED);
229
230 int rcSolaris = aio_cancel(pReqInt->AioCB.aio_fildes, &pReqInt->AioCB);
231
232 if (rcSolaris == AIO_CANCELED)
233 {
234 /*
235 * Decrement request count because the request will never arrive at the
236 * completion port.
237 */
238 AssertMsg(VALID_PTR(pReqInt->pCtxInt),
239 ("Invalid state. Request was canceled but wasn't submitted\n"));
240
241 ASMAtomicDecS32(&pReqInt->pCtxInt->cRequests);
242 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
243 return VINF_SUCCESS;
244 }
245 else if (rcSolaris == AIO_ALLDONE)
246 return VERR_FILE_AIO_COMPLETED;
247 else if (rcSolaris == AIO_NOTCANCELED)
248 return VERR_FILE_AIO_IN_PROGRESS;
249 else
250 return RTErrConvertFromErrno(errno);
251}
252
253RTDECL(int) RTFileAioReqGetRC(RTFILEAIOREQ hReq, size_t *pcbTransfered)
254{
255 PRTFILEAIOREQINTERNAL pReqInt = hReq;
256 RTFILEAIOREQ_VALID_RETURN(pReqInt);
257 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, SUBMITTED, VERR_FILE_AIO_IN_PROGRESS);
258 RTFILEAIOREQ_NOT_STATE_RETURN_RC(pReqInt, PREPARED, VERR_FILE_AIO_NOT_SUBMITTED);
259 AssertPtrNull(pcbTransfered);
260
261 int rcSol = aio_error(&pReqInt->AioCB);
262 Assert(rcSol != EINPROGRESS); /* Handled by our own state handling. */
263
264 if (rcSol == 0)
265 {
266 if (pcbTransfered)
267 *pcbTransfered = aio_return(&pReqInt->AioCB);
268 return VINF_SUCCESS;
269 }
270
271 /* An error occurred. */
272 return RTErrConvertFromErrno(rcSol);
273}
274
275RTDECL(int) RTFileAioCtxCreate(PRTFILEAIOCTX phAioCtx, uint32_t cAioReqsMax,
276 uint32_t fFlags)
277{
278 int rc = VINF_SUCCESS;
279 PRTFILEAIOCTXINTERNAL pCtxInt;
280 AssertPtrReturn(phAioCtx, VERR_INVALID_POINTER);
281 AssertReturn(!(fFlags & ~RTFILEAIOCTX_FLAGS_VALID_MASK), VERR_INVALID_PARAMETER);
282
283 pCtxInt = (PRTFILEAIOCTXINTERNAL)RTMemAllocZ(sizeof(RTFILEAIOCTXINTERNAL));
284 if (RT_UNLIKELY(!pCtxInt))
285 return VERR_NO_MEMORY;
286
287 /* Init the event handle. */
288 pCtxInt->iPort = port_create();
289 if (RT_LIKELY(pCtxInt->iPort > 0))
290 {
291 pCtxInt->fFlags = fFlags;
292 pCtxInt->u32Magic = RTFILEAIOCTX_MAGIC;
293 *phAioCtx = (RTFILEAIOCTX)pCtxInt;
294 }
295 else
296 {
297 RTMemFree(pCtxInt);
298 rc = RTErrConvertFromErrno(errno);
299 }
300
301 return rc;
302}
303
304RTDECL(int) RTFileAioCtxDestroy(RTFILEAIOCTX hAioCtx)
305{
306 /* Validate the handle and ignore nil. */
307 if (hAioCtx == NIL_RTFILEAIOCTX)
308 return VINF_SUCCESS;
309 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
310 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
311
312 /* Cannot destroy a busy context. */
313 if (RT_UNLIKELY(pCtxInt->cRequests))
314 return VERR_FILE_AIO_BUSY;
315
316 close(pCtxInt->iPort);
317 ASMAtomicUoWriteU32(&pCtxInt->u32Magic, RTFILEAIOCTX_MAGIC_DEAD);
318 RTMemFree(pCtxInt);
319
320 return VINF_SUCCESS;
321}
322
323RTDECL(uint32_t) RTFileAioCtxGetMaxReqCount(RTFILEAIOCTX hAioCtx)
324{
325 return RTFILEAIO_UNLIMITED_REQS;
326}
327
328RTDECL(int) RTFileAioCtxAssociateWithFile(RTFILEAIOCTX hAioCtx, RTFILE hFile)
329{
330 return VINF_SUCCESS;
331}
332
333RTDECL(int) RTFileAioCtxSubmit(RTFILEAIOCTX hAioCtx, PRTFILEAIOREQ pahReqs, size_t cReqs)
334{
335 /*
336 * Parameter validation.
337 */
338 int rc = VINF_SUCCESS;
339 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
340 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
341 AssertReturn(cReqs > 0, VERR_INVALID_PARAMETER);
342 AssertPtrReturn(pahReqs, VERR_INVALID_POINTER);
343 size_t i = cReqs;
344
345 do
346 {
347 int rcSol = 0;
348 size_t cReqsSubmit = 0;
349 PRTFILEAIOREQINTERNAL pReqInt;
350
351 while(i-- > 0)
352 {
353 pReqInt = pahReqs[i];
354 if (RTFILEAIOREQ_IS_NOT_VALID(pReqInt))
355 {
356 /* Undo everything and stop submitting. */
357 for (size_t iUndo = 0; iUndo < i; iUndo++)
358 {
359 pReqInt = pahReqs[iUndo];
360 RTFILEAIOREQ_SET_STATE(pReqInt, PREPARED);
361 pReqInt->pCtxInt = NULL;
362 }
363 rc = VERR_INVALID_HANDLE;
364 break;
365 }
366
367 pReqInt->PortNotifier.portnfy_port = pCtxInt->iPort;
368 pReqInt->pCtxInt = pCtxInt;
369 RTFILEAIOREQ_SET_STATE(pReqInt, SUBMITTED);
370
371 if (pReqInt->fFlush)
372 break;
373
374 cReqsSubmit++;
375 }
376
377 if (cReqsSubmit)
378 {
379 rcSol = lio_listio(LIO_NOWAIT, (struct aiocb **)pahReqs, cReqsSubmit, NULL);
380 if (RT_UNLIKELY(rcSol < 0))
381 {
382 if (rcSol == EAGAIN)
383 rc = VERR_FILE_AIO_INSUFFICIENT_RESSOURCES;
384 else
385 rc = RTErrConvertFromErrno(errno);
386
387 /* Check which requests got actually submitted and which not. */
388 for (i = 0; i < cReqs; i++)
389 {
390 pReqInt = pahReqs[i];
391 rcSol = aio_error(&pReqInt->AioCB);
392 if (rcSol == EINVAL)
393 {
394 /* Was not submitted. */
395 RTFILEAIOREQ_SET_STATE(pReqInt, PREPARED);
396 pReqInt->pCtxInt = NULL;
397 }
398 else if (rcSol != EINPROGRESS)
399 {
400 /* The request encountered an error. */
401 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
402 }
403 }
404 break;
405 }
406
407 ASMAtomicAddS32(&pCtxInt->cRequests, cReqsSubmit);
408 cReqs -= cReqsSubmit;
409 pahReqs += cReqsSubmit;
410 }
411
412 if (cReqs)
413 {
414 pReqInt = pahReqs[0];
415 RTFILEAIOREQ_VALID_RETURN(pReqInt);
416
417 /*
418 * If there are still requests left we have a flush request.
419 * lio_listio does not work with this requests so
420 * we have to use aio_fsync directly.
421 */
422 rcSol = aio_fsync(O_SYNC, &pReqInt->AioCB);
423 if (RT_UNLIKELY(rcSol < 0))
424 {
425 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
426 rc = RTErrConvertFromErrno(errno);
427 break;
428 }
429
430 ASMAtomicIncS32(&pCtxInt->cRequests);
431 cReqs--;
432 pahReqs++;
433 }
434 } while (cReqs);
435
436 return rc;
437}
438
439RTDECL(int) RTFileAioCtxWait(RTFILEAIOCTX hAioCtx, size_t cMinReqs, RTMSINTERVAL cMillies,
440 PRTFILEAIOREQ pahReqs, size_t cReqs, uint32_t *pcReqs)
441{
442 int rc = VINF_SUCCESS;
443 int cRequestsCompleted = 0;
444
445 /*
446 * Validate the parameters, making sure to always set pcReqs.
447 */
448 AssertPtrReturn(pcReqs, VERR_INVALID_POINTER);
449 *pcReqs = 0; /* always set */
450 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
451 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
452 AssertPtrReturn(pahReqs, VERR_INVALID_POINTER);
453 AssertReturn(cReqs != 0, VERR_INVALID_PARAMETER);
454 AssertReturn(cReqs >= cMinReqs, VERR_OUT_OF_RANGE);
455
456 if ( RT_UNLIKELY(ASMAtomicReadS32(&pCtxInt->cRequests) == 0)
457 && !(pCtxInt->fFlags & RTFILEAIOCTX_FLAGS_WAIT_WITHOUT_PENDING_REQUESTS))
458 return VERR_FILE_AIO_NO_REQUEST;
459
460 /*
461 * Convert the timeout if specified.
462 */
463 struct timespec *pTimeout = NULL;
464 struct timespec Timeout = {0,0};
465 uint64_t StartNanoTS = 0;
466 if (cMillies != RT_INDEFINITE_WAIT)
467 {
468 Timeout.tv_sec = cMillies / 1000;
469 Timeout.tv_nsec = cMillies % 1000 * 1000000;
470 pTimeout = &Timeout;
471 StartNanoTS = RTTimeNanoTS();
472 }
473
474 /* Wait for at least one. */
475 if (!cMinReqs)
476 cMinReqs = 1;
477
478 while ( cMinReqs
479 && RT_SUCCESS_NP(rc))
480 {
481 port_event_t aPortEvents[AIO_MAXIMUM_REQUESTS_PER_CONTEXT];
482 uint_t cRequests = cMinReqs;
483 int cRequestsToWait = RT_MIN(cReqs, AIO_MAXIMUM_REQUESTS_PER_CONTEXT);
484 int rcSol;
485 uint64_t StartTime;
486
487 rcSol = port_getn(pCtxInt->iPort, &aPortEvents[0], cRequestsToWait, &cRequests, pTimeout);
488
489 if (RT_UNLIKELY(rcSol < 0))
490 rc = RTErrConvertFromErrno(errno);
491
492 /* Process received events. */
493 for (uint_t i = 0; i < cRequests; i++)
494 {
495 if (aPortEvents[i].portev_source == PORT_SOURCE_ALERT)
496 {
497 Assert(aPortEvents[i].portev_events == AIO_CONTEXT_WAKEUP_EVENT);
498 rc = VERR_INTERRUPTED; /* We've got interrupted. */
499 /* Reset the port. */
500 port_alert(pCtxInt->iPort, PORT_ALERT_SET, 0, NULL);
501 }
502 else
503 {
504 PRTFILEAIOREQINTERNAL pReqInt = (PRTFILEAIOREQINTERNAL)aPortEvents[i].portev_user;
505 AssertPtr(pReqInt);
506 Assert(pReqInt->u32Magic == RTFILEAIOREQ_MAGIC);
507
508 /* A request has finished. */
509 pahReqs[cRequestsCompleted++] = pReqInt;
510
511 /* Mark the request as finished. */
512 RTFILEAIOREQ_SET_STATE(pReqInt, COMPLETED);
513 }
514 }
515
516 /*
517 * Done Yet? If not advance and try again.
518 */
519 if (cRequests >= cMinReqs)
520 break;
521 cMinReqs -= cRequests;
522 cReqs -= cRequests;
523
524 if (cMillies != RT_INDEFINITE_WAIT)
525 {
526 uint64_t NanoTS = RTTimeNanoTS();
527 uint64_t cMilliesElapsed = (NanoTS - StartNanoTS) / 1000000;
528
529 /* The syscall supposedly updates it, but we're paranoid. :-) */
530 if (cMilliesElapsed < cMillies)
531 {
532 Timeout.tv_sec = (cMillies - (RTMSINTERVAL)cMilliesElapsed) / 1000;
533 Timeout.tv_nsec = (cMillies - (RTMSINTERVAL)cMilliesElapsed) % 1000 * 1000000;
534 }
535 else
536 {
537 Timeout.tv_sec = 0;
538 Timeout.tv_nsec = 0;
539 }
540 }
541 }
542
543 /*
544 * Update the context state and set the return value.
545 */
546 *pcReqs = cRequestsCompleted;
547 ASMAtomicSubS32(&pCtxInt->cRequests, cRequestsCompleted);
548
549 return rc;
550}
551
552RTDECL(int) RTFileAioCtxWakeup(RTFILEAIOCTX hAioCtx)
553{
554 int rc = VINF_SUCCESS;
555 PRTFILEAIOCTXINTERNAL pCtxInt = hAioCtx;
556 RTFILEAIOCTX_VALID_RETURN(pCtxInt);
557
558 rc = port_alert(pCtxInt->iPort, PORT_ALERT_UPDATE, AIO_CONTEXT_WAKEUP_EVENT, NULL);
559 if (RT_UNLIKELY((rc < 0) && (errno != EBUSY)))
560 return RTErrConvertFromErrno(errno);
561
562 return VINF_SUCCESS;
563}
564
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette