1 /* Handle general operations.
2 Copyright (C) 1997, 1998 Free Software Foundation, Inc.
3 This file is part of the GNU C Library.
4 Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997.
6 The GNU C Library is free software; you can redistribute it and/or
7 modify it under the terms of the GNU Library General Public License as
8 published by the Free Software Foundation; either version 2 of the
9 License, or (at your option) any later version.
11 The GNU C Library is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 Library General Public License for more details.
16 You should have received a copy of the GNU Library General Public
17 License along with the GNU C Library; see the file COPYING.LIB. If not,
18 write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 Boston, MA 02111-1307, USA. */
31 /* Pool of request list entries. */
32 static struct requestlist
**pool
;
34 /* Number of total and allocated pool entries. */
35 static size_t pool_tab_size
;
36 static size_t pool_size
;
38 /* We implement a two dimensional array but allocate each row separately.
39 The macro below determines how many entries should be used per row.
40 It should better be a power of two. */
41 #define ENTRIES_PER_ROW 16
43 /* The row table is incremented in units of this. */
46 /* List of available entries. */
47 static struct requestlist
*freelist
;
49 /* List of request waiting to be processed. */
50 static struct requestlist
*runlist
;
52 /* Structure list of all currently processed requests. */
53 static struct requestlist
*requests
;
55 /* Number of threads currently running. */
59 /* These are the values used to optimize the use of AIO. The user can
60 overwrite them by using the `aio_init' function. */
61 static struct aioinit optim
=
63 20, /* int aio_threads; Maximal number of threads. */
64 256, /* int aio_num; Number of expected simultanious requests. */
73 /* Since the list is global we need a mutex protecting it. */
74 pthread_mutex_t __aio_requests_mutex
= PTHREAD_RECURSIVE_MUTEX_INITIALIZER_NP
;
77 /* Functions to handle request list pool. */
78 static struct requestlist
*
81 struct requestlist
*result
;
85 struct requestlist
*new_row
;
88 /* Compute new size. */
89 new_size
= pool_size
? pool_size
+ ENTRIES_PER_ROW
: optim
.aio_num
;
91 if ((new_size
/ ENTRIES_PER_ROW
) >= pool_tab_size
)
93 size_t new_tab_size
= new_size
/ ENTRIES_PER_ROW
;
94 struct requestlist
**new_tab
;
96 new_tab
= (struct requestlist
**)
97 realloc (pool
, (new_tab_size
* sizeof (struct requestlist
*)));
102 pool_tab_size
= new_tab_size
;
110 new_row
= (struct requestlist
*)
111 calloc (new_size
, sizeof (struct requestlist
));
116 for (cnt
= 0; cnt
< new_size
/ ENTRIES_PER_ROW
; ++cnt
)
117 pool
[cnt
] = &new_row
[cnt
* ENTRIES_PER_ROW
];
121 /* Allocat one new row. */
122 new_row
= (struct requestlist
*)
123 calloc (ENTRIES_PER_ROW
, sizeof (struct requestlist
));
127 pool
[new_size
/ ENTRIES_PER_ROW
] = new_row
;
130 /* Put all the new entries in the freelist. */
133 new_row
->next_prio
= freelist
;
134 freelist
= new_row
++;
136 while (++pool_size
< new_size
);
140 freelist
= freelist
->next_prio
;
147 __aio_free_request (struct requestlist
*elem
)
150 elem
->next_prio
= freelist
;
156 __aio_find_req (aiocb_union
*elem
)
158 struct requestlist
*runp
= requests
;
159 int fildes
= elem
->aiocb
.aio_fildes
;
161 while (runp
!= NULL
&& runp
->aiocbp
->aiocb
.aio_fildes
< fildes
)
162 runp
= runp
->next_fd
;
165 if (runp
->aiocbp
->aiocb
.aio_fildes
!= fildes
)
168 while (runp
!= NULL
&& runp
->aiocbp
!= elem
)
169 runp
= runp
->next_prio
;
176 __aio_find_req_fd (int fildes
)
178 struct requestlist
*runp
= requests
;
180 while (runp
!= NULL
&& runp
->aiocbp
->aiocb
.aio_fildes
< fildes
)
181 runp
= runp
->next_fd
;
183 return (runp
!= NULL
&& runp
->aiocbp
->aiocb
.aio_fildes
== fildes
188 /* The thread handler. */
189 static void *handle_fildes_io (void *arg
);
192 /* User optimization. */
194 __aio_init (const struct aioinit
*init
)
197 pthread_mutex_lock (&__aio_requests_mutex
);
199 /* Only allow writing new values if the table is not yet allocated. */
202 optim
.aio_threads
= init
->aio_threads
< 1 ? 1 : init
->aio_threads
;
203 optim
.aio_num
= (init
->aio_num
< ENTRIES_PER_ROW
205 : init
->aio_num
& ~ENTRIES_PER_ROW
);
208 /* Release the mutex. */
209 pthread_mutex_unlock (&__aio_requests_mutex
);
211 weak_alias (__aio_init
, aio_init
)
214 /* The main function of the async I/O handling. It enqueues requests
215 and if necessary starts and handles threads. */
217 __aio_enqueue_request (aiocb_union
*aiocbp
, int operation
)
221 struct sched_param param
;
222 struct requestlist
*last
, *runp
, *newp
;
225 if (aiocbp
->aiocb
.aio_reqprio
< 0
226 || aiocbp
->aiocb
.aio_reqprio
> AIO_PRIO_DELTA_MAX
)
228 /* Invalid priority value. */
229 __set_errno (EINVAL
);
230 aiocbp
->aiocb
.__error_code
= EINVAL
;
231 aiocbp
->aiocb
.__return_value
= -1;
235 /* Compute priority for this request. */
236 pthread_getschedparam (pthread_self (), &policy
, ¶m
);
237 prio
= param
.sched_priority
- aiocbp
->aiocb
.aio_reqprio
;
240 pthread_mutex_lock (&__aio_requests_mutex
);
244 /* First look whether the current file descriptor is currently
247 && runp
->aiocbp
->aiocb
.aio_fildes
< aiocbp
->aiocb
.aio_fildes
)
250 runp
= runp
->next_fd
;
253 /* Get a new element for the waiting list. */
257 __set_errno (EAGAIN
);
258 pthread_mutex_unlock (&__aio_requests_mutex
);
261 newp
->aiocbp
= aiocbp
;
262 newp
->waiting
= NULL
;
264 aiocbp
->aiocb
.__abs_prio
= prio
;
265 aiocbp
->aiocb
.__policy
= policy
;
266 aiocbp
->aiocb
.aio_lio_opcode
= operation
;
267 aiocbp
->aiocb
.__error_code
= EINPROGRESS
;
268 aiocbp
->aiocb
.__return_value
= 0;
271 && runp
->aiocbp
->aiocb
.aio_fildes
== aiocbp
->aiocb
.aio_fildes
)
273 /* The current file descriptor is worked on. It makes no sense
274 to start another thread since this new thread would fight
275 with the running thread for the resources. But we also cannot
276 say that the thread processing this desriptor shall immediately
277 after finishing the current job process this request if there
278 are other threads in the running queue which have a higher
281 /* Simply enqueue it after the running one according to the
283 while (runp
->next_prio
!= NULL
284 && runp
->next_prio
->aiocbp
->aiocb
.__abs_prio
>= prio
)
285 runp
= runp
->next_prio
;
287 newp
->next_prio
= runp
->next_prio
;
288 runp
->next_prio
= newp
;
294 /* Enqueue this request for a new descriptor. */
297 newp
->last_fd
= NULL
;
298 newp
->next_fd
= requests
;
299 if (requests
!= NULL
)
300 requests
->last_fd
= newp
;
305 newp
->next_fd
= last
->next_fd
;
306 newp
->last_fd
= last
;
307 last
->next_fd
= newp
;
308 if (newp
->next_fd
!= NULL
)
309 newp
->next_fd
->last_fd
= newp
;
312 newp
->next_prio
= NULL
;
317 /* We try to create a new thread for this file descriptor. The
318 function which gets called will handle all available requests
319 for this descriptor and when all are processed it will
322 If no new thread can be created or if the specified limit of
323 threads for AIO is reached we queue the request. */
325 /* See if we can create a thread. */
326 if (nthreads
< optim
.aio_threads
)
331 /* Make sure the thread is created detached. */
332 pthread_attr_init (&attr
);
333 pthread_attr_setdetachstate (&attr
, PTHREAD_CREATE_DETACHED
);
335 /* Now try to start a thread. */
336 if (pthread_create (&thid
, &attr
, handle_fildes_io
, newp
) == 0)
338 /* We managed to enqueue the request. All errors which can
339 happen now can be recognized by calls to `aio_return' and
344 else if (nthreads
== 0)
345 /* We cannot create a thread in the moment and there is
346 also no thread running. This is a problem. `errno' is
347 set to EAGAIN if this is only a temporary problem. */
352 /* Enqueue the request in the run queue if it is not yet running. */
353 if (running
< yes
&& result
== 0)
355 if (runlist
== NULL
|| runlist
->aiocbp
->aiocb
.__abs_prio
< prio
)
357 newp
->next_run
= runlist
;
364 while (runp
->next_run
!= NULL
365 && runp
->next_run
->aiocbp
->aiocb
.__abs_prio
>= prio
)
366 runp
= runp
->next_run
;
368 newp
->next_run
= runp
->next_run
;
369 runp
->next_run
= newp
;
374 newp
->running
= running
;
377 /* Something went wrong. */
378 __aio_free_request (newp
);
382 /* Release the mutex. */
383 pthread_mutex_unlock (&__aio_requests_mutex
);
390 handle_fildes_io (void *arg
)
392 pthread_t self
= pthread_self ();
393 struct sched_param param
;
394 struct requestlist
*runp
= (struct requestlist
*) arg
;
399 pthread_getschedparam (self
, &policy
, ¶m
);
403 /* Update our variables. */
404 aiocbp
= runp
->aiocbp
;
405 fildes
= aiocbp
->aiocb
.aio_fildes
;
407 /* Change the priority to the requested value (if necessary). */
408 if (aiocbp
->aiocb
.__abs_prio
!= param
.sched_priority
409 || aiocbp
->aiocb
.__policy
!= policy
)
411 param
.sched_priority
= aiocbp
->aiocb
.__abs_prio
;
412 policy
= aiocbp
->aiocb
.__policy
;
413 pthread_setschedparam (self
, policy
, ¶m
);
416 /* Process request pointed to by RUNP. We must not be disturbed
418 if ((aiocbp
->aiocb
.aio_lio_opcode
& 127) == LIO_READ
)
420 if (aiocbp
->aiocb
.aio_lio_opcode
& 128)
421 aiocbp
->aiocb
.__return_value
=
422 TEMP_FAILURE_RETRY (__pread64 (fildes
,
423 (void *) aiocbp
->aiocb64
.aio_buf
,
424 aiocbp
->aiocb64
.aio_nbytes
,
425 aiocbp
->aiocb64
.aio_offset
));
427 aiocbp
->aiocb
.__return_value
=
428 TEMP_FAILURE_RETRY (pread (fildes
,
429 (void *) aiocbp
->aiocb
.aio_buf
,
430 aiocbp
->aiocb
.aio_nbytes
,
431 aiocbp
->aiocb
.aio_offset
));
433 else if ((aiocbp
->aiocb
.aio_lio_opcode
& 127) == LIO_WRITE
)
435 if (aiocbp
->aiocb
.aio_lio_opcode
& 128)
436 aiocbp
->aiocb
.__return_value
=
437 TEMP_FAILURE_RETRY (__pwrite64 (fildes
,
438 (const void *) aiocbp
->aiocb64
.aio_buf
,
439 aiocbp
->aiocb64
.aio_nbytes
,
440 aiocbp
->aiocb64
.aio_offset
));
442 aiocbp
->aiocb
.__return_value
=
443 TEMP_FAILURE_RETRY (pwrite (fildes
,
444 (const void *) aiocbp
->aiocb
.aio_buf
,
445 aiocbp
->aiocb
.aio_nbytes
,
446 aiocbp
->aiocb
.aio_offset
));
448 else if (aiocbp
->aiocb
.aio_lio_opcode
== LIO_DSYNC
)
449 aiocbp
->aiocb
.__return_value
= TEMP_FAILURE_RETRY (fdatasync (fildes
));
450 else if (aiocbp
->aiocb
.aio_lio_opcode
== LIO_SYNC
)
451 aiocbp
->aiocb
.__return_value
= TEMP_FAILURE_RETRY (fsync (fildes
));
454 /* This is an invalid opcode. */
455 aiocbp
->aiocb
.__return_value
= -1;
456 __set_errno (EINVAL
);
460 pthread_mutex_lock (&__aio_requests_mutex
);
462 if (aiocbp
->aiocb
.__return_value
== -1)
463 aiocbp
->aiocb
.__error_code
= errno
;
465 aiocbp
->aiocb
.__error_code
= 0;
467 /* Send the signal to notify about finished processing of the
471 /* Now dequeue the current request. */
472 if (runp
->next_prio
== NULL
)
474 /* No outstanding request for this descriptor. Remove this
475 descriptor from the list. */
476 if (runp
->next_fd
!= NULL
)
477 runp
->next_fd
->last_fd
= runp
->last_fd
;
478 if (runp
->last_fd
!= NULL
)
479 runp
->last_fd
->next_fd
= runp
->next_fd
;
481 requests
= runp
->next_fd
;
485 runp
->next_prio
->last_fd
= runp
->last_fd
;
486 runp
->next_prio
->next_fd
= runp
->next_fd
;
487 runp
->next_prio
->running
= yes
;
488 if (runp
->next_fd
!= NULL
)
489 runp
->next_fd
->last_fd
= runp
->next_prio
;
490 if (runp
->last_fd
!= NULL
)
491 runp
->last_fd
->next_fd
= runp
->next_prio
;
493 requests
= runp
->next_prio
;
496 /* Free the old element. */
497 __aio_free_request (runp
);
502 /* We must not run requests which are not marked `running'. */
503 if (runp
->running
== yes
)
504 runlist
= runp
->next_run
;
507 struct requestlist
*old
;
512 runp
= runp
->next_run
;
514 while (runp
!= NULL
&& runp
->running
!= yes
);
517 old
->next_run
= runp
->next_run
;
521 /* If no request to work on we will stop the thread. */
525 runp
->running
= allocated
;
527 /* Release the mutex. */
528 pthread_mutex_unlock (&__aio_requests_mutex
);
530 while (runp
!= NULL
);
536 /* Free allocated resources. */
538 __attribute__ ((unused
))
543 /* The first block of rows as specified in OPTIM is allocated in
547 for (row
= optim
.aio_num
/ ENTRIES_PER_ROW
; row
< pool_tab_size
; ++row
)
553 text_set_element (__libc_subfreeres
, free_res
);