sysdeps/pthread/aio_misc.c

   1 /* Handle general operations.
   2    Copyright (C) 1997-2001, 2003, 2004, 2006, 2007, 2009, 2011
   3    Free Software Foundation, Inc.
   4    This file is part of the GNU C Library.
   5    Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997.
   6
   7    The GNU C Library is free software; you can redistribute it and/or
   8    modify it under the terms of the GNU Lesser General Public
   9    License as published by the Free Software Foundation; either
  10    version 2.1 of the License, or (at your option) any later version.
  11
  12    The GNU C Library is distributed in the hope that it will be useful,
  13    but WITHOUT ANY WARRANTY; without even the implied warranty of
  14    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  15    Lesser General Public License for more details.
  16
  17    You should have received a copy of the GNU Lesser General Public
  18    License along with the GNU C Library; if not, write to the Free
  19    Software Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
  20    02111-1307 USA.  */
  21
  22 #include <aio.h>
  23 #include <assert.h>
  24 #include <errno.h>
  25 #include <limits.h>
  26 #include <pthread.h>
  27 #include <stdlib.h>
  28 #include <unistd.h>
  29 #include <sys/param.h>
  30 #include <sys/stat.h>
  31 #include <sys/time.h>
  32 #include <aio_misc.h>
  33
  34 #ifndef aio_create_helper_thread
  35 # define aio_create_helper_thread __aio_create_helper_thread
  36
  37 extern inline int
  38 __aio_create_helper_thread (pthread_t *threadp, void *(*tf) (void *), void *arg)
  39 {
  40   pthread_attr_t attr;
  41
  42   /* Make sure the thread is created detached.  */
  43   pthread_attr_init (&attr);
  44   pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
  45
  46   int ret = pthread_create (threadp, &attr, tf, arg);
  47
  48   (void) pthread_attr_destroy (&attr);
  49   return ret;
  50 }
  51 #endif
  52
  53 static void add_request_to_runlist (struct requestlist *newrequest);
  54
  55 /* Pool of request list entries.  */
  56 static struct requestlist **pool;
  57
  58 /* Number of total and allocated pool entries.  */
  59 static size_t pool_max_size;
  60 static size_t pool_size;
  61
  62 /* We implement a two dimensional array but allocate each row separately.
  63    The macro below determines how many entries should be used per row.
  64    It should better be a power of two.  */
  65 #define ENTRIES_PER_ROW 32
  66
  67 /* How many rows we allocate at once.  */
  68 #define ROWS_STEP       8
  69
  70 /* List of available entries.  */
  71 static struct requestlist *freelist;
  72
  73 /* List of request waiting to be processed.  */
  74 static struct requestlist *runlist;
  75
  76 /* Structure list of all currently processed requests.  */
  77 static struct requestlist *requests;
  78
  79 /* Number of threads currently running.  */
  80 static int nthreads;
  81
  82 /* Number of threads waiting for work to arrive. */
  83 static int idle_thread_count;
  84
  85
  86 /* These are the values used to optimize the use of AIO.  The user can
  87    overwrite them by using the `aio_init' function.  */
  88 static struct aioinit optim =
  89 {
  90   20,   /* int aio_threads;     Maximal number of threads.  */
  91   64,   /* int aio_num;         Number of expected simultaneous requests. */
  92   0,
  93   0,
  94   0,
  95   0,
  96   1,
  97   0
  98 };
  99
 100
 101 /* Since the list is global we need a mutex protecting it.  */
 102 pthread_mutex_t __aio_requests_mutex = PTHREAD_RECURSIVE_MUTEX_INITIALIZER_NP;
 103
 104 /* When you add a request to the list and there are idle threads present,
 105    you signal this condition variable. When a thread finishes work, it waits
 106    on this condition variable for a time before it actually exits. */
 107 pthread_cond_t __aio_new_request_notification = PTHREAD_COND_INITIALIZER;
 108
 109
 110 /* Functions to handle request list pool.  */
 111 static struct requestlist *
 112 get_elem (void)
 113 {
 114   struct requestlist *result;
 115
 116   if (freelist == NULL)
 117     {
 118       struct requestlist *new_row;
 119       int cnt;
 120
 121       assert (sizeof (struct aiocb) == sizeof (struct aiocb64));
 122
 123       if (pool_size + 1 >= pool_max_size)
 124         {
 125           size_t new_max_size = pool_max_size + ROWS_STEP;
 126           struct requestlist **new_tab;
 127
 128           new_tab = (struct requestlist **)
 129             realloc (pool, new_max_size * sizeof (struct requestlist *));
 130
 131           if (new_tab == NULL)
 132             return NULL;
 133
 134           pool_max_size = new_max_size;
 135           pool = new_tab;
 136         }
 137
 138       /* Allocate the new row.  */
 139       cnt = pool_size == 0 ? optim.aio_num : ENTRIES_PER_ROW;
 140       new_row = (struct requestlist *) calloc (cnt,
 141                                                sizeof (struct requestlist));
 142       if (new_row == NULL)
 143         return NULL;
 144
 145       pool[pool_size++] = new_row;
 146
 147       /* Put all the new entries in the freelist.  */
 148       do
 149         {
 150           new_row->next_prio = freelist;
 151           freelist = new_row++;
 152         }
 153       while (--cnt > 0);
 154     }
 155
 156   result = freelist;
 157   freelist = freelist->next_prio;
 158
 159   return result;
 160 }
 161
 162
 163 void
 164 internal_function
 165 __aio_free_request (struct requestlist *elem)
 166 {
 167   elem->running = no;
 168   elem->next_prio = freelist;
 169   freelist = elem;
 170 }
 171
 172
 173 struct requestlist *
 174 internal_function
 175 __aio_find_req (aiocb_union *elem)
 176 {
 177   struct requestlist *runp = requests;
 178   int fildes = elem->aiocb.aio_fildes;
 179
 180   while (runp != NULL && runp->aiocbp->aiocb.aio_fildes < fildes)
 181     runp = runp->next_fd;
 182
 183   if (runp != NULL)
 184     {
 185       if (runp->aiocbp->aiocb.aio_fildes != fildes)
 186         runp = NULL;
 187       else
 188         while (runp != NULL && runp->aiocbp != elem)
 189           runp = runp->next_prio;
 190     }
 191
 192   return runp;
 193 }
 194
 195
 196 struct requestlist *
 197 internal_function
 198 __aio_find_req_fd (int fildes)
 199 {
 200   struct requestlist *runp = requests;
 201
 202   while (runp != NULL && runp->aiocbp->aiocb.aio_fildes < fildes)
 203     runp = runp->next_fd;
 204
 205   return (runp != NULL && runp->aiocbp->aiocb.aio_fildes == fildes
 206           ? runp : NULL);
 207 }
 208
 209
 210 void
 211 internal_function
 212 __aio_remove_request (struct requestlist *last, struct requestlist *req,
 213                       int all)
 214 {
 215   assert (req->running == yes || req->running == queued
 216           || req->running == done);
 217
 218   if (last != NULL)
 219     last->next_prio = all ? NULL : req->next_prio;
 220   else
 221     {
 222       if (all || req->next_prio == NULL)
 223         {
 224           if (req->last_fd != NULL)
 225             req->last_fd->next_fd = req->next_fd;
 226           else
 227             requests = req->next_fd;
 228           if (req->next_fd != NULL)
 229             req->next_fd->last_fd = req->last_fd;
 230         }
 231       else
 232         {
 233           if (req->last_fd != NULL)
 234             req->last_fd->next_fd = req->next_prio;
 235           else
 236             requests = req->next_prio;
 237
 238           if (req->next_fd != NULL)
 239             req->next_fd->last_fd = req->next_prio;
 240
 241           req->next_prio->last_fd = req->last_fd;
 242           req->next_prio->next_fd = req->next_fd;
 243
 244           /* Mark this entry as runnable.  */
 245           req->next_prio->running = yes;
 246         }
 247
 248       if (req->running == yes)
 249         {
 250           struct requestlist *runp = runlist;
 251
 252           last = NULL;
 253           while (runp != NULL)
 254             {
 255               if (runp == req)
 256                 {
 257                   if (last == NULL)
 258                     runlist = runp->next_run;
 259                   else
 260                     last->next_run = runp->next_run;
 261                   break;
 262                 }
 263               last = runp;
 264               runp = runp->next_run;
 265             }
 266         }
 267     }
 268 }
 269
 270
 271 /* The thread handler.  */
 272 static void *handle_fildes_io (void *arg);
 273
 274
 275 /* User optimization.  */
 276 void
 277 __aio_init (const struct aioinit *init)
 278 {
 279   /* Get the mutex.  */
 280   pthread_mutex_lock (&__aio_requests_mutex);
 281
 282   /* Only allow writing new values if the table is not yet allocated.  */
 283   if (pool == NULL)
 284     {
 285       optim.aio_threads = init->aio_threads < 1 ? 1 : init->aio_threads;
 286       assert (powerof2 (ENTRIES_PER_ROW));
 287       optim.aio_num = (init->aio_num < ENTRIES_PER_ROW
 288                        ? ENTRIES_PER_ROW
 289                        : init->aio_num & ~(ENTRIES_PER_ROW - 1));
 290     }
 291
 292   if (init->aio_idle_time != 0)
 293     optim.aio_idle_time = init->aio_idle_time;
 294
 295   /* Release the mutex.  */
 296   pthread_mutex_unlock (&__aio_requests_mutex);
 297 }
 298 weak_alias (__aio_init, aio_init)
 299
 300
 301 /* The main function of the async I/O handling.  It enqueues requests
 302    and if necessary starts and handles threads.  */
 303 struct requestlist *
 304 internal_function
 305 __aio_enqueue_request (aiocb_union *aiocbp, int operation)
 306 {
 307   int result = 0;
 308   int policy, prio;
 309   struct sched_param param;
 310   struct requestlist *last, *runp, *newp;
 311   int running = no;
 312
 313   if (operation == LIO_SYNC || operation == LIO_DSYNC)
 314     aiocbp->aiocb.aio_reqprio = 0;
 315   else if (aiocbp->aiocb.aio_reqprio < 0
 316            || aiocbp->aiocb.aio_reqprio > AIO_PRIO_DELTA_MAX)
 317     {
 318       /* Invalid priority value.  */
 319       __set_errno (EINVAL);
 320       aiocbp->aiocb.__error_code = EINVAL;
 321       aiocbp->aiocb.__return_value = -1;
 322       return NULL;
 323     }
 324
 325   /* Compute priority for this request.  */
 326   pthread_getschedparam (pthread_self (), &policy, &param);
 327   prio = param.sched_priority - aiocbp->aiocb.aio_reqprio;
 328
 329   /* Get the mutex.  */
 330   pthread_mutex_lock (&__aio_requests_mutex);
 331
 332   last = NULL;
 333   runp = requests;
 334   /* First look whether the current file descriptor is currently
 335      worked with.  */
 336   while (runp != NULL
 337          && runp->aiocbp->aiocb.aio_fildes < aiocbp->aiocb.aio_fildes)
 338     {
 339       last = runp;
 340       runp = runp->next_fd;
 341     }
 342
 343   /* Get a new element for the waiting list.  */
 344   newp = get_elem ();
 345   if (newp == NULL)
 346     {
 347       pthread_mutex_unlock (&__aio_requests_mutex);
 348       __set_errno (EAGAIN);
 349       return NULL;
 350     }
 351   newp->aiocbp = aiocbp;
 352 #ifdef BROKEN_THREAD_SIGNALS
 353   newp->caller_pid = (aiocbp->aiocb.aio_sigevent.sigev_notify == SIGEV_SIGNAL
 354                       ? getpid () : 0);
 355 #endif
 356   newp->waiting = NULL;
 357
 358   aiocbp->aiocb.__abs_prio = prio;
 359   aiocbp->aiocb.__policy = policy;
 360   aiocbp->aiocb.aio_lio_opcode = operation;
 361   aiocbp->aiocb.__error_code = EINPROGRESS;
 362   aiocbp->aiocb.__return_value = 0;
 363
 364   if (runp != NULL
 365       && runp->aiocbp->aiocb.aio_fildes == aiocbp->aiocb.aio_fildes)
 366     {
 367       /* The current file descriptor is worked on.  It makes no sense
 368          to start another thread since this new thread would fight
 369          with the running thread for the resources.  But we also cannot
 370          say that the thread processing this desriptor shall immediately
 371          after finishing the current job process this request if there
 372          are other threads in the running queue which have a higher
 373          priority.  */
 374
 375       /* Simply enqueue it after the running one according to the
 376          priority.  */
 377       last = NULL;
 378       while (runp->next_prio != NULL
 379              && runp->next_prio->aiocbp->aiocb.__abs_prio >= prio)
 380         {
 381           last = runp;
 382           runp = runp->next_prio;
 383         }
 384
 385       newp->next_prio = runp->next_prio;
 386       runp->next_prio = newp;
 387
 388       running = queued;
 389     }
 390   else
 391     {
 392       running = yes;
 393       /* Enqueue this request for a new descriptor.  */
 394       if (last == NULL)
 395         {
 396           newp->last_fd = NULL;
 397           newp->next_fd = requests;
 398           if (requests != NULL)
 399             requests->last_fd = newp;
 400           requests = newp;
 401         }
 402       else
 403         {
 404           newp->next_fd = last->next_fd;
 405           newp->last_fd = last;
 406           last->next_fd = newp;
 407           if (newp->next_fd != NULL)
 408             newp->next_fd->last_fd = newp;
 409         }
 410
 411       newp->next_prio = NULL;
 412       last = NULL;
 413     }
 414
 415   if (running == yes)
 416     {
 417       /* We try to create a new thread for this file descriptor.  The
 418          function which gets called will handle all available requests
 419          for this descriptor and when all are processed it will
 420          terminate.
 421
 422          If no new thread can be created or if the specified limit of
 423          threads for AIO is reached we queue the request.  */
 424
 425       /* See if we need to and are able to create a thread.  */
 426       if (nthreads < optim.aio_threads && idle_thread_count == 0)
 427         {
 428           pthread_t thid;
 429
 430           running = newp->running = allocated;
 431
 432           /* Now try to start a thread.  */
 433           result = aio_create_helper_thread (&thid, handle_fildes_io, newp);
 434           if (result == 0)
 435             /* We managed to enqueue the request.  All errors which can
 436                happen now can be recognized by calls to `aio_return' and
 437                `aio_error'.  */
 438             ++nthreads;
 439           else
 440             {
 441               /* Reset the running flag.  The new request is not running.  */
 442               running = newp->running = yes;
 443
 444               if (nthreads == 0)
 445                 {
 446                   /* We cannot create a thread in the moment and there is
 447                      also no thread running.  This is a problem.  `errno' is
 448                      set to EAGAIN if this is only a temporary problem.  */
 449                   __aio_remove_request (last, newp, 0);
 450                 }
 451               else
 452                 result = 0;
 453             }
 454         }
 455     }
 456
 457   /* Enqueue the request in the run queue if it is not yet running.  */
 458   if (running == yes && result == 0)
 459     {
 460       add_request_to_runlist (newp);
 461
 462       /* If there is a thread waiting for work, then let it know that we
 463          have just given it something to do. */
 464       if (idle_thread_count > 0)
 465         pthread_cond_signal (&__aio_new_request_notification);
 466     }
 467
 468   if (result == 0)
 469     newp->running = running;
 470   else
 471     {
 472       /* Something went wrong.  */
 473       __aio_free_request (newp);
 474       aiocbp->aiocb.__error_code = result;
 475       __set_errno (result);
 476       newp = NULL;
 477     }
 478
 479   /* Release the mutex.  */
 480   pthread_mutex_unlock (&__aio_requests_mutex);
 481
 482   return newp;
 483 }
 484
 485
 486 static void *
 487 handle_fildes_io (void *arg)
 488 {
 489   pthread_t self = pthread_self ();
 490   struct sched_param param;
 491   struct requestlist *runp = (struct requestlist *) arg;
 492   aiocb_union *aiocbp;
 493   int policy;
 494   int fildes;
 495
 496   pthread_getschedparam (self, &policy, &param);
 497
 498   do
 499     {
 500       /* If runp is NULL, then we were created to service the work queue
 501          in general, not to handle any particular request. In that case we
 502          skip the "do work" stuff on the first pass, and go directly to the
 503          "get work off the work queue" part of this loop, which is near the
 504          end. */
 505       if (runp == NULL)
 506         pthread_mutex_lock (&__aio_requests_mutex);
 507       else
 508         {
 509           /* Hopefully this request is marked as running.  */
 510           assert (runp->running == allocated);
 511
 512           /* Update our variables.  */
 513           aiocbp = runp->aiocbp;
 514           fildes = aiocbp->aiocb.aio_fildes;
 515
 516           /* Change the priority to the requested value (if necessary).  */
 517           if (aiocbp->aiocb.__abs_prio != param.sched_priority
 518               || aiocbp->aiocb.__policy != policy)
 519             {
 520               param.sched_priority = aiocbp->aiocb.__abs_prio;
 521               policy = aiocbp->aiocb.__policy;
 522               pthread_setschedparam (self, policy, &param);
 523             }
 524
 525           /* Process request pointed to by RUNP.  We must not be disturbed
 526              by signals.  */
 527           if ((aiocbp->aiocb.aio_lio_opcode & 127) == LIO_READ)
 528             {
 529               if (sizeof (off_t) != sizeof (off64_t)
 530                   && aiocbp->aiocb.aio_lio_opcode & 128)
 531                 aiocbp->aiocb.__return_value =
 532                   TEMP_FAILURE_RETRY (__pread64 (fildes, (void *)
 533                                                  aiocbp->aiocb64.aio_buf,
 534                                                  aiocbp->aiocb64.aio_nbytes,
 535                                                  aiocbp->aiocb64.aio_offset));
 536               else
 537                 aiocbp->aiocb.__return_value =
 538                   TEMP_FAILURE_RETRY (pread (fildes,
 539                                              (void *) aiocbp->aiocb.aio_buf,
 540                                              aiocbp->aiocb.aio_nbytes,
 541                                              aiocbp->aiocb.aio_offset));
 542
 543               if (aiocbp->aiocb.__return_value == -1 && errno == ESPIPE)
 544                 /* The Linux kernel is different from others.  It returns
 545                    ESPIPE if using pread on a socket.  Other platforms
 546                    simply ignore the offset parameter and behave like
 547                    read.  */
 548                 aiocbp->aiocb.__return_value =
 549                   TEMP_FAILURE_RETRY (read (fildes,
 550                                             (void *) aiocbp->aiocb64.aio_buf,
 551                                             aiocbp->aiocb64.aio_nbytes));
 552             }
 553           else if ((aiocbp->aiocb.aio_lio_opcode & 127) == LIO_WRITE)
 554             {
 555               if (sizeof (off_t) != sizeof (off64_t)
 556                   && aiocbp->aiocb.aio_lio_opcode & 128)
 557                 aiocbp->aiocb.__return_value =
 558                   TEMP_FAILURE_RETRY (__pwrite64 (fildes, (const void *)
 559                                                   aiocbp->aiocb64.aio_buf,
 560                                                   aiocbp->aiocb64.aio_nbytes,
 561                                                   aiocbp->aiocb64.aio_offset));
 562               else
 563                 aiocbp->aiocb.__return_value =
 564                   TEMP_FAILURE_RETRY (__libc_pwrite (fildes, (const void *)
 565                                               aiocbp->aiocb.aio_buf,
 566                                               aiocbp->aiocb.aio_nbytes,
 567                                               aiocbp->aiocb.aio_offset));
 568
 569               if (aiocbp->aiocb.__return_value == -1 && errno == ESPIPE)
 570                 /* The Linux kernel is different from others.  It returns
 571                    ESPIPE if using pwrite on a socket.  Other platforms
 572                    simply ignore the offset parameter and behave like
 573                    write.  */
 574                 aiocbp->aiocb.__return_value =
 575                   TEMP_FAILURE_RETRY (write (fildes,
 576                                              (void *) aiocbp->aiocb64.aio_buf,
 577                                              aiocbp->aiocb64.aio_nbytes));
 578             }
 579           else if (aiocbp->aiocb.aio_lio_opcode == LIO_DSYNC)
 580             aiocbp->aiocb.__return_value =
 581               TEMP_FAILURE_RETRY (fdatasync (fildes));
 582           else if (aiocbp->aiocb.aio_lio_opcode == LIO_SYNC)
 583             aiocbp->aiocb.__return_value =
 584               TEMP_FAILURE_RETRY (fsync (fildes));
 585           else
 586             {
 587               /* This is an invalid opcode.  */
 588               aiocbp->aiocb.__return_value = -1;
 589               __set_errno (EINVAL);
 590             }
 591
 592           /* Get the mutex.  */
 593           pthread_mutex_lock (&__aio_requests_mutex);
 594
 595           /* In theory we would need here a write memory barrier since the
 596              callers test using aio_error() whether the request finished
 597              and once this value != EINPROGRESS the field __return_value
 598              must be committed to memory.
 599
 600              But since the pthread_mutex_lock call involves write memory
 601              barriers as well it is not necessary.  */
 602
 603           if (aiocbp->aiocb.__return_value == -1)
 604             aiocbp->aiocb.__error_code = errno;
 605           else
 606             aiocbp->aiocb.__error_code = 0;
 607
 608           /* Send the signal to notify about finished processing of the
 609              request.  */
 610           __aio_notify (runp);
 611
 612           /* For debugging purposes we reset the running flag of the
 613              finished request.  */
 614           assert (runp->running == allocated);
 615           runp->running = done;
 616
 617           /* Now dequeue the current request.  */
 618           __aio_remove_request (NULL, runp, 0);
 619           if (runp->next_prio != NULL)
 620             add_request_to_runlist (runp->next_prio);
 621
 622           /* Free the old element.  */
 623           __aio_free_request (runp);
 624         }
 625
 626       runp = runlist;
 627
 628       /* If the runlist is empty, then we sleep for a while, waiting for
 629          something to arrive in it. */
 630       if (runp == NULL && optim.aio_idle_time >= 0)
 631         {
 632           struct timeval now;
 633           struct timespec wakeup_time;
 634
 635           ++idle_thread_count;
 636           gettimeofday (&now, NULL);
 637           wakeup_time.tv_sec = now.tv_sec + optim.aio_idle_time;
 638           wakeup_time.tv_nsec = now.tv_usec * 1000;
 639           if (wakeup_time.tv_nsec > 1000000000)
 640             {
 641               wakeup_time.tv_nsec -= 1000000000;
 642               ++wakeup_time.tv_sec;
 643             }
 644           pthread_cond_timedwait (&__aio_new_request_notification,
 645                                   &__aio_requests_mutex,
 646                                   &wakeup_time);
 647           --idle_thread_count;
 648           runp = runlist;
 649         }
 650
 651       if (runp == NULL)
 652         --nthreads;
 653       else
 654         {
 655           assert (runp->running == yes);
 656           runp->running = allocated;
 657           runlist = runp->next_run;
 658
 659           /* If we have a request to process, and there's still another in
 660              the run list, then we need to either wake up or create a new
 661              thread to service the request that is still in the run list. */
 662           if (runlist != NULL)
 663             {
 664               /* There are at least two items in the work queue to work on.
 665                  If there are other idle threads, then we should wake them
 666                  up for these other work elements; otherwise, we should try
 667                  to create a new thread. */
 668               if (idle_thread_count > 0)
 669                 pthread_cond_signal (&__aio_new_request_notification);
 670               else if (nthreads < optim.aio_threads)
 671                 {
 672                   pthread_t thid;
 673                   pthread_attr_t attr;
 674
 675                   /* Make sure the thread is created detached.  */
 676                   pthread_attr_init (&attr);
 677                   pthread_attr_setdetachstate (&attr, PTHREAD_CREATE_DETACHED);
 678
 679                   /* Now try to start a thread. If we fail, no big deal,
 680                      because we know that there is at least one thread (us)
 681                      that is working on AIO operations. */
 682                   if (pthread_create (&thid, &attr, handle_fildes_io, NULL)
 683                       == 0)
 684                     ++nthreads;
 685                 }
 686             }
 687         }
 688
 689       /* Release the mutex.  */
 690       pthread_mutex_unlock (&__aio_requests_mutex);
 691     }
 692   while (runp != NULL);
 693
 694   return NULL;
 695 }
 696
 697
 698 /* Free allocated resources.  */
 699 libc_freeres_fn (free_res)
 700 {
 701   size_t row;
 702
 703   for (row = 0; row < pool_max_size; ++row)
 704     free (pool[row]);
 705
 706   free (pool);
 707 }
 708
 709
 710 /* Add newrequest to the runlist. The __abs_prio flag of newrequest must
 711    be correctly set to do this. Also, you had better set newrequest's
 712    "running" flag to "yes" before you release your lock or you'll throw an
 713    assertion. */
 714 static void
 715 add_request_to_runlist (struct requestlist *newrequest)
 716 {
 717   int prio = newrequest->aiocbp->aiocb.__abs_prio;
 718   struct requestlist *runp;
 719
 720   if (runlist == NULL || runlist->aiocbp->aiocb.__abs_prio < prio)
 721     {
 722       newrequest->next_run = runlist;
 723       runlist = newrequest;
 724     }
 725   else
 726     {
 727       runp = runlist;
 728
 729       while (runp->next_run != NULL
 730              && runp->next_run->aiocbp->aiocb.__abs_prio >= prio)
 731         runp = runp->next_run;
 732
 733       newrequest->next_run = runp->next_run;
 734       runp->next_run = newrequest;
 735     }
 736 }