fs/lockd/svclock.c

   1 /*
   2  * linux/fs/lockd/svclock.c
   3  *
   4  * Handling of server-side locks, mostly of the blocked variety.
   5  * This is the ugliest part of lockd because we tread on very thin ice.
   6  * GRANT and CANCEL calls may get stuck, meet in mid-flight, etc.
   7  * IMNSHO introducing the grant callback into the NLM protocol was one
   8  * of the worst ideas Sun ever had. Except maybe for the idea of doing
   9  * NFS file locking at all.
  10  *
  11  * I'm trying hard to avoid race conditions by protecting most accesses
  12  * to a file's list of blocked locks through a semaphore. The global
  13  * list of blocked locks is not protected in this fashion however.
  14  * Therefore, some functions (such as the RPC callback for the async grant
  15  * call) move blocked locks towards the head of the list *while some other
  16  * process might be traversing it*. This should not be a problem in
  17  * practice, because this will only cause functions traversing the list
  18  * to visit some blocks twice.
  19  *
  20  * Copyright (C) 1996, Olaf Kirch <okir@monad.swb.de>
  21  */
  22
  23 #include <linux/types.h>
  24 #include <linux/errno.h>
  25 #include <linux/kernel.h>
  26 #include <linux/sunrpc/clnt.h>
  27 #include <linux/sunrpc/svc.h>
  28 #include <linux/lockd/nlm.h>
  29 #include <linux/lockd/lockd.h>
  30
  31
  32 #define NLMDBG_FACILITY         NLMDBG_SVCLOCK
  33
  34 static void     nlmsvc_insert_block(struct nlm_block *block, unsigned long);
  35 static int      nlmsvc_remove_block(struct nlm_block *block);
  36 static void     nlmsvc_grant_callback(struct rpc_task *task);
  37 static void     nlmsvc_notify_blocked(struct file_lock *);
  38
  39 /*
  40  * The list of blocked locks to retry
  41  */
  42 static struct nlm_block *       nlm_blocked = NULL;
  43
  44 /*
  45  * Insert a blocked lock into the global list
  46  */
  47 static void
  48 nlmsvc_insert_block(struct nlm_block *block, unsigned long when)
  49 {
  50         struct nlm_block **bp, *b;
  51
  52         dprintk("lockd: nlmsvc_insert_block(%p, %ld)\n", block, when);
  53         if (block->b_queued)
  54                 nlmsvc_remove_block(block);
  55         for (bp = &nlm_blocked; (b = *bp); bp = &b->b_next)
  56                 if (when < b->b_when)
  57                         break;
  58
  59         block->b_queued = 1;
  60         block->b_when = when;
  61         block->b_next = b;
  62         *bp = block;
  63 }
  64
  65 /*
  66  * Remove a block from the global list
  67  */
  68 static int
  69 nlmsvc_remove_block(struct nlm_block *block)
  70 {
  71         struct nlm_block **bp, *b;
  72
  73         if (!block->b_queued)
  74                 return 1;
  75         for (bp = &nlm_blocked; (b = *bp); bp = &b->b_next) {
  76                 if (b == block) {
  77                         *bp = block->b_next;
  78                         block->b_queued = 0;
  79                         return 1;
  80                 }
  81         }
  82
  83         return 0;
  84 }
  85
  86 /*
  87  * Find a block for a given lock and optionally remove it from
  88  * the list.
  89  */
  90 static struct nlm_block *
  91 nlmsvc_lookup_block(struct nlm_file *file, struct nlm_lock *lock, int remove)
  92 {
  93         struct nlm_block        **head, *block;
  94         struct file_lock        *fl;
  95
  96         dprintk("lockd: nlmsvc_lookup_block f=%p pd=%d %ld-%ld ty=%d\n",
  97                                 file, lock->fl.fl_pid, lock->fl.fl_start,
  98                                 lock->fl.fl_end, lock->fl.fl_type);
  99         for (head = &nlm_blocked; (block = *head); head = &block->b_next) {
 100                 fl = &block->b_call.a_args.lock.fl;
 101                 dprintk("       check f=%p pd=%d %ld-%ld ty=%d\n",
 102                                 block->b_file, fl->fl_pid, fl->fl_start,
 103                                 fl->fl_end, fl->fl_type);
 104                 if (block->b_file == file && nlm_compare_locks(fl, &lock->fl)) {
 105                         if (remove)
 106                                 *head = block->b_next;
 107                         return block;
 108                 }
 109         }
 110
 111         return NULL;
 112 }
 113
 114 /*
 115  * Find a block with a given NLM cookie.
 116  */
 117 static inline struct nlm_block *
 118 nlmsvc_find_block(u32 cookie)
 119 {
 120         struct nlm_block *block;
 121
 122         for (block = nlm_blocked; block; block = block->b_next) {
 123                 if (block->b_call.a_args.cookie == cookie)
 124                         break;
 125         }
 126
 127         return block;
 128 }
 129
 130 /*
 131  * Create a block and initialize it.
 132  *
 133  * Note: we explicitly set the cookie of the grant reply to that of
 134  * the blocked lock request. The spec explicitly mentions that the client
 135  * should _not_ rely on the callback containing the same cookie as the
 136  * request, but (as I found out later) that's because some implementations
 137  * do just this. Never mind the standards comittees, they support our
 138  * logging industries.
 139  */
 140 static inline struct nlm_block *
 141 nlmsvc_create_block(struct svc_rqst *rqstp, struct nlm_file *file,
 142                                 struct nlm_lock *lock, u32 cookie)
 143 {
 144         struct nlm_block        *block;
 145         struct nlm_host         *host;
 146         struct nlm_rqst         *call;
 147
 148         /* Create host handle for callback */
 149         host = nlmclnt_lookup_host(&rqstp->rq_addr,
 150                                 rqstp->rq_prot, rqstp->rq_vers);
 151         if (host == NULL)
 152                 return NULL;
 153
 154         /* Allocate memory for block, and initialize arguments */
 155         if (!(block = (struct nlm_block *) kmalloc(sizeof(*block), GFP_KERNEL)))
 156                 goto failed;
 157         memset(block, 0, sizeof(*block));
 158
 159         /* Set notifier function for VFS, and init args */
 160         lock->fl.fl_notify = nlmsvc_notify_blocked;
 161         if (!nlmclnt_setgrantargs(&block->b_call, lock))
 162                 goto failed_free;
 163         block->b_call.a_args.cookie = cookie;   /* see above */
 164
 165         dprintk("lockd: created block %p...\n", block);
 166
 167         /* Create and initialize the block */
 168         block->b_daemon = rqstp->rq_server;
 169         block->b_host   = host;
 170         block->b_file   = file;
 171
 172         /* Add to file's list of blocks */
 173         block->b_fnext  = file->f_blocks;
 174         file->f_blocks  = block;
 175
 176         /* Set up RPC arguments for callback */
 177         call = &block->b_call;
 178         call->a_host    = host;
 179         call->a_flags   = RPC_TASK_ASYNC;
 180
 181         return block;
 182
 183 failed_free:
 184         kfree(block);
 185 failed:
 186         nlm_release_host(host);
 187         return NULL;
 188 }
 189
 190 /*
 191  * Delete a block. If the lock was cancelled or the grant callback
 192  * failed, unlock is set to 1.
 193  * It is the caller's responsibility to check whether the file
 194  * can be closed hereafter.
 195  */
 196 static void
 197 nlmsvc_delete_block(struct nlm_block *block, int unlock)
 198 {
 199         struct file_lock        *fl = &block->b_call.a_args.lock.fl;
 200         struct nlm_file         *file = block->b_file;
 201         struct nlm_block        **bp;
 202
 203         dprintk("lockd: deleting block %p...\n", block);
 204
 205         /* Remove block from list */
 206         nlmsvc_remove_block(block);
 207
 208         /* If granted, unlock it, else remove from inode block list */
 209         if (unlock && block->b_granted) {
 210                 dprintk("lockd: deleting granted lock\n");
 211                 fl->fl_type = F_UNLCK;
 212                 posix_lock_file(&block->b_file->f_file, fl, 0);
 213                 block->b_granted = 0;
 214         } else {
 215                 dprintk("lockd: unblocking blocked lock\n");
 216                 posix_unblock_lock(fl);
 217         }
 218
 219         /* If the block is in the middle of a GRANT callback,
 220          * don't kill it yet. */
 221         if (block->b_incall) {
 222                 nlmsvc_insert_block(block, NLM_NEVER);
 223                 block->b_done = 1;
 224                 return;
 225         }
 226
 227         /* Remove block from file's list of blocks */
 228         for (bp = &file->f_blocks; *bp; bp = &(*bp)->b_fnext) {
 229                 if (*bp == block) {
 230                         *bp = block->b_fnext;
 231                         break;
 232                 }
 233         }
 234
 235         if (block->b_host)
 236                 nlm_release_host(block->b_host);
 237         nlmclnt_freegrantargs(&block->b_call);
 238         kfree(block);
 239 }
 240
 241 /*
 242  * Loop over all blocks and perform the action specified.
 243  * (NLM_ACT_CHECK handled by nlmsvc_inspect_file).
 244  */
 245 int
 246 nlmsvc_traverse_blocks(struct nlm_host *host, struct nlm_file *file, int action)
 247 {
 248         struct nlm_block        *block, *next;
 249
 250         down(&file->f_sema);
 251         for (block = file->f_blocks; block; block = next) {
 252                 next = block->b_fnext;
 253                 if (action == NLM_ACT_MARK)
 254                         block->b_host->h_inuse = 1;
 255                 else if (action == NLM_ACT_UNLOCK) {
 256                         if (host == NULL || host == block->b_host)
 257                                 nlmsvc_delete_block(block, 1);
 258                 }
 259         }
 260         up(&file->f_sema);
 261         return 0;
 262 }
 263
 264 /*
 265  * Attempt to establish a lock, and if it can't be granted, block it
 266  * if required.
 267  */
 268 u32
 269 nlmsvc_lock(struct svc_rqst *rqstp, struct nlm_file *file,
 270                         struct nlm_lock *lock, int wait, u32 cookie)
 271 {
 272         struct file_lock        *conflock;
 273         struct nlm_block        *block;
 274         int                     error;
 275
 276         dprintk("lockd: nlmsvc_lock(%04x/%ld, ty=%d, pi=%d, %ld-%ld, bl=%d)\n",
 277                                 file->f_file.f_dentry->d_inode->i_dev,
 278                                 file->f_file.f_dentry->d_inode->i_ino,
 279                                 lock->fl.fl_type, lock->fl.fl_pid,
 280                                 lock->fl.fl_start,
 281                                 lock->fl.fl_end,
 282                                 wait);
 283
 284         /* Lock file against concurrent access */
 285         down(&file->f_sema);
 286
 287         /* Get existing block (in case client is busy-waiting) */
 288         block = nlmsvc_lookup_block(file, lock, 0);
 289
 290         lock->fl.fl_flags |= FL_LOCKD;
 291
 292 again:
 293         if (!(conflock = posix_test_lock(&file->f_file, &lock->fl))) {
 294                 error = posix_lock_file(&file->f_file, &lock->fl, 0);
 295
 296                 if (block)
 297                         nlmsvc_delete_block(block, 0);
 298                 up(&file->f_sema);
 299
 300                 dprintk("lockd: posix_lock_file returned %d\n", -error);
 301                 switch(-error) {
 302                 case 0:
 303                         return nlm_granted;
 304                 case EDEADLK:                   /* no applicable NLM status */
 305                 case EAGAIN:
 306                         return nlm_lck_denied;
 307                 default:                        /* includes ENOLCK */
 308                         return nlm_lck_denied_nolocks;
 309                 }
 310         }
 311
 312         if (!wait) {
 313                 up(&file->f_sema);
 314                 return nlm_lck_denied;
 315         }
 316
 317         /* If we don't have a block, create and initialize it. Then
 318          * retry because we may have slept in kmalloc. */
 319         if (block == NULL) {
 320                 dprintk("lockd: blocking on this lock (allocating).\n");
 321                 if (!(block = nlmsvc_create_block(rqstp, file, lock, cookie)))
 322                         return nlm_lck_denied_nolocks;
 323                 goto again;
 324         }
 325
 326         /* Append to list of blocked */
 327         nlmsvc_insert_block(block, NLM_NEVER);
 328
 329         /* Now add block to block list of the conflicting lock */
 330         dprintk("lockd: blocking on this lock.\n");
 331         posix_block_lock(conflock, &block->b_call.a_args.lock.fl);
 332
 333         up(&file->f_sema);
 334         return nlm_lck_blocked;
 335 }
 336
 337 /*
 338  * Test for presence of a conflicting lock.
 339  */
 340 u32
 341 nlmsvc_testlock(struct nlm_file *file, struct nlm_lock *lock,
 342                                        struct nlm_lock *conflock)
 343 {
 344         struct file_lock        *fl;
 345
 346         dprintk("lockd: nlmsvc_testlock(%04x/%ld, ty=%d, %ld-%ld)\n",
 347                                 file->f_file.f_dentry->d_inode->i_dev,
 348                                 file->f_file.f_dentry->d_inode->i_ino,
 349                                 lock->fl.fl_type,
 350                                 lock->fl.fl_start,
 351                                 lock->fl.fl_end);
 352
 353         if ((fl = posix_test_lock(&file->f_file, &lock->fl)) != NULL) {
 354                 dprintk("lockd: conflicting lock(ty=%d, %ld-%ld)\n",
 355                                 fl->fl_type, fl->fl_start, fl->fl_end);
 356                 conflock->caller = "somehost";  /* FIXME */
 357                 conflock->oh.len = 0;           /* don't return OH info */
 358                 conflock->fl = *fl;
 359                 return nlm_lck_denied;
 360         }
 361
 362         return nlm_granted;
 363 }
 364
 365 /*
 366  * Remove a lock.
 367  * This implies a CANCEL call: We send a GRANT_MSG, the client replies
 368  * with a GRANT_RES call which gets lost, and calls UNLOCK immediately
 369  * afterwards. In this case the block will still be there, and hence
 370  * must be removed.
 371  */
 372 u32
 373 nlmsvc_unlock(struct nlm_file *file, struct nlm_lock *lock)
 374 {
 375         int     error;
 376
 377         dprintk("lockd: nlmsvc_unlock(%04x/%ld, pi=%d, %ld-%ld)\n",
 378                                 file->f_file.f_dentry->d_inode->i_dev,
 379                                 file->f_file.f_dentry->d_inode->i_ino,
 380                                 lock->fl.fl_pid,
 381                                 lock->fl.fl_start,
 382                                 lock->fl.fl_end);
 383
 384         /* First, cancel any lock that might be there */
 385         nlmsvc_cancel_blocked(file, lock);
 386
 387         lock->fl.fl_type = F_UNLCK;
 388         error = posix_lock_file(&file->f_file, &lock->fl, 0);
 389
 390         return (error < 0)? nlm_lck_denied_nolocks : nlm_granted;
 391 }
 392
 393 /*
 394  * Cancel a previously blocked request.
 395  *
 396  * A cancel request always overrides any grant that may currently
 397  * be in progress.
 398  * The calling procedure must check whether the file can be closed.
 399  */
 400 u32
 401 nlmsvc_cancel_blocked(struct nlm_file *file, struct nlm_lock *lock)
 402 {
 403         struct nlm_block        *block;
 404
 405         dprintk("lockd: nlmsvc_cancel(%04x/%ld, pi=%d, %ld-%ld)\n",
 406                                 file->f_file.f_dentry->d_inode->i_dev,
 407                                 file->f_file.f_dentry->d_inode->i_ino,
 408                                 lock->fl.fl_pid,
 409                                 lock->fl.fl_start,
 410                                 lock->fl.fl_end);
 411
 412         down(&file->f_sema);
 413         if ((block = nlmsvc_lookup_block(file, lock, 1)) != NULL)
 414                 nlmsvc_delete_block(block, 1);
 415         up(&file->f_sema);
 416         return nlm_granted;
 417 }
 418
 419 /*
 420  * Unblock a blocked lock request. This is a callback invoked from the
 421  * VFS layer when a lock on which we blocked is removed.
 422  *
 423  * This function doesn't grant the blocked lock instantly, but rather moves
 424  * the block to the head of nlm_blocked where it can be picked up by lockd.
 425  */
 426 static void
 427 nlmsvc_notify_blocked(struct file_lock *fl)
 428 {
 429         struct nlm_block        **bp, *block;
 430
 431         dprintk("lockd: VFS unblock notification for block %p\n", fl);
 432         posix_unblock_lock(fl);
 433         for (bp = &nlm_blocked; (block = *bp); bp = &block->b_next) {
 434                 if (&block->b_call.a_args.lock.fl == fl) {
 435                         svc_wake_up(block->b_daemon);
 436                         nlmsvc_insert_block(block, 0);
 437                         return;
 438                 }
 439         }
 440
 441         printk(KERN_WARNING "lockd: notification for unknown block!\n");
 442 }
 443
 444 /*
 445  * Try to claim a lock that was previously blocked.
 446  *
 447  * Note that we use both the RPC_GRANTED_MSG call _and_ an async
 448  * RPC thread when notifying the client. This seems like overkill...
 449  * Here's why:
 450  *  -   we don't want to use a synchronous RPC thread, otherwise
 451  *      we might find ourselves hanging on a dead portmapper.
 452  *  -   Some lockd implementations (e.g. HP) don't react to
 453  *      RPC_GRANTED calls; they seem to insist on RPC_GRANTED_MSG calls.
 454  */
 455 static void
 456 nlmsvc_grant_blocked(struct nlm_block *block)
 457 {
 458         struct nlm_file         *file = block->b_file;
 459         struct nlm_lock         *lock = &block->b_call.a_args.lock;
 460         struct file_lock        *conflock;
 461         int                     error;
 462
 463         dprintk("lockd: grant blocked lock %p\n", block);
 464
 465         /* First thing is lock the file */
 466         down(&file->f_sema);
 467
 468         /* Unlink block request from list */
 469         nlmsvc_remove_block(block);
 470
 471         /* If b_granted is true this means we've been here before.
 472          * Just retry the grant callback, possibly refreshing the RPC
 473          * binding */
 474         if (block->b_granted) {
 475                 nlm_rebind_host(block->b_host);
 476                 goto callback;
 477         }
 478
 479         /* Try the lock operation again */
 480         if ((conflock = posix_test_lock(&file->f_file, &lock->fl)) != NULL) {
 481                 /* Bummer, we blocked again */
 482                 dprintk("lockd: lock still blocked\n");
 483                 nlmsvc_insert_block(block, NLM_NEVER);
 484                 posix_block_lock(conflock, &lock->fl);
 485                 up(&file->f_sema);
 486                 return;
 487         }
 488
 489         /* Alright, no conflicting lock. Now lock it for real. If the
 490          * following yields an error, this is most probably due to low
 491          * memory. Retry the lock in a few seconds.
 492          */
 493         if ((error = posix_lock_file(&file->f_file, &lock->fl, 0)) < 0) {
 494                 printk(KERN_WARNING "lockd: unexpected error %d in %s!\n",
 495                                 -error, __FUNCTION__);
 496                 nlmsvc_insert_block(block, jiffies + 10 * HZ);
 497                 up(&file->f_sema);
 498                 return;
 499         }
 500
 501 callback:
 502         /* Lock was granted by VFS. */
 503         dprintk("lockd: GRANTing blocked lock.\n");
 504         block->b_granted = 1;
 505         block->b_incall  = 1;
 506
 507         /* Schedule next grant callback in 30 seconds */
 508         nlmsvc_insert_block(block, jiffies + 30 * HZ);
 509
 510         /* Call the client */
 511         nlmclnt_async_call(&block->b_call, NLMPROC_GRANTED_MSG,
 512                                                 nlmsvc_grant_callback);
 513         up(&file->f_sema);
 514 }
 515
 516 /*
 517  * This is the callback from the RPC layer when the NLM_GRANTED_MSG
 518  * RPC call has succeeded or timed out.
 519  * Like all RPC callbacks, it is invoked by the rpciod process, so it
 520  * better not sleep. Therefore, we put the blocked lock on the nlm_blocked
 521  * chain once more in order to have it removed by lockd itself (which can
 522  * then sleep on the file semaphore without disrupting e.g. the nfs client).
 523  */
 524 static void
 525 nlmsvc_grant_callback(struct rpc_task *task)
 526 {
 527         struct nlm_rqst         *call = (struct nlm_rqst *) task->tk_calldata;
 528         struct nlm_block        *block;
 529         unsigned long           timeout;
 530
 531         dprintk("lockd: GRANT_MSG RPC callback\n");
 532         if (!(block = nlmsvc_find_block(call->a_args.cookie))) {
 533                 dprintk("lockd: no block for cookie %x\n", call->a_args.cookie);
 534                 return;
 535         }
 536
 537         /* Technically, we should down the file semaphore here. Since we
 538          * move the block towards the head of the queue only, no harm
 539          * can be done, though. */
 540         if (task->tk_status < 0) {
 541                 /* RPC error: Re-insert for retransmission */
 542                 timeout = jiffies + 10 * HZ;
 543         } else if (block->b_done) {
 544                 /* Block already removed, kill it for real */
 545                 timeout = 0;
 546         } else {
 547                 /* Call was successful, now wait for client callback */
 548                 timeout = jiffies + 60 * HZ;
 549         }
 550         nlmsvc_insert_block(block, timeout);
 551         svc_wake_up(block->b_daemon);
 552         block->b_incall = 0;
 553
 554         nlm_release_host(call->a_host);
 555         rpc_release_task(task);
 556 }
 557
 558 /*
 559  * We received a GRANT_RES callback. Try to find the corresponding
 560  * block.
 561  */
 562 void
 563 nlmsvc_grant_reply(u32 cookie, u32 status)
 564 {
 565         struct nlm_block        *block;
 566         struct nlm_file         *file;
 567
 568         if (!(block = nlmsvc_find_block(cookie)))
 569                 return;
 570         file = block->b_file;
 571
 572         file->f_count++;
 573         down(&file->f_sema);
 574         if ((block = nlmsvc_find_block(cookie)) != NULL) {
 575                 if (status == NLM_LCK_DENIED_GRACE_PERIOD) {
 576                         /* Try again in a couple of seconds */
 577                         nlmsvc_insert_block(block, jiffies + 10 * HZ);
 578                         block = NULL;
 579                 } else {
 580                         /* Lock is now held by client, or has been rejected.
 581                          * In both cases, the block should be removed. */
 582                         file->f_count++;
 583                         up(&file->f_sema);
 584                         if (status == NLM_LCK_GRANTED)
 585                                 nlmsvc_delete_block(block, 0);
 586                         else
 587                                 nlmsvc_delete_block(block, 1);
 588                 }
 589         }
 590         if (!block)
 591                 up(&file->f_sema);
 592         nlm_release_file(file);
 593 }
 594
 595 /*
 596  * Retry all blocked locks that have been notified. This is where lockd
 597  * picks up locks that can be granted, or grant notifications that must
 598  * be retransmitted.
 599  */
 600 unsigned long
 601 nlmsvc_retry_blocked(void)
 602 {
 603         struct nlm_block        *block;
 604
 605         dprintk("nlmsvc_retry_blocked(%p, when=%ld)\n",
 606                         nlm_blocked,
 607                         nlm_blocked? nlm_blocked->b_when : 0);
 608         while ((block = nlm_blocked) && block->b_when < jiffies) {
 609                 dprintk("nlmsvc_retry_blocked(%p, when=%ld, done=%d)\n",
 610                         block, block->b_when, block->b_done);
 611                 if (block->b_done)
 612                         nlmsvc_delete_block(block, 0);
 613                 else
 614                         nlmsvc_grant_blocked(block);
 615         }
 616
 617         if ((block = nlm_blocked) && block->b_when != NLM_NEVER)
 618                 return block->b_when;
 619         return 0;
 620 }