Merge branch 'for-linus' of git://oss.sgi.com:8090/xfs/xfs-2.6
[linux-2.6/linux-2.6-openrd.git] / fs / gfs2 / glock.c
blob3f0974e1afef8bbd2b706a418f616f38e2817f71
1 /*
2 * Copyright (C) Sistina Software, Inc. 1997-2003 All rights reserved.
3 * Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
5 * This copyrighted material is made available to anyone wishing to use,
6 * modify, copy, or redistribute it subject to the terms and conditions
7 * of the GNU General Public License version 2.
8 */
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/delay.h>
16 #include <linux/sort.h>
17 #include <linux/jhash.h>
18 #include <linux/kallsyms.h>
19 #include <linux/gfs2_ondisk.h>
20 #include <linux/list.h>
21 #include <linux/lm_interface.h>
22 #include <linux/wait.h>
23 #include <linux/module.h>
24 #include <linux/rwsem.h>
25 #include <asm/uaccess.h>
26 #include <linux/seq_file.h>
27 #include <linux/debugfs.h>
28 #include <linux/module.h>
29 #include <linux/kallsyms.h>
31 #include "gfs2.h"
32 #include "incore.h"
33 #include "glock.h"
34 #include "glops.h"
35 #include "inode.h"
36 #include "lm.h"
37 #include "lops.h"
38 #include "meta_io.h"
39 #include "quota.h"
40 #include "super.h"
41 #include "util.h"
43 struct gfs2_gl_hash_bucket {
44 struct hlist_head hb_list;
/* Cursor used when walking the glock hash table for debug output. */
struct glock_iter {
	int			hash;		/* hash bucket index */
	struct gfs2_sbd		*sdp;		/* incore superblock */
	struct gfs2_glock	*gl;		/* current glock struct */
	struct hlist_head	*hb_list;	/* current hash bucket ptr */
	struct seq_file		*seq;		/* sequence file for debugfs */
	char			string[512];	/* scratch space */
};
/* Callback type: a function that is handed one glock and returns nothing. */
typedef void (*glock_examiner)(struct gfs2_glock *gl);
/* Forward declarations of file-local helpers. */
static int gfs2_dump_lockstate(struct gfs2_sbd *sdp);
static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl);
static void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh);
static void gfs2_glock_drop_th(struct gfs2_glock *gl);

/* File-scope state. */
static DECLARE_RWSEM(gfs2_umount_flush_sem);
static struct dentry *gfs2_root;
65 #define GFS2_GL_HASH_SHIFT 15
66 #define GFS2_GL_HASH_SIZE (1 << GFS2_GL_HASH_SHIFT)
67 #define GFS2_GL_HASH_MASK (GFS2_GL_HASH_SIZE - 1)
69 static struct gfs2_gl_hash_bucket gl_hash_table[GFS2_GL_HASH_SIZE];
70 static struct dentry *gfs2_root;
/*
 * Despite what you might think, the numbers below are not arbitrary :-)
 * They are taken from the ipv4 routing hash code, which is well tested
 * and thus should be nearly optimal. Later on we might tweak the numbers
 * but for now this should be fine.
 *
 * The reason for putting the locks in a separate array from the list heads
 * is that we can have fewer locks than list heads and save memory. We use
 * the same hash function for both, but with a different hash mask.
 */
82 #if defined(CONFIG_SMP) || defined(CONFIG_DEBUG_SPINLOCK) || \
83 defined(CONFIG_PROVE_LOCKING)
85 #ifdef CONFIG_LOCKDEP
86 # define GL_HASH_LOCK_SZ 256
87 #else
88 # if NR_CPUS >= 32
89 # define GL_HASH_LOCK_SZ 4096
90 # elif NR_CPUS >= 16
91 # define GL_HASH_LOCK_SZ 2048
92 # elif NR_CPUS >= 8
93 # define GL_HASH_LOCK_SZ 1024
94 # elif NR_CPUS >= 4
95 # define GL_HASH_LOCK_SZ 512
96 # else
97 # define GL_HASH_LOCK_SZ 256
98 # endif
99 #endif
101 /* We never want more locks than chains */
102 #if GFS2_GL_HASH_SIZE < GL_HASH_LOCK_SZ
103 # undef GL_HASH_LOCK_SZ
104 # define GL_HASH_LOCK_SZ GFS2_GL_HASH_SIZE
105 #endif
107 static rwlock_t gl_hash_locks[GL_HASH_LOCK_SZ];
109 static inline rwlock_t *gl_lock_addr(unsigned int x)
111 return &gl_hash_locks[x & (GL_HASH_LOCK_SZ-1)];
113 #else /* not SMP, so no spinlocks required */
114 static inline rwlock_t *gl_lock_addr(unsigned int x)
116 return NULL;
118 #endif
121 * relaxed_state_ok - is a requested lock compatible with the current lock mode?
122 * @actual: the current state of the lock
123 * @requested: the lock state that was requested by the caller
124 * @flags: the modifier flags passed in by the caller
126 * Returns: 1 if the locks are compatible, 0 otherwise
129 static inline int relaxed_state_ok(unsigned int actual, unsigned requested,
130 int flags)
132 if (actual == requested)
133 return 1;
135 if (flags & GL_EXACT)
136 return 0;
138 if (actual == LM_ST_EXCLUSIVE && requested == LM_ST_SHARED)
139 return 1;
141 if (actual != LM_ST_UNLOCKED && (flags & LM_FLAG_ANY))
142 return 1;
144 return 0;
148 * gl_hash() - Turn glock number into hash bucket number
149 * @lock: The glock number
151 * Returns: The number of the corresponding hash bucket
154 static unsigned int gl_hash(const struct gfs2_sbd *sdp,
155 const struct lm_lockname *name)
157 unsigned int h;
159 h = jhash(&name->ln_number, sizeof(u64), 0);
160 h = jhash(&name->ln_type, sizeof(unsigned int), h);
161 h = jhash(&sdp, sizeof(struct gfs2_sbd *), h);
162 h &= GFS2_GL_HASH_MASK;
164 return h;
168 * glock_free() - Perform a few checks and then release struct gfs2_glock
169 * @gl: The glock to release
171 * Also calls lock module to release its internal structure for this glock.
175 static void glock_free(struct gfs2_glock *gl)
177 struct gfs2_sbd *sdp = gl->gl_sbd;
178 struct inode *aspace = gl->gl_aspace;
180 gfs2_lm_put_lock(sdp, gl->gl_lock);
182 if (aspace)
183 gfs2_aspace_put(aspace);
185 kmem_cache_free(gfs2_glock_cachep, gl);
189 * gfs2_glock_hold() - increment reference count on glock
190 * @gl: The glock to hold
194 void gfs2_glock_hold(struct gfs2_glock *gl)
196 atomic_inc(&gl->gl_ref);
200 * gfs2_glock_put() - Decrement reference count on glock
201 * @gl: The glock to put
205 int gfs2_glock_put(struct gfs2_glock *gl)
207 int rv = 0;
208 struct gfs2_sbd *sdp = gl->gl_sbd;
210 write_lock(gl_lock_addr(gl->gl_hash));
211 if (atomic_dec_and_test(&gl->gl_ref)) {
212 hlist_del(&gl->gl_list);
213 write_unlock(gl_lock_addr(gl->gl_hash));
214 BUG_ON(spin_is_locked(&gl->gl_spin));
215 gfs2_assert(sdp, gl->gl_state == LM_ST_UNLOCKED);
216 gfs2_assert(sdp, list_empty(&gl->gl_reclaim));
217 gfs2_assert(sdp, list_empty(&gl->gl_holders));
218 gfs2_assert(sdp, list_empty(&gl->gl_waiters1));
219 gfs2_assert(sdp, list_empty(&gl->gl_waiters3));
220 glock_free(gl);
221 rv = 1;
222 goto out;
224 write_unlock(gl_lock_addr(gl->gl_hash));
225 out:
226 return rv;
230 * search_bucket() - Find struct gfs2_glock by lock number
231 * @bucket: the bucket to search
232 * @name: The lock name
234 * Returns: NULL, or the struct gfs2_glock with the requested number
237 static struct gfs2_glock *search_bucket(unsigned int hash,
238 const struct gfs2_sbd *sdp,
239 const struct lm_lockname *name)
241 struct gfs2_glock *gl;
242 struct hlist_node *h;
244 hlist_for_each_entry(gl, h, &gl_hash_table[hash].hb_list, gl_list) {
245 if (!lm_name_equal(&gl->gl_name, name))
246 continue;
247 if (gl->gl_sbd != sdp)
248 continue;
250 atomic_inc(&gl->gl_ref);
252 return gl;
255 return NULL;
/**
 * gfs2_glock_find() - Find glock by lock number
 * @sdp: The GFS2 superblock
 * @name: The lock name
 *
 * Looks the name up under the bucket read lock; a glock that is found is
 * returned with an extra reference (taken by search_bucket()).
 *
 * Returns: NULL, or the struct gfs2_glock with the requested number
 */

static struct gfs2_glock *gfs2_glock_find(const struct gfs2_sbd *sdp,
					  const struct lm_lockname *name)
{
	unsigned int bucket = gl_hash(sdp, name);
	struct gfs2_glock *found;

	read_lock(gl_lock_addr(bucket));
	found = search_bucket(bucket, sdp, name);
	read_unlock(gl_lock_addr(bucket));

	return found;
}
280 * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
281 * @sdp: The GFS2 superblock
282 * @number: the lock number
283 * @glops: The glock_operations to use
284 * @create: If 0, don't create the glock if it doesn't exist
285 * @glp: the glock is returned here
287 * This does not lock a glock, just finds/creates structures for one.
289 * Returns: errno
292 int gfs2_glock_get(struct gfs2_sbd *sdp, u64 number,
293 const struct gfs2_glock_operations *glops, int create,
294 struct gfs2_glock **glp)
296 struct lm_lockname name = { .ln_number = number, .ln_type = glops->go_type };
297 struct gfs2_glock *gl, *tmp;
298 unsigned int hash = gl_hash(sdp, &name);
299 int error;
301 read_lock(gl_lock_addr(hash));
302 gl = search_bucket(hash, sdp, &name);
303 read_unlock(gl_lock_addr(hash));
305 if (gl || !create) {
306 *glp = gl;
307 return 0;
310 gl = kmem_cache_alloc(gfs2_glock_cachep, GFP_KERNEL);
311 if (!gl)
312 return -ENOMEM;
314 gl->gl_flags = 0;
315 gl->gl_name = name;
316 atomic_set(&gl->gl_ref, 1);
317 gl->gl_state = LM_ST_UNLOCKED;
318 gl->gl_hash = hash;
319 gl->gl_owner_pid = 0;
320 gl->gl_ip = 0;
321 gl->gl_ops = glops;
322 gl->gl_req_gh = NULL;
323 gl->gl_req_bh = NULL;
324 gl->gl_vn = 0;
325 gl->gl_stamp = jiffies;
326 gl->gl_object = NULL;
327 gl->gl_sbd = sdp;
328 gl->gl_aspace = NULL;
329 lops_init_le(&gl->gl_le, &gfs2_glock_lops);
331 /* If this glock protects actual on-disk data or metadata blocks,
332 create a VFS inode to manage the pages/buffers holding them. */
333 if (glops == &gfs2_inode_glops || glops == &gfs2_rgrp_glops) {
334 gl->gl_aspace = gfs2_aspace_get(sdp);
335 if (!gl->gl_aspace) {
336 error = -ENOMEM;
337 goto fail;
341 error = gfs2_lm_get_lock(sdp, &name, &gl->gl_lock);
342 if (error)
343 goto fail_aspace;
345 write_lock(gl_lock_addr(hash));
346 tmp = search_bucket(hash, sdp, &name);
347 if (tmp) {
348 write_unlock(gl_lock_addr(hash));
349 glock_free(gl);
350 gl = tmp;
351 } else {
352 hlist_add_head(&gl->gl_list, &gl_hash_table[hash].hb_list);
353 write_unlock(gl_lock_addr(hash));
356 *glp = gl;
358 return 0;
360 fail_aspace:
361 if (gl->gl_aspace)
362 gfs2_aspace_put(gl->gl_aspace);
363 fail:
364 kmem_cache_free(gfs2_glock_cachep, gl);
365 return error;
369 * gfs2_holder_init - initialize a struct gfs2_holder in the default way
370 * @gl: the glock
371 * @state: the state we're requesting
372 * @flags: the modifier flags
373 * @gh: the holder structure
377 void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
378 struct gfs2_holder *gh)
380 INIT_LIST_HEAD(&gh->gh_list);
381 gh->gh_gl = gl;
382 gh->gh_ip = (unsigned long)__builtin_return_address(0);
383 gh->gh_owner_pid = current->pid;
384 gh->gh_state = state;
385 gh->gh_flags = flags;
386 gh->gh_error = 0;
387 gh->gh_iflags = 0;
388 gfs2_glock_hold(gl);
392 * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
393 * @state: the state we're requesting
394 * @flags: the modifier flags
395 * @gh: the holder structure
397 * Don't mess with the glock.
401 void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
403 gh->gh_state = state;
404 gh->gh_flags = flags;
405 gh->gh_iflags = 0;
406 gh->gh_ip = (unsigned long)__builtin_return_address(0);
410 * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
411 * @gh: the holder structure
415 void gfs2_holder_uninit(struct gfs2_holder *gh)
417 gfs2_glock_put(gh->gh_gl);
418 gh->gh_gl = NULL;
419 gh->gh_ip = 0;
422 static void gfs2_holder_wake(struct gfs2_holder *gh)
424 clear_bit(HIF_WAIT, &gh->gh_iflags);
425 smp_mb__after_clear_bit();
426 wake_up_bit(&gh->gh_iflags, HIF_WAIT);
/* wait_on_bit() action: give up the CPU once and report "keep waiting". */
static int just_schedule(void *word)
{
	schedule();

	return 0;
}
435 static void wait_on_holder(struct gfs2_holder *gh)
437 might_sleep();
438 wait_on_bit(&gh->gh_iflags, HIF_WAIT, just_schedule, TASK_UNINTERRUPTIBLE);
441 static void gfs2_demote_wake(struct gfs2_glock *gl)
443 clear_bit(GLF_DEMOTE, &gl->gl_flags);
444 smp_mb__after_clear_bit();
445 wake_up_bit(&gl->gl_flags, GLF_DEMOTE);
448 static void wait_on_demote(struct gfs2_glock *gl)
450 might_sleep();
451 wait_on_bit(&gl->gl_flags, GLF_DEMOTE, just_schedule, TASK_UNINTERRUPTIBLE);
455 * rq_mutex - process a mutex request in the queue
456 * @gh: the glock holder
458 * Returns: 1 if the queue is blocked
461 static int rq_mutex(struct gfs2_holder *gh)
463 struct gfs2_glock *gl = gh->gh_gl;
465 list_del_init(&gh->gh_list);
466 /* gh->gh_error never examined. */
467 set_bit(GLF_LOCK, &gl->gl_flags);
468 clear_bit(HIF_WAIT, &gh->gh_iflags);
469 smp_mb();
470 wake_up_bit(&gh->gh_iflags, HIF_WAIT);
472 return 1;
476 * rq_promote - process a promote request in the queue
477 * @gh: the glock holder
479 * Acquire a new inter-node lock, or change a lock state to more restrictive.
481 * Returns: 1 if the queue is blocked
484 static int rq_promote(struct gfs2_holder *gh)
486 struct gfs2_glock *gl = gh->gh_gl;
487 struct gfs2_sbd *sdp = gl->gl_sbd;
489 if (!relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
490 if (list_empty(&gl->gl_holders)) {
491 gl->gl_req_gh = gh;
492 set_bit(GLF_LOCK, &gl->gl_flags);
493 spin_unlock(&gl->gl_spin);
495 if (atomic_read(&sdp->sd_reclaim_count) >
496 gfs2_tune_get(sdp, gt_reclaim_limit) &&
497 !(gh->gh_flags & LM_FLAG_PRIORITY)) {
498 gfs2_reclaim_glock(sdp);
499 gfs2_reclaim_glock(sdp);
502 gfs2_glock_xmote_th(gh->gh_gl, gh);
503 spin_lock(&gl->gl_spin);
505 return 1;
508 if (list_empty(&gl->gl_holders)) {
509 set_bit(HIF_FIRST, &gh->gh_iflags);
510 set_bit(GLF_LOCK, &gl->gl_flags);
511 } else {
512 struct gfs2_holder *next_gh;
513 if (gh->gh_state == LM_ST_EXCLUSIVE)
514 return 1;
515 next_gh = list_entry(gl->gl_holders.next, struct gfs2_holder,
516 gh_list);
517 if (next_gh->gh_state == LM_ST_EXCLUSIVE)
518 return 1;
521 list_move_tail(&gh->gh_list, &gl->gl_holders);
522 gh->gh_error = 0;
523 set_bit(HIF_HOLDER, &gh->gh_iflags);
525 gfs2_holder_wake(gh);
527 return 0;
531 * rq_demote - process a demote request in the queue
532 * @gh: the glock holder
534 * Returns: 1 if the queue is blocked
537 static int rq_demote(struct gfs2_glock *gl)
539 if (!list_empty(&gl->gl_holders))
540 return 1;
542 if (gl->gl_state == gl->gl_demote_state ||
543 gl->gl_state == LM_ST_UNLOCKED) {
544 gfs2_demote_wake(gl);
545 return 0;
547 set_bit(GLF_LOCK, &gl->gl_flags);
548 spin_unlock(&gl->gl_spin);
549 if (gl->gl_demote_state == LM_ST_UNLOCKED ||
550 gl->gl_state != LM_ST_EXCLUSIVE)
551 gfs2_glock_drop_th(gl);
552 else
553 gfs2_glock_xmote_th(gl, NULL);
554 spin_lock(&gl->gl_spin);
556 return 0;
560 * run_queue - process holder structures on a glock
561 * @gl: the glock
564 static void run_queue(struct gfs2_glock *gl)
566 struct gfs2_holder *gh;
567 int blocked = 1;
569 for (;;) {
570 if (test_bit(GLF_LOCK, &gl->gl_flags))
571 break;
573 if (!list_empty(&gl->gl_waiters1)) {
574 gh = list_entry(gl->gl_waiters1.next,
575 struct gfs2_holder, gh_list);
577 if (test_bit(HIF_MUTEX, &gh->gh_iflags))
578 blocked = rq_mutex(gh);
579 else
580 gfs2_assert_warn(gl->gl_sbd, 0);
582 } else if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
583 blocked = rq_demote(gl);
584 } else if (!list_empty(&gl->gl_waiters3)) {
585 gh = list_entry(gl->gl_waiters3.next,
586 struct gfs2_holder, gh_list);
588 if (test_bit(HIF_PROMOTE, &gh->gh_iflags))
589 blocked = rq_promote(gh);
590 else
591 gfs2_assert_warn(gl->gl_sbd, 0);
593 } else
594 break;
596 if (blocked)
597 break;
602 * gfs2_glmutex_lock - acquire a local lock on a glock
603 * @gl: the glock
605 * Gives caller exclusive access to manipulate a glock structure.
608 static void gfs2_glmutex_lock(struct gfs2_glock *gl)
610 struct gfs2_holder gh;
612 gfs2_holder_init(gl, 0, 0, &gh);
613 set_bit(HIF_MUTEX, &gh.gh_iflags);
614 if (test_and_set_bit(HIF_WAIT, &gh.gh_iflags))
615 BUG();
617 spin_lock(&gl->gl_spin);
618 if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
619 list_add_tail(&gh.gh_list, &gl->gl_waiters1);
620 } else {
621 gl->gl_owner_pid = current->pid;
622 gl->gl_ip = (unsigned long)__builtin_return_address(0);
623 clear_bit(HIF_WAIT, &gh.gh_iflags);
624 smp_mb();
625 wake_up_bit(&gh.gh_iflags, HIF_WAIT);
627 spin_unlock(&gl->gl_spin);
629 wait_on_holder(&gh);
630 gfs2_holder_uninit(&gh);
634 * gfs2_glmutex_trylock - try to acquire a local lock on a glock
635 * @gl: the glock
637 * Returns: 1 if the glock is acquired
640 static int gfs2_glmutex_trylock(struct gfs2_glock *gl)
642 int acquired = 1;
644 spin_lock(&gl->gl_spin);
645 if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
646 acquired = 0;
647 } else {
648 gl->gl_owner_pid = current->pid;
649 gl->gl_ip = (unsigned long)__builtin_return_address(0);
651 spin_unlock(&gl->gl_spin);
653 return acquired;
657 * gfs2_glmutex_unlock - release a local lock on a glock
658 * @gl: the glock
662 static void gfs2_glmutex_unlock(struct gfs2_glock *gl)
664 spin_lock(&gl->gl_spin);
665 clear_bit(GLF_LOCK, &gl->gl_flags);
666 gl->gl_owner_pid = 0;
667 gl->gl_ip = 0;
668 run_queue(gl);
669 BUG_ON(!spin_is_locked(&gl->gl_spin));
670 spin_unlock(&gl->gl_spin);
674 * handle_callback - process a demote request
675 * @gl: the glock
676 * @state: the state the caller wants us to change to
678 * There are only two requests that we are going to see in actual
679 * practise: LM_ST_SHARED and LM_ST_UNLOCKED
682 static void handle_callback(struct gfs2_glock *gl, unsigned int state, int remote)
684 spin_lock(&gl->gl_spin);
685 if (test_and_set_bit(GLF_DEMOTE, &gl->gl_flags) == 0) {
686 gl->gl_demote_state = state;
687 gl->gl_demote_time = jiffies;
688 if (remote && gl->gl_ops->go_type == LM_TYPE_IOPEN &&
689 gl->gl_object) {
690 struct inode *inode = igrab(gl->gl_object);
691 spin_unlock(&gl->gl_spin);
692 if (inode) {
693 d_prune_aliases(inode);
694 iput(inode);
696 return;
698 } else if (gl->gl_demote_state != LM_ST_UNLOCKED) {
699 gl->gl_demote_state = state;
701 spin_unlock(&gl->gl_spin);
705 * state_change - record that the glock is now in a different state
706 * @gl: the glock
707 * @new_state the new state
711 static void state_change(struct gfs2_glock *gl, unsigned int new_state)
713 int held1, held2;
715 held1 = (gl->gl_state != LM_ST_UNLOCKED);
716 held2 = (new_state != LM_ST_UNLOCKED);
718 if (held1 != held2) {
719 if (held2)
720 gfs2_glock_hold(gl);
721 else
722 gfs2_glock_put(gl);
725 gl->gl_state = new_state;
729 * xmote_bh - Called after the lock module is done acquiring a lock
730 * @gl: The glock in question
731 * @ret: the int returned from the lock module
735 static void xmote_bh(struct gfs2_glock *gl, unsigned int ret)
737 struct gfs2_sbd *sdp = gl->gl_sbd;
738 const struct gfs2_glock_operations *glops = gl->gl_ops;
739 struct gfs2_holder *gh = gl->gl_req_gh;
740 int prev_state = gl->gl_state;
741 int op_done = 1;
743 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
744 gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
745 gfs2_assert_warn(sdp, !(ret & LM_OUT_ASYNC));
747 state_change(gl, ret & LM_OUT_ST_MASK);
749 if (prev_state != LM_ST_UNLOCKED && !(ret & LM_OUT_CACHEABLE)) {
750 if (glops->go_inval)
751 glops->go_inval(gl, DIO_METADATA);
752 } else if (gl->gl_state == LM_ST_DEFERRED) {
753 /* We might not want to do this here.
754 Look at moving to the inode glops. */
755 if (glops->go_inval)
756 glops->go_inval(gl, 0);
759 /* Deal with each possible exit condition */
761 if (!gh) {
762 gl->gl_stamp = jiffies;
763 if (ret & LM_OUT_CANCELED)
764 op_done = 0;
765 else
766 gfs2_demote_wake(gl);
767 } else {
768 spin_lock(&gl->gl_spin);
769 list_del_init(&gh->gh_list);
770 gh->gh_error = -EIO;
771 if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
772 goto out;
773 gh->gh_error = GLR_CANCELED;
774 if (ret & LM_OUT_CANCELED)
775 goto out;
776 if (relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
777 list_add_tail(&gh->gh_list, &gl->gl_holders);
778 gh->gh_error = 0;
779 set_bit(HIF_HOLDER, &gh->gh_iflags);
780 set_bit(HIF_FIRST, &gh->gh_iflags);
781 op_done = 0;
782 goto out;
784 gh->gh_error = GLR_TRYFAILED;
785 if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))
786 goto out;
787 gh->gh_error = -EINVAL;
788 if (gfs2_assert_withdraw(sdp, 0) == -1)
789 fs_err(sdp, "ret = 0x%.8X\n", ret);
790 out:
791 spin_unlock(&gl->gl_spin);
794 if (glops->go_xmote_bh)
795 glops->go_xmote_bh(gl);
797 if (op_done) {
798 spin_lock(&gl->gl_spin);
799 gl->gl_req_gh = NULL;
800 gl->gl_req_bh = NULL;
801 clear_bit(GLF_LOCK, &gl->gl_flags);
802 run_queue(gl);
803 spin_unlock(&gl->gl_spin);
806 gfs2_glock_put(gl);
808 if (gh)
809 gfs2_holder_wake(gh);
813 * gfs2_glock_xmote_th - Call into the lock module to acquire or change a glock
814 * @gl: The glock in question
815 * @state: the requested state
816 * @flags: modifier flags to the lock call
820 void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh)
822 struct gfs2_sbd *sdp = gl->gl_sbd;
823 int flags = gh ? gh->gh_flags : 0;
824 unsigned state = gh ? gh->gh_state : gl->gl_demote_state;
825 const struct gfs2_glock_operations *glops = gl->gl_ops;
826 int lck_flags = flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB |
827 LM_FLAG_NOEXP | LM_FLAG_ANY |
828 LM_FLAG_PRIORITY);
829 unsigned int lck_ret;
831 if (glops->go_xmote_th)
832 glops->go_xmote_th(gl);
834 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
835 gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
836 gfs2_assert_warn(sdp, state != LM_ST_UNLOCKED);
837 gfs2_assert_warn(sdp, state != gl->gl_state);
839 gfs2_glock_hold(gl);
840 gl->gl_req_bh = xmote_bh;
842 lck_ret = gfs2_lm_lock(sdp, gl->gl_lock, gl->gl_state, state, lck_flags);
844 if (gfs2_assert_withdraw(sdp, !(lck_ret & LM_OUT_ERROR)))
845 return;
847 if (lck_ret & LM_OUT_ASYNC)
848 gfs2_assert_warn(sdp, lck_ret == LM_OUT_ASYNC);
849 else
850 xmote_bh(gl, lck_ret);
854 * drop_bh - Called after a lock module unlock completes
855 * @gl: the glock
856 * @ret: the return status
858 * Doesn't wake up the process waiting on the struct gfs2_holder (if any)
859 * Doesn't drop the reference on the glock the top half took out
863 static void drop_bh(struct gfs2_glock *gl, unsigned int ret)
865 struct gfs2_sbd *sdp = gl->gl_sbd;
866 const struct gfs2_glock_operations *glops = gl->gl_ops;
867 struct gfs2_holder *gh = gl->gl_req_gh;
869 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
870 gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
871 gfs2_assert_warn(sdp, !ret);
873 state_change(gl, LM_ST_UNLOCKED);
874 gfs2_demote_wake(gl);
876 if (glops->go_inval)
877 glops->go_inval(gl, DIO_METADATA);
879 if (gh) {
880 spin_lock(&gl->gl_spin);
881 list_del_init(&gh->gh_list);
882 gh->gh_error = 0;
883 spin_unlock(&gl->gl_spin);
886 spin_lock(&gl->gl_spin);
887 gl->gl_req_gh = NULL;
888 gl->gl_req_bh = NULL;
889 clear_bit(GLF_LOCK, &gl->gl_flags);
890 run_queue(gl);
891 spin_unlock(&gl->gl_spin);
893 gfs2_glock_put(gl);
895 if (gh)
896 gfs2_holder_wake(gh);
900 * gfs2_glock_drop_th - call into the lock module to unlock a lock
901 * @gl: the glock
905 static void gfs2_glock_drop_th(struct gfs2_glock *gl)
907 struct gfs2_sbd *sdp = gl->gl_sbd;
908 const struct gfs2_glock_operations *glops = gl->gl_ops;
909 unsigned int ret;
911 if (glops->go_drop_th)
912 glops->go_drop_th(gl);
914 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
915 gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
916 gfs2_assert_warn(sdp, gl->gl_state != LM_ST_UNLOCKED);
918 gfs2_glock_hold(gl);
919 gl->gl_req_bh = drop_bh;
921 ret = gfs2_lm_unlock(sdp, gl->gl_lock, gl->gl_state);
923 if (gfs2_assert_withdraw(sdp, !(ret & LM_OUT_ERROR)))
924 return;
926 if (!ret)
927 drop_bh(gl, ret);
928 else
929 gfs2_assert_warn(sdp, ret == LM_OUT_ASYNC);
933 * do_cancels - cancel requests for locks stuck waiting on an expire flag
934 * @gh: the LM_FLAG_PRIORITY holder waiting to acquire the lock
936 * Don't cancel GL_NOCANCEL requests.
939 static void do_cancels(struct gfs2_holder *gh)
941 struct gfs2_glock *gl = gh->gh_gl;
943 spin_lock(&gl->gl_spin);
945 while (gl->gl_req_gh != gh &&
946 !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
947 !list_empty(&gh->gh_list)) {
948 if (gl->gl_req_bh && !(gl->gl_req_gh &&
949 (gl->gl_req_gh->gh_flags & GL_NOCANCEL))) {
950 spin_unlock(&gl->gl_spin);
951 gfs2_lm_cancel(gl->gl_sbd, gl->gl_lock);
952 msleep(100);
953 spin_lock(&gl->gl_spin);
954 } else {
955 spin_unlock(&gl->gl_spin);
956 msleep(100);
957 spin_lock(&gl->gl_spin);
961 spin_unlock(&gl->gl_spin);
965 * glock_wait_internal - wait on a glock acquisition
966 * @gh: the glock holder
968 * Returns: 0 on success
971 static int glock_wait_internal(struct gfs2_holder *gh)
973 struct gfs2_glock *gl = gh->gh_gl;
974 struct gfs2_sbd *sdp = gl->gl_sbd;
975 const struct gfs2_glock_operations *glops = gl->gl_ops;
977 if (test_bit(HIF_ABORTED, &gh->gh_iflags))
978 return -EIO;
980 if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
981 spin_lock(&gl->gl_spin);
982 if (gl->gl_req_gh != gh &&
983 !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
984 !list_empty(&gh->gh_list)) {
985 list_del_init(&gh->gh_list);
986 gh->gh_error = GLR_TRYFAILED;
987 run_queue(gl);
988 spin_unlock(&gl->gl_spin);
989 return gh->gh_error;
991 spin_unlock(&gl->gl_spin);
994 if (gh->gh_flags & LM_FLAG_PRIORITY)
995 do_cancels(gh);
997 wait_on_holder(gh);
998 if (gh->gh_error)
999 return gh->gh_error;
1001 gfs2_assert_withdraw(sdp, test_bit(HIF_HOLDER, &gh->gh_iflags));
1002 gfs2_assert_withdraw(sdp, relaxed_state_ok(gl->gl_state, gh->gh_state,
1003 gh->gh_flags));
1005 if (test_bit(HIF_FIRST, &gh->gh_iflags)) {
1006 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
1008 if (glops->go_lock) {
1009 gh->gh_error = glops->go_lock(gh);
1010 if (gh->gh_error) {
1011 spin_lock(&gl->gl_spin);
1012 list_del_init(&gh->gh_list);
1013 spin_unlock(&gl->gl_spin);
1017 spin_lock(&gl->gl_spin);
1018 gl->gl_req_gh = NULL;
1019 gl->gl_req_bh = NULL;
1020 clear_bit(GLF_LOCK, &gl->gl_flags);
1021 run_queue(gl);
1022 spin_unlock(&gl->gl_spin);
1025 return gh->gh_error;
1028 static inline struct gfs2_holder *
1029 find_holder_by_owner(struct list_head *head, pid_t pid)
1031 struct gfs2_holder *gh;
1033 list_for_each_entry(gh, head, gh_list) {
1034 if (gh->gh_owner_pid == pid)
1035 return gh;
1038 return NULL;
1041 static void print_dbg(struct glock_iter *gi, const char *fmt, ...)
1043 va_list args;
1045 va_start(args, fmt);
1046 if (gi) {
1047 vsprintf(gi->string, fmt, args);
1048 seq_printf(gi->seq, gi->string);
1050 else
1051 vprintk(fmt, args);
1052 va_end(args);
1056 * add_to_queue - Add a holder to the wait queue (but look for recursion)
1057 * @gh: the holder structure to add
1061 static void add_to_queue(struct gfs2_holder *gh)
1063 struct gfs2_glock *gl = gh->gh_gl;
1064 struct gfs2_holder *existing;
1066 BUG_ON(!gh->gh_owner_pid);
1067 if (test_and_set_bit(HIF_WAIT, &gh->gh_iflags))
1068 BUG();
1070 existing = find_holder_by_owner(&gl->gl_holders, gh->gh_owner_pid);
1071 if (existing) {
1072 print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1073 printk(KERN_INFO "pid : %d\n", existing->gh_owner_pid);
1074 printk(KERN_INFO "lock type : %d lock state : %d\n",
1075 existing->gh_gl->gl_name.ln_type, existing->gh_gl->gl_state);
1076 print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1077 printk(KERN_INFO "pid : %d\n", gh->gh_owner_pid);
1078 printk(KERN_INFO "lock type : %d lock state : %d\n",
1079 gl->gl_name.ln_type, gl->gl_state);
1080 BUG();
1083 existing = find_holder_by_owner(&gl->gl_waiters3, gh->gh_owner_pid);
1084 if (existing) {
1085 print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1086 print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1087 BUG();
1090 if (gh->gh_flags & LM_FLAG_PRIORITY)
1091 list_add(&gh->gh_list, &gl->gl_waiters3);
1092 else
1093 list_add_tail(&gh->gh_list, &gl->gl_waiters3);
1097 * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
1098 * @gh: the holder structure
1100 * if (gh->gh_flags & GL_ASYNC), this never returns an error
1102 * Returns: 0, GLR_TRYFAILED, or errno on failure
1105 int gfs2_glock_nq(struct gfs2_holder *gh)
1107 struct gfs2_glock *gl = gh->gh_gl;
1108 struct gfs2_sbd *sdp = gl->gl_sbd;
1109 int error = 0;
1111 restart:
1112 if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
1113 set_bit(HIF_ABORTED, &gh->gh_iflags);
1114 return -EIO;
1117 set_bit(HIF_PROMOTE, &gh->gh_iflags);
1119 spin_lock(&gl->gl_spin);
1120 add_to_queue(gh);
1121 run_queue(gl);
1122 spin_unlock(&gl->gl_spin);
1124 if (!(gh->gh_flags & GL_ASYNC)) {
1125 error = glock_wait_internal(gh);
1126 if (error == GLR_CANCELED) {
1127 msleep(100);
1128 goto restart;
1132 return error;
1136 * gfs2_glock_poll - poll to see if an async request has been completed
1137 * @gh: the holder
1139 * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
1142 int gfs2_glock_poll(struct gfs2_holder *gh)
1144 struct gfs2_glock *gl = gh->gh_gl;
1145 int ready = 0;
1147 spin_lock(&gl->gl_spin);
1149 if (test_bit(HIF_HOLDER, &gh->gh_iflags))
1150 ready = 1;
1151 else if (list_empty(&gh->gh_list)) {
1152 if (gh->gh_error == GLR_CANCELED) {
1153 spin_unlock(&gl->gl_spin);
1154 msleep(100);
1155 if (gfs2_glock_nq(gh))
1156 return 1;
1157 return 0;
1158 } else
1159 ready = 1;
1162 spin_unlock(&gl->gl_spin);
1164 return ready;
1168 * gfs2_glock_wait - wait for a lock acquisition that ended in a GLR_ASYNC
1169 * @gh: the holder structure
1171 * Returns: 0, GLR_TRYFAILED, or errno on failure
1174 int gfs2_glock_wait(struct gfs2_holder *gh)
1176 int error;
1178 error = glock_wait_internal(gh);
1179 if (error == GLR_CANCELED) {
1180 msleep(100);
1181 gh->gh_flags &= ~GL_ASYNC;
1182 error = gfs2_glock_nq(gh);
1185 return error;
1189 * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
1190 * @gh: the glock holder
1194 void gfs2_glock_dq(struct gfs2_holder *gh)
1196 struct gfs2_glock *gl = gh->gh_gl;
1197 const struct gfs2_glock_operations *glops = gl->gl_ops;
1199 if (gh->gh_flags & GL_NOCACHE)
1200 handle_callback(gl, LM_ST_UNLOCKED, 0);
1202 gfs2_glmutex_lock(gl);
1204 spin_lock(&gl->gl_spin);
1205 list_del_init(&gh->gh_list);
1207 if (list_empty(&gl->gl_holders)) {
1208 spin_unlock(&gl->gl_spin);
1210 if (glops->go_unlock)
1211 glops->go_unlock(gh);
1213 spin_lock(&gl->gl_spin);
1214 gl->gl_stamp = jiffies;
1217 clear_bit(GLF_LOCK, &gl->gl_flags);
1218 run_queue(gl);
1219 spin_unlock(&gl->gl_spin);
1222 void gfs2_glock_dq_wait(struct gfs2_holder *gh)
1224 struct gfs2_glock *gl = gh->gh_gl;
1225 gfs2_glock_dq(gh);
1226 wait_on_demote(gl);
/**
 * gfs2_glock_dq_uninit - dequeue a holder from a glock and uninitialize it
 * @gh: the holder structure
 *
 * Equivalent to gfs2_glock_dq() followed by gfs2_holder_uninit().
 */

void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
{
	gfs2_glock_dq(gh);
	gfs2_holder_uninit(gh);
}
1242 * gfs2_glock_nq_num - acquire a glock based on lock number
1243 * @sdp: the filesystem
1244 * @number: the lock number
1245 * @glops: the glock operations for the type of glock
1246 * @state: the state to acquire the glock in
1247 * @flags: modifier flags for the aquisition
1248 * @gh: the struct gfs2_holder
1250 * Returns: errno
1253 int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
1254 const struct gfs2_glock_operations *glops,
1255 unsigned int state, int flags, struct gfs2_holder *gh)
1257 struct gfs2_glock *gl;
1258 int error;
1260 error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
1261 if (!error) {
1262 error = gfs2_glock_nq_init(gl, state, flags, gh);
1263 gfs2_glock_put(gl);
1266 return error;
1270 * glock_compare - Compare two struct gfs2_glock structures for sorting
1271 * @arg_a: the first structure
1272 * @arg_b: the second structure
1276 static int glock_compare(const void *arg_a, const void *arg_b)
1278 const struct gfs2_holder *gh_a = *(const struct gfs2_holder **)arg_a;
1279 const struct gfs2_holder *gh_b = *(const struct gfs2_holder **)arg_b;
1280 const struct lm_lockname *a = &gh_a->gh_gl->gl_name;
1281 const struct lm_lockname *b = &gh_b->gh_gl->gl_name;
1283 if (a->ln_number > b->ln_number)
1284 return 1;
1285 if (a->ln_number < b->ln_number)
1286 return -1;
1287 BUG_ON(gh_a->gh_gl->gl_ops->go_type == gh_b->gh_gl->gl_ops->go_type);
1288 return 0;
1292 * nq_m_sync - synchonously acquire more than one glock in deadlock free order
1293 * @num_gh: the number of structures
1294 * @ghs: an array of struct gfs2_holder structures
1296 * Returns: 0 on success (all glocks acquired),
1297 * errno on failure (no glocks acquired)
1300 static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
1301 struct gfs2_holder **p)
1303 unsigned int x;
1304 int error = 0;
1306 for (x = 0; x < num_gh; x++)
1307 p[x] = &ghs[x];
1309 sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);
1311 for (x = 0; x < num_gh; x++) {
1312 p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1314 error = gfs2_glock_nq(p[x]);
1315 if (error) {
1316 while (x--)
1317 gfs2_glock_dq(p[x]);
1318 break;
1322 return error;
1326 * gfs2_glock_nq_m - acquire multiple glocks
1327 * @num_gh: the number of structures
1328 * @ghs: an array of struct gfs2_holder structures
1331 * Returns: 0 on success (all glocks acquired),
1332 * errno on failure (no glocks acquired)
1335 int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1337 struct gfs2_holder *tmp[4];
1338 struct gfs2_holder **pph = tmp;
1339 int error = 0;
1341 switch(num_gh) {
1342 case 0:
1343 return 0;
1344 case 1:
1345 ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1346 return gfs2_glock_nq(ghs);
1347 default:
1348 if (num_gh <= 4)
1349 break;
1350 pph = kmalloc(num_gh * sizeof(struct gfs2_holder *), GFP_NOFS);
1351 if (!pph)
1352 return -ENOMEM;
1355 error = nq_m_sync(num_gh, ghs, pph);
1357 if (pph != tmp)
1358 kfree(pph);
1360 return error;
1364 * gfs2_glock_dq_m - release multiple glocks
1365 * @num_gh: the number of structures
1366 * @ghs: an array of struct gfs2_holder structures
1370 void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1372 unsigned int x;
1374 for (x = 0; x < num_gh; x++)
1375 gfs2_glock_dq(&ghs[x]);
1379 * gfs2_glock_dq_uninit_m - release multiple glocks
1380 * @num_gh: the number of structures
1381 * @ghs: an array of struct gfs2_holder structures
1385 void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
1387 unsigned int x;
1389 for (x = 0; x < num_gh; x++)
1390 gfs2_glock_dq_uninit(&ghs[x]);
1394 * gfs2_lvb_hold - attach a LVB from a glock
1395 * @gl: The glock in question
1399 int gfs2_lvb_hold(struct gfs2_glock *gl)
1401 int error;
1403 gfs2_glmutex_lock(gl);
1405 if (!atomic_read(&gl->gl_lvb_count)) {
1406 error = gfs2_lm_hold_lvb(gl->gl_sbd, gl->gl_lock, &gl->gl_lvb);
1407 if (error) {
1408 gfs2_glmutex_unlock(gl);
1409 return error;
1411 gfs2_glock_hold(gl);
1413 atomic_inc(&gl->gl_lvb_count);
1415 gfs2_glmutex_unlock(gl);
1417 return 0;
1421 * gfs2_lvb_unhold - detach a LVB from a glock
1422 * @gl: The glock in question
1426 void gfs2_lvb_unhold(struct gfs2_glock *gl)
1428 gfs2_glock_hold(gl);
1429 gfs2_glmutex_lock(gl);
1431 gfs2_assert(gl->gl_sbd, atomic_read(&gl->gl_lvb_count) > 0);
1432 if (atomic_dec_and_test(&gl->gl_lvb_count)) {
1433 gfs2_lm_unhold_lvb(gl->gl_sbd, gl->gl_lock, gl->gl_lvb);
1434 gl->gl_lvb = NULL;
1435 gfs2_glock_put(gl);
1438 gfs2_glmutex_unlock(gl);
1439 gfs2_glock_put(gl);
1442 static void blocking_cb(struct gfs2_sbd *sdp, struct lm_lockname *name,
1443 unsigned int state)
1445 struct gfs2_glock *gl;
1447 gl = gfs2_glock_find(sdp, name);
1448 if (!gl)
1449 return;
1451 handle_callback(gl, state, 1);
1453 spin_lock(&gl->gl_spin);
1454 run_queue(gl);
1455 spin_unlock(&gl->gl_spin);
1457 gfs2_glock_put(gl);
1461 * gfs2_glock_cb - Callback used by locking module
1462 * @sdp: Pointer to the superblock
1463 * @type: Type of callback
1464 * @data: Type dependent data pointer
1466 * Called by the locking module when it wants to tell us something.
1467 * Either we need to drop a lock, one of our ASYNC requests completed, or
1468 * a journal from another client needs to be recovered.
1471 void gfs2_glock_cb(void *cb_data, unsigned int type, void *data)
1473 struct gfs2_sbd *sdp = cb_data;
1475 switch (type) {
1476 case LM_CB_NEED_E:
1477 blocking_cb(sdp, data, LM_ST_UNLOCKED);
1478 return;
1480 case LM_CB_NEED_D:
1481 blocking_cb(sdp, data, LM_ST_DEFERRED);
1482 return;
1484 case LM_CB_NEED_S:
1485 blocking_cb(sdp, data, LM_ST_SHARED);
1486 return;
1488 case LM_CB_ASYNC: {
1489 struct lm_async_cb *async = data;
1490 struct gfs2_glock *gl;
1492 down_read(&gfs2_umount_flush_sem);
1493 gl = gfs2_glock_find(sdp, &async->lc_name);
1494 if (gfs2_assert_warn(sdp, gl))
1495 return;
1496 if (!gfs2_assert_warn(sdp, gl->gl_req_bh))
1497 gl->gl_req_bh(gl, async->lc_ret);
1498 gfs2_glock_put(gl);
1499 up_read(&gfs2_umount_flush_sem);
1500 return;
1503 case LM_CB_NEED_RECOVERY:
1504 gfs2_jdesc_make_dirty(sdp, *(unsigned int *)data);
1505 if (sdp->sd_recoverd_process)
1506 wake_up_process(sdp->sd_recoverd_process);
1507 return;
1509 case LM_CB_DROPLOCKS:
1510 gfs2_gl_hash_clear(sdp, NO_WAIT);
1511 gfs2_quota_scan(sdp);
1512 return;
1514 default:
1515 gfs2_assert_warn(sdp, 0);
1516 return;
1521 * demote_ok - Check to see if it's ok to unlock a glock
1522 * @gl: the glock
1524 * Returns: 1 if it's ok
1527 static int demote_ok(struct gfs2_glock *gl)
1529 const struct gfs2_glock_operations *glops = gl->gl_ops;
1530 int demote = 1;
1532 if (test_bit(GLF_STICKY, &gl->gl_flags))
1533 demote = 0;
1534 else if (glops->go_demote_ok)
1535 demote = glops->go_demote_ok(gl);
1537 return demote;
1541 * gfs2_glock_schedule_for_reclaim - Add a glock to the reclaim list
1542 * @gl: the glock
1546 void gfs2_glock_schedule_for_reclaim(struct gfs2_glock *gl)
1548 struct gfs2_sbd *sdp = gl->gl_sbd;
1550 spin_lock(&sdp->sd_reclaim_lock);
1551 if (list_empty(&gl->gl_reclaim)) {
1552 gfs2_glock_hold(gl);
1553 list_add(&gl->gl_reclaim, &sdp->sd_reclaim_list);
1554 atomic_inc(&sdp->sd_reclaim_count);
1556 spin_unlock(&sdp->sd_reclaim_lock);
1558 wake_up(&sdp->sd_reclaim_wq);
1562 * gfs2_reclaim_glock - process the next glock on the filesystem's reclaim list
1563 * @sdp: the filesystem
1565 * Called from gfs2_glockd() glock reclaim daemon, or when promoting a
1566 * different glock and we notice that there are a lot of glocks in the
1567 * reclaim list.
1571 void gfs2_reclaim_glock(struct gfs2_sbd *sdp)
1573 struct gfs2_glock *gl;
1575 spin_lock(&sdp->sd_reclaim_lock);
1576 if (list_empty(&sdp->sd_reclaim_list)) {
1577 spin_unlock(&sdp->sd_reclaim_lock);
1578 return;
1580 gl = list_entry(sdp->sd_reclaim_list.next,
1581 struct gfs2_glock, gl_reclaim);
1582 list_del_init(&gl->gl_reclaim);
1583 spin_unlock(&sdp->sd_reclaim_lock);
1585 atomic_dec(&sdp->sd_reclaim_count);
1586 atomic_inc(&sdp->sd_reclaimed);
1588 if (gfs2_glmutex_trylock(gl)) {
1589 if (list_empty(&gl->gl_holders) &&
1590 gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1591 handle_callback(gl, LM_ST_UNLOCKED, 0);
1592 gfs2_glmutex_unlock(gl);
1595 gfs2_glock_put(gl);
1599 * examine_bucket - Call a function for glock in a hash bucket
1600 * @examiner: the function
1601 * @sdp: the filesystem
1602 * @bucket: the bucket
1604 * Returns: 1 if the bucket has entries
1607 static int examine_bucket(glock_examiner examiner, struct gfs2_sbd *sdp,
1608 unsigned int hash)
1610 struct gfs2_glock *gl, *prev = NULL;
1611 int has_entries = 0;
1612 struct hlist_head *head = &gl_hash_table[hash].hb_list;
1614 read_lock(gl_lock_addr(hash));
1615 /* Can't use hlist_for_each_entry - don't want prefetch here */
1616 if (hlist_empty(head))
1617 goto out;
1618 gl = list_entry(head->first, struct gfs2_glock, gl_list);
1619 while(1) {
1620 if (gl->gl_sbd == sdp) {
1621 gfs2_glock_hold(gl);
1622 read_unlock(gl_lock_addr(hash));
1623 if (prev)
1624 gfs2_glock_put(prev);
1625 prev = gl;
1626 examiner(gl);
1627 has_entries = 1;
1628 read_lock(gl_lock_addr(hash));
1630 if (gl->gl_list.next == NULL)
1631 break;
1632 gl = list_entry(gl->gl_list.next, struct gfs2_glock, gl_list);
1634 out:
1635 read_unlock(gl_lock_addr(hash));
1636 if (prev)
1637 gfs2_glock_put(prev);
1638 return has_entries;
1642 * scan_glock - look at a glock and see if we can reclaim it
1643 * @gl: the glock to look at
1647 static void scan_glock(struct gfs2_glock *gl)
1649 if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object)
1650 return;
1652 if (gfs2_glmutex_trylock(gl)) {
1653 if (list_empty(&gl->gl_holders) &&
1654 gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1655 goto out_schedule;
1656 gfs2_glmutex_unlock(gl);
1658 return;
1660 out_schedule:
1661 gfs2_glmutex_unlock(gl);
1662 gfs2_glock_schedule_for_reclaim(gl);
1666 * gfs2_scand_internal - Look for glocks and inodes to toss from memory
1667 * @sdp: the filesystem
1671 void gfs2_scand_internal(struct gfs2_sbd *sdp)
1673 unsigned int x;
1675 for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
1676 examine_bucket(scan_glock, sdp, x);
1680 * clear_glock - look at a glock and see if we can free it from glock cache
1681 * @gl: the glock to look at
1685 static void clear_glock(struct gfs2_glock *gl)
1687 struct gfs2_sbd *sdp = gl->gl_sbd;
1688 int released;
1690 spin_lock(&sdp->sd_reclaim_lock);
1691 if (!list_empty(&gl->gl_reclaim)) {
1692 list_del_init(&gl->gl_reclaim);
1693 atomic_dec(&sdp->sd_reclaim_count);
1694 spin_unlock(&sdp->sd_reclaim_lock);
1695 released = gfs2_glock_put(gl);
1696 gfs2_assert(sdp, !released);
1697 } else {
1698 spin_unlock(&sdp->sd_reclaim_lock);
1701 if (gfs2_glmutex_trylock(gl)) {
1702 if (list_empty(&gl->gl_holders) &&
1703 gl->gl_state != LM_ST_UNLOCKED)
1704 handle_callback(gl, LM_ST_UNLOCKED, 0);
1705 gfs2_glmutex_unlock(gl);
1710 * gfs2_gl_hash_clear - Empty out the glock hash table
1711 * @sdp: the filesystem
1712 * @wait: wait until it's all gone
1714 * Called when unmounting the filesystem, or when inter-node lock manager
1715 * requests DROPLOCKS because it is running out of capacity.
1718 void gfs2_gl_hash_clear(struct gfs2_sbd *sdp, int wait)
1720 unsigned long t;
1721 unsigned int x;
1722 int cont;
1724 t = jiffies;
1726 for (;;) {
1727 cont = 0;
1728 for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1729 if (examine_bucket(clear_glock, sdp, x))
1730 cont = 1;
1733 if (!wait || !cont)
1734 break;
1736 if (time_after_eq(jiffies,
1737 t + gfs2_tune_get(sdp, gt_stall_secs) * HZ)) {
1738 fs_warn(sdp, "Unmount seems to be stalled. "
1739 "Dumping lock state...\n");
1740 gfs2_dump_lockstate(sdp);
1741 t = jiffies;
1744 down_write(&gfs2_umount_flush_sem);
1745 invalidate_inodes(sdp->sd_vfs);
1746 up_write(&gfs2_umount_flush_sem);
1747 msleep(10);
1752 * Diagnostic routines to help debug distributed deadlock
1755 static void gfs2_print_symbol(struct glock_iter *gi, const char *fmt,
1756 unsigned long address)
1758 char buffer[KSYM_SYMBOL_LEN];
1760 sprint_symbol(buffer, address);
1761 print_dbg(gi, fmt, buffer);
1765 * dump_holder - print information about a glock holder
1766 * @str: a string naming the type of holder
1767 * @gh: the glock holder
1769 * Returns: 0 on success, -ENOBUFS when we run out of space
1772 static int dump_holder(struct glock_iter *gi, char *str,
1773 struct gfs2_holder *gh)
1775 unsigned int x;
1776 struct task_struct *gh_owner;
1778 print_dbg(gi, " %s\n", str);
1779 if (gh->gh_owner_pid) {
1780 print_dbg(gi, " owner = %ld ", (long)gh->gh_owner_pid);
1781 gh_owner = find_task_by_pid(gh->gh_owner_pid);
1782 if (gh_owner)
1783 print_dbg(gi, "(%s)\n", gh_owner->comm);
1784 else
1785 print_dbg(gi, "(ended)\n");
1786 } else
1787 print_dbg(gi, " owner = -1\n");
1788 print_dbg(gi, " gh_state = %u\n", gh->gh_state);
1789 print_dbg(gi, " gh_flags =");
1790 for (x = 0; x < 32; x++)
1791 if (gh->gh_flags & (1 << x))
1792 print_dbg(gi, " %u", x);
1793 print_dbg(gi, " \n");
1794 print_dbg(gi, " error = %d\n", gh->gh_error);
1795 print_dbg(gi, " gh_iflags =");
1796 for (x = 0; x < 32; x++)
1797 if (test_bit(x, &gh->gh_iflags))
1798 print_dbg(gi, " %u", x);
1799 print_dbg(gi, " \n");
1800 gfs2_print_symbol(gi, " initialized at: %s\n", gh->gh_ip);
1802 return 0;
1806 * dump_inode - print information about an inode
1807 * @ip: the inode
1809 * Returns: 0 on success, -ENOBUFS when we run out of space
1812 static int dump_inode(struct glock_iter *gi, struct gfs2_inode *ip)
1814 unsigned int x;
1816 print_dbg(gi, " Inode:\n");
1817 print_dbg(gi, " num = %llu/%llu\n",
1818 (unsigned long long)ip->i_no_formal_ino,
1819 (unsigned long long)ip->i_no_addr);
1820 print_dbg(gi, " type = %u\n", IF2DT(ip->i_inode.i_mode));
1821 print_dbg(gi, " i_flags =");
1822 for (x = 0; x < 32; x++)
1823 if (test_bit(x, &ip->i_flags))
1824 print_dbg(gi, " %u", x);
1825 print_dbg(gi, " \n");
1826 return 0;
1830 * dump_glock - print information about a glock
1831 * @gl: the glock
1832 * @count: where we are in the buffer
1834 * Returns: 0 on success, -ENOBUFS when we run out of space
1837 static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl)
1839 struct gfs2_holder *gh;
1840 unsigned int x;
1841 int error = -ENOBUFS;
1842 struct task_struct *gl_owner;
1844 spin_lock(&gl->gl_spin);
1846 print_dbg(gi, "Glock 0x%p (%u, %llu)\n", gl, gl->gl_name.ln_type,
1847 (unsigned long long)gl->gl_name.ln_number);
1848 print_dbg(gi, " gl_flags =");
1849 for (x = 0; x < 32; x++) {
1850 if (test_bit(x, &gl->gl_flags))
1851 print_dbg(gi, " %u", x);
1853 if (!test_bit(GLF_LOCK, &gl->gl_flags))
1854 print_dbg(gi, " (unlocked)");
1855 print_dbg(gi, " \n");
1856 print_dbg(gi, " gl_ref = %d\n", atomic_read(&gl->gl_ref));
1857 print_dbg(gi, " gl_state = %u\n", gl->gl_state);
1858 if (gl->gl_owner_pid) {
1859 gl_owner = find_task_by_pid(gl->gl_owner_pid);
1860 if (gl_owner)
1861 print_dbg(gi, " gl_owner = pid %d (%s)\n",
1862 gl->gl_owner_pid, gl_owner->comm);
1863 else
1864 print_dbg(gi, " gl_owner = %d (ended)\n",
1865 gl->gl_owner_pid);
1866 } else
1867 print_dbg(gi, " gl_owner = -1\n");
1868 print_dbg(gi, " gl_ip = %lu\n", gl->gl_ip);
1869 print_dbg(gi, " req_gh = %s\n", (gl->gl_req_gh) ? "yes" : "no");
1870 print_dbg(gi, " req_bh = %s\n", (gl->gl_req_bh) ? "yes" : "no");
1871 print_dbg(gi, " lvb_count = %d\n", atomic_read(&gl->gl_lvb_count));
1872 print_dbg(gi, " object = %s\n", (gl->gl_object) ? "yes" : "no");
1873 print_dbg(gi, " le = %s\n",
1874 (list_empty(&gl->gl_le.le_list)) ? "no" : "yes");
1875 print_dbg(gi, " reclaim = %s\n",
1876 (list_empty(&gl->gl_reclaim)) ? "no" : "yes");
1877 if (gl->gl_aspace)
1878 print_dbg(gi, " aspace = 0x%p nrpages = %lu\n", gl->gl_aspace,
1879 gl->gl_aspace->i_mapping->nrpages);
1880 else
1881 print_dbg(gi, " aspace = no\n");
1882 print_dbg(gi, " ail = %d\n", atomic_read(&gl->gl_ail_count));
1883 if (gl->gl_req_gh) {
1884 error = dump_holder(gi, "Request", gl->gl_req_gh);
1885 if (error)
1886 goto out;
1888 list_for_each_entry(gh, &gl->gl_holders, gh_list) {
1889 error = dump_holder(gi, "Holder", gh);
1890 if (error)
1891 goto out;
1893 list_for_each_entry(gh, &gl->gl_waiters1, gh_list) {
1894 error = dump_holder(gi, "Waiter1", gh);
1895 if (error)
1896 goto out;
1898 list_for_each_entry(gh, &gl->gl_waiters3, gh_list) {
1899 error = dump_holder(gi, "Waiter3", gh);
1900 if (error)
1901 goto out;
1903 if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
1904 print_dbg(gi, " Demotion req to state %u (%llu uS ago)\n",
1905 gl->gl_demote_state, (unsigned long long)
1906 (jiffies - gl->gl_demote_time)*(1000000/HZ));
1908 if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object) {
1909 if (!test_bit(GLF_LOCK, &gl->gl_flags) &&
1910 list_empty(&gl->gl_holders)) {
1911 error = dump_inode(gi, gl->gl_object);
1912 if (error)
1913 goto out;
1914 } else {
1915 error = -ENOBUFS;
1916 print_dbg(gi, " Inode: busy\n");
1920 error = 0;
1922 out:
1923 spin_unlock(&gl->gl_spin);
1924 return error;
1928 * gfs2_dump_lockstate - print out the current lockstate
1929 * @sdp: the filesystem
1930 * @ub: the buffer to copy the information into
1932 * If @ub is NULL, dump the lockstate to the console.
1936 static int gfs2_dump_lockstate(struct gfs2_sbd *sdp)
1938 struct gfs2_glock *gl;
1939 struct hlist_node *h;
1940 unsigned int x;
1941 int error = 0;
1943 for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1945 read_lock(gl_lock_addr(x));
1947 hlist_for_each_entry(gl, h, &gl_hash_table[x].hb_list, gl_list) {
1948 if (gl->gl_sbd != sdp)
1949 continue;
1951 error = dump_glock(NULL, gl);
1952 if (error)
1953 break;
1956 read_unlock(gl_lock_addr(x));
1958 if (error)
1959 break;
1963 return error;
1966 int __init gfs2_glock_init(void)
1968 unsigned i;
1969 for(i = 0; i < GFS2_GL_HASH_SIZE; i++) {
1970 INIT_HLIST_HEAD(&gl_hash_table[i].hb_list);
1972 #ifdef GL_HASH_LOCK_SZ
1973 for(i = 0; i < GL_HASH_LOCK_SZ; i++) {
1974 rwlock_init(&gl_hash_locks[i]);
1976 #endif
1977 return 0;
1980 static int gfs2_glock_iter_next(struct glock_iter *gi)
1982 read_lock(gl_lock_addr(gi->hash));
1983 while (1) {
1984 if (!gi->hb_list) { /* If we don't have a hash bucket yet */
1985 gi->hb_list = &gl_hash_table[gi->hash].hb_list;
1986 if (hlist_empty(gi->hb_list)) {
1987 read_unlock(gl_lock_addr(gi->hash));
1988 gi->hash++;
1989 read_lock(gl_lock_addr(gi->hash));
1990 gi->hb_list = NULL;
1991 if (gi->hash >= GFS2_GL_HASH_SIZE) {
1992 read_unlock(gl_lock_addr(gi->hash));
1993 return 1;
1995 else
1996 continue;
1998 if (!hlist_empty(gi->hb_list)) {
1999 gi->gl = list_entry(gi->hb_list->first,
2000 struct gfs2_glock,
2001 gl_list);
2003 } else {
2004 if (gi->gl->gl_list.next == NULL) {
2005 read_unlock(gl_lock_addr(gi->hash));
2006 gi->hash++;
2007 read_lock(gl_lock_addr(gi->hash));
2008 gi->hb_list = NULL;
2009 continue;
2011 gi->gl = list_entry(gi->gl->gl_list.next,
2012 struct gfs2_glock, gl_list);
2014 if (gi->gl)
2015 break;
2017 read_unlock(gl_lock_addr(gi->hash));
2018 return 0;
/*
 * gfs2_glock_iter_free - release an iterator allocated by
 * gfs2_glock_iter_init()
 */
static void gfs2_glock_iter_free(struct glock_iter *gi)
{
	kfree(gi);
}
2026 static struct glock_iter *gfs2_glock_iter_init(struct gfs2_sbd *sdp)
2028 struct glock_iter *gi;
2030 gi = kmalloc(sizeof (*gi), GFP_KERNEL);
2031 if (!gi)
2032 return NULL;
2034 gi->sdp = sdp;
2035 gi->hash = 0;
2036 gi->gl = NULL;
2037 gi->hb_list = NULL;
2038 gi->seq = NULL;
2039 memset(gi->string, 0, sizeof(gi->string));
2041 if (gfs2_glock_iter_next(gi)) {
2042 gfs2_glock_iter_free(gi);
2043 return NULL;
2046 return gi;
2049 static void *gfs2_glock_seq_start(struct seq_file *file, loff_t *pos)
2051 struct glock_iter *gi;
2052 loff_t n = *pos;
2054 gi = gfs2_glock_iter_init(file->private);
2055 if (!gi)
2056 return NULL;
2058 while (n--) {
2059 if (gfs2_glock_iter_next(gi)) {
2060 gfs2_glock_iter_free(gi);
2061 return NULL;
2065 return gi;
2068 static void *gfs2_glock_seq_next(struct seq_file *file, void *iter_ptr,
2069 loff_t *pos)
2071 struct glock_iter *gi = iter_ptr;
2073 (*pos)++;
2075 if (gfs2_glock_iter_next(gi)) {
2076 gfs2_glock_iter_free(gi);
2077 return NULL;
2080 return gi;
/*
 * gfs2_glock_seq_stop - seq_file ->stop: release the iterator
 *
 * seq_file calls ->stop with whatever ->start/->next last returned.
 * When the walk ran to the end that is NULL (->next has already freed
 * the iterator), but when a read stops early - for example because the
 * output buffer is full - it is a live iterator that nobody else will
 * free, and the next read allocates a new one in ->start. Free it here
 * so it does not leak.
 */
static void gfs2_glock_seq_stop(struct seq_file *file, void *iter_ptr)
{
	struct glock_iter *gi = iter_ptr;

	if (gi)
		gfs2_glock_iter_free(gi);
}
2088 static int gfs2_glock_seq_show(struct seq_file *file, void *iter_ptr)
2090 struct glock_iter *gi = iter_ptr;
2092 gi->seq = file;
2093 dump_glock(gi, gi->gl);
2095 return 0;
2098 static struct seq_operations gfs2_glock_seq_ops = {
2099 .start = gfs2_glock_seq_start,
2100 .next = gfs2_glock_seq_next,
2101 .stop = gfs2_glock_seq_stop,
2102 .show = gfs2_glock_seq_show,
2105 static int gfs2_debugfs_open(struct inode *inode, struct file *file)
2107 struct seq_file *seq;
2108 int ret;
2110 ret = seq_open(file, &gfs2_glock_seq_ops);
2111 if (ret)
2112 return ret;
2114 seq = file->private_data;
2115 seq->private = inode->i_private;
2117 return 0;
2120 static const struct file_operations gfs2_debug_fops = {
2121 .owner = THIS_MODULE,
2122 .open = gfs2_debugfs_open,
2123 .read = seq_read,
2124 .llseek = seq_lseek,
2125 .release = seq_release
2128 int gfs2_create_debugfs_file(struct gfs2_sbd *sdp)
2130 sdp->debugfs_dir = debugfs_create_dir(sdp->sd_table_name, gfs2_root);
2131 if (!sdp->debugfs_dir)
2132 return -ENOMEM;
2133 sdp->debugfs_dentry_glocks = debugfs_create_file("glocks",
2134 S_IFREG | S_IRUGO,
2135 sdp->debugfs_dir, sdp,
2136 &gfs2_debug_fops);
2137 if (!sdp->debugfs_dentry_glocks)
2138 return -ENOMEM;
2140 return 0;
2143 void gfs2_delete_debugfs_file(struct gfs2_sbd *sdp)
2145 if (sdp && sdp->debugfs_dir) {
2146 if (sdp->debugfs_dentry_glocks) {
2147 debugfs_remove(sdp->debugfs_dentry_glocks);
2148 sdp->debugfs_dentry_glocks = NULL;
2150 debugfs_remove(sdp->debugfs_dir);
2151 sdp->debugfs_dir = NULL;
2155 int gfs2_register_debugfs(void)
2157 gfs2_root = debugfs_create_dir("gfs2", NULL);
2158 return gfs2_root ? 0 : -ENOMEM;
2161 void gfs2_unregister_debugfs(void)
2163 debugfs_remove(gfs2_root);
2164 gfs2_root = NULL;