[GFS2] Fix deallocation issues
[linux-2.6] / fs / gfs2 / glock.c
1 /*
2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
3  * Copyright (C) 2004-2006 Red Hat, Inc.  All rights reserved.
4  *
5  * This copyrighted material is made available to anyone wishing to use,
6  * modify, copy, or redistribute it subject to the terms and conditions
7  * of the GNU General Public License version 2.
8  */
9
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/delay.h>
16 #include <linux/sort.h>
17 #include <linux/jhash.h>
18 #include <linux/kallsyms.h>
19 #include <linux/gfs2_ondisk.h>
20 #include <linux/list.h>
21 #include <linux/lm_interface.h>
22 #include <linux/wait.h>
23 #include <linux/module.h>
24 #include <linux/rwsem.h>
25 #include <asm/uaccess.h>
26 #include <linux/seq_file.h>
27 #include <linux/debugfs.h>
28 #include <linux/module.h>
29 #include <linux/kallsyms.h>
30
31 #include "gfs2.h"
32 #include "incore.h"
33 #include "glock.h"
34 #include "glops.h"
35 #include "inode.h"
36 #include "lm.h"
37 #include "lops.h"
38 #include "meta_io.h"
39 #include "quota.h"
40 #include "super.h"
41 #include "util.h"
42
43 struct gfs2_gl_hash_bucket {
44         struct hlist_head hb_list;
45 };
46
/**
 * struct glock_iter - iteration state over the glock hash table
 * @hash: hash bucket index
 * @sdp: incore superblock
 * @gl: current glock struct
 * @hb_list: current hash bucket pointer
 * @seq: sequence file for debugfs
 * @string: scratch space
 */
struct glock_iter {
        int hash;
        struct gfs2_sbd *sdp;
        struct gfs2_glock *gl;
        struct hlist_head *hb_list;
        struct seq_file *seq;
        char string[512];
};
55
56 typedef void (*glock_examiner) (struct gfs2_glock * gl);
57
58 static int gfs2_dump_lockstate(struct gfs2_sbd *sdp);
59 static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl);
60 static void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh);
61 static void gfs2_glock_drop_th(struct gfs2_glock *gl);
62 static DECLARE_RWSEM(gfs2_umount_flush_sem);
63 static struct dentry *gfs2_root;
64
65 #define GFS2_GL_HASH_SHIFT      15
66 #define GFS2_GL_HASH_SIZE       (1 << GFS2_GL_HASH_SHIFT)
67 #define GFS2_GL_HASH_MASK       (GFS2_GL_HASH_SIZE - 1)
68
69 static struct gfs2_gl_hash_bucket gl_hash_table[GFS2_GL_HASH_SIZE];
70 static struct dentry *gfs2_root;
71
72 /*
73  * Despite what you might think, the numbers below are not arbitrary :-)
74  * They are taken from the ipv4 routing hash code, which is well tested
75  * and thus should be nearly optimal. Later on we might tweek the numbers
76  * but for now this should be fine.
77  *
78  * The reason for putting the locks in a separate array from the list heads
79  * is that we can have fewer locks than list heads and save memory. We use
80  * the same hash function for both, but with a different hash mask.
81  */
82 #if defined(CONFIG_SMP) || defined(CONFIG_DEBUG_SPINLOCK) || \
83         defined(CONFIG_PROVE_LOCKING)
84
85 #ifdef CONFIG_LOCKDEP
86 # define GL_HASH_LOCK_SZ        256
87 #else
88 # if NR_CPUS >= 32
89 #  define GL_HASH_LOCK_SZ       4096
90 # elif NR_CPUS >= 16
91 #  define GL_HASH_LOCK_SZ       2048
92 # elif NR_CPUS >= 8
93 #  define GL_HASH_LOCK_SZ       1024
94 # elif NR_CPUS >= 4
95 #  define GL_HASH_LOCK_SZ       512
96 # else
97 #  define GL_HASH_LOCK_SZ       256
98 # endif
99 #endif
100
101 /* We never want more locks than chains */
102 #if GFS2_GL_HASH_SIZE < GL_HASH_LOCK_SZ
103 # undef GL_HASH_LOCK_SZ
104 # define GL_HASH_LOCK_SZ GFS2_GL_HASH_SIZE
105 #endif
106
107 static rwlock_t gl_hash_locks[GL_HASH_LOCK_SZ];
108
109 static inline rwlock_t *gl_lock_addr(unsigned int x)
110 {
111         return &gl_hash_locks[x & (GL_HASH_LOCK_SZ-1)];
112 }
113 #else /* not SMP, so no spinlocks required */
114 static inline rwlock_t *gl_lock_addr(unsigned int x)
115 {
116         return NULL;
117 }
118 #endif
119
120 /**
121  * relaxed_state_ok - is a requested lock compatible with the current lock mode?
122  * @actual: the current state of the lock
123  * @requested: the lock state that was requested by the caller
124  * @flags: the modifier flags passed in by the caller
125  *
126  * Returns: 1 if the locks are compatible, 0 otherwise
127  */
128
129 static inline int relaxed_state_ok(unsigned int actual, unsigned requested,
130                                    int flags)
131 {
132         if (actual == requested)
133                 return 1;
134
135         if (flags & GL_EXACT)
136                 return 0;
137
138         if (actual == LM_ST_EXCLUSIVE && requested == LM_ST_SHARED)
139                 return 1;
140
141         if (actual != LM_ST_UNLOCKED && (flags & LM_FLAG_ANY))
142                 return 1;
143
144         return 0;
145 }
146
147 /**
148  * gl_hash() - Turn glock number into hash bucket number
149  * @lock: The glock number
150  *
151  * Returns: The number of the corresponding hash bucket
152  */
153
154 static unsigned int gl_hash(const struct gfs2_sbd *sdp,
155                             const struct lm_lockname *name)
156 {
157         unsigned int h;
158
159         h = jhash(&name->ln_number, sizeof(u64), 0);
160         h = jhash(&name->ln_type, sizeof(unsigned int), h);
161         h = jhash(&sdp, sizeof(struct gfs2_sbd *), h);
162         h &= GFS2_GL_HASH_MASK;
163
164         return h;
165 }
166
167 /**
168  * glock_free() - Perform a few checks and then release struct gfs2_glock
169  * @gl: The glock to release
170  *
171  * Also calls lock module to release its internal structure for this glock.
172  *
173  */
174
175 static void glock_free(struct gfs2_glock *gl)
176 {
177         struct gfs2_sbd *sdp = gl->gl_sbd;
178         struct inode *aspace = gl->gl_aspace;
179
180         gfs2_lm_put_lock(sdp, gl->gl_lock);
181
182         if (aspace)
183                 gfs2_aspace_put(aspace);
184
185         kmem_cache_free(gfs2_glock_cachep, gl);
186 }
187
188 /**
189  * gfs2_glock_hold() - increment reference count on glock
190  * @gl: The glock to hold
191  *
192  */
193
194 void gfs2_glock_hold(struct gfs2_glock *gl)
195 {
196         atomic_inc(&gl->gl_ref);
197 }
198
199 /**
200  * gfs2_glock_put() - Decrement reference count on glock
201  * @gl: The glock to put
202  *
203  */
204
205 int gfs2_glock_put(struct gfs2_glock *gl)
206 {
207         int rv = 0;
208         struct gfs2_sbd *sdp = gl->gl_sbd;
209
210         write_lock(gl_lock_addr(gl->gl_hash));
211         if (atomic_dec_and_test(&gl->gl_ref)) {
212                 hlist_del(&gl->gl_list);
213                 write_unlock(gl_lock_addr(gl->gl_hash));
214                 BUG_ON(spin_is_locked(&gl->gl_spin));
215                 gfs2_assert(sdp, gl->gl_state == LM_ST_UNLOCKED);
216                 gfs2_assert(sdp, list_empty(&gl->gl_reclaim));
217                 gfs2_assert(sdp, list_empty(&gl->gl_holders));
218                 gfs2_assert(sdp, list_empty(&gl->gl_waiters1));
219                 gfs2_assert(sdp, list_empty(&gl->gl_waiters3));
220                 glock_free(gl);
221                 rv = 1;
222                 goto out;
223         }
224         write_unlock(gl_lock_addr(gl->gl_hash));
225 out:
226         return rv;
227 }
228
229 /**
230  * search_bucket() - Find struct gfs2_glock by lock number
231  * @bucket: the bucket to search
232  * @name: The lock name
233  *
234  * Returns: NULL, or the struct gfs2_glock with the requested number
235  */
236
237 static struct gfs2_glock *search_bucket(unsigned int hash,
238                                         const struct gfs2_sbd *sdp,
239                                         const struct lm_lockname *name)
240 {
241         struct gfs2_glock *gl;
242         struct hlist_node *h;
243
244         hlist_for_each_entry(gl, h, &gl_hash_table[hash].hb_list, gl_list) {
245                 if (!lm_name_equal(&gl->gl_name, name))
246                         continue;
247                 if (gl->gl_sbd != sdp)
248                         continue;
249
250                 atomic_inc(&gl->gl_ref);
251
252                 return gl;
253         }
254
255         return NULL;
256 }
257
258 /**
259  * gfs2_glock_find() - Find glock by lock number
260  * @sdp: The GFS2 superblock
261  * @name: The lock name
262  *
263  * Returns: NULL, or the struct gfs2_glock with the requested number
264  */
265
266 static struct gfs2_glock *gfs2_glock_find(const struct gfs2_sbd *sdp,
267                                           const struct lm_lockname *name)
268 {
269         unsigned int hash = gl_hash(sdp, name);
270         struct gfs2_glock *gl;
271
272         read_lock(gl_lock_addr(hash));
273         gl = search_bucket(hash, sdp, name);
274         read_unlock(gl_lock_addr(hash));
275
276         return gl;
277 }
278
279 /**
280  * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
281  * @sdp: The GFS2 superblock
282  * @number: the lock number
283  * @glops: The glock_operations to use
284  * @create: If 0, don't create the glock if it doesn't exist
285  * @glp: the glock is returned here
286  *
287  * This does not lock a glock, just finds/creates structures for one.
288  *
289  * Returns: errno
290  */
291
292 int gfs2_glock_get(struct gfs2_sbd *sdp, u64 number,
293                    const struct gfs2_glock_operations *glops, int create,
294                    struct gfs2_glock **glp)
295 {
296         struct lm_lockname name = { .ln_number = number, .ln_type = glops->go_type };
297         struct gfs2_glock *gl, *tmp;
298         unsigned int hash = gl_hash(sdp, &name);
299         int error;
300
301         read_lock(gl_lock_addr(hash));
302         gl = search_bucket(hash, sdp, &name);
303         read_unlock(gl_lock_addr(hash));
304
305         if (gl || !create) {
306                 *glp = gl;
307                 return 0;
308         }
309
310         gl = kmem_cache_alloc(gfs2_glock_cachep, GFP_KERNEL);
311         if (!gl)
312                 return -ENOMEM;
313
314         gl->gl_flags = 0;
315         gl->gl_name = name;
316         atomic_set(&gl->gl_ref, 1);
317         gl->gl_state = LM_ST_UNLOCKED;
318         gl->gl_hash = hash;
319         gl->gl_owner_pid = 0;
320         gl->gl_ip = 0;
321         gl->gl_ops = glops;
322         gl->gl_req_gh = NULL;
323         gl->gl_req_bh = NULL;
324         gl->gl_vn = 0;
325         gl->gl_stamp = jiffies;
326         gl->gl_object = NULL;
327         gl->gl_sbd = sdp;
328         gl->gl_aspace = NULL;
329         lops_init_le(&gl->gl_le, &gfs2_glock_lops);
330
331         /* If this glock protects actual on-disk data or metadata blocks,
332            create a VFS inode to manage the pages/buffers holding them. */
333         if (glops == &gfs2_inode_glops || glops == &gfs2_rgrp_glops) {
334                 gl->gl_aspace = gfs2_aspace_get(sdp);
335                 if (!gl->gl_aspace) {
336                         error = -ENOMEM;
337                         goto fail;
338                 }
339         }
340
341         error = gfs2_lm_get_lock(sdp, &name, &gl->gl_lock);
342         if (error)
343                 goto fail_aspace;
344
345         write_lock(gl_lock_addr(hash));
346         tmp = search_bucket(hash, sdp, &name);
347         if (tmp) {
348                 write_unlock(gl_lock_addr(hash));
349                 glock_free(gl);
350                 gl = tmp;
351         } else {
352                 hlist_add_head(&gl->gl_list, &gl_hash_table[hash].hb_list);
353                 write_unlock(gl_lock_addr(hash));
354         }
355
356         *glp = gl;
357
358         return 0;
359
360 fail_aspace:
361         if (gl->gl_aspace)
362                 gfs2_aspace_put(gl->gl_aspace);
363 fail:
364         kmem_cache_free(gfs2_glock_cachep, gl);
365         return error;
366 }
367
368 /**
369  * gfs2_holder_init - initialize a struct gfs2_holder in the default way
370  * @gl: the glock
371  * @state: the state we're requesting
372  * @flags: the modifier flags
373  * @gh: the holder structure
374  *
375  */
376
377 void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
378                       struct gfs2_holder *gh)
379 {
380         INIT_LIST_HEAD(&gh->gh_list);
381         gh->gh_gl = gl;
382         gh->gh_ip = (unsigned long)__builtin_return_address(0);
383         gh->gh_owner_pid = current->pid;
384         gh->gh_state = state;
385         gh->gh_flags = flags;
386         gh->gh_error = 0;
387         gh->gh_iflags = 0;
388         gfs2_glock_hold(gl);
389 }
390
391 /**
392  * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
393  * @state: the state we're requesting
394  * @flags: the modifier flags
395  * @gh: the holder structure
396  *
397  * Don't mess with the glock.
398  *
399  */
400
401 void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
402 {
403         gh->gh_state = state;
404         gh->gh_flags = flags;
405         gh->gh_iflags = 0;
406         gh->gh_ip = (unsigned long)__builtin_return_address(0);
407 }
408
409 /**
410  * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
411  * @gh: the holder structure
412  *
413  */
414
415 void gfs2_holder_uninit(struct gfs2_holder *gh)
416 {
417         gfs2_glock_put(gh->gh_gl);
418         gh->gh_gl = NULL;
419         gh->gh_ip = 0;
420 }
421
422 static void gfs2_holder_wake(struct gfs2_holder *gh)
423 {
424         clear_bit(HIF_WAIT, &gh->gh_iflags);
425         smp_mb__after_clear_bit();
426         wake_up_bit(&gh->gh_iflags, HIF_WAIT);
427 }
428
/*
 * Action callback handed to wait_on_bit() in this file: calls
 * schedule() and returns 0. @word is not used.
 */
static int just_schedule(void *word)
{
        schedule();

        return 0;
}
434
435 static void wait_on_holder(struct gfs2_holder *gh)
436 {
437         might_sleep();
438         wait_on_bit(&gh->gh_iflags, HIF_WAIT, just_schedule, TASK_UNINTERRUPTIBLE);
439 }
440
441 static void gfs2_demote_wake(struct gfs2_glock *gl)
442 {
443         clear_bit(GLF_DEMOTE, &gl->gl_flags);
444         smp_mb__after_clear_bit();
445         wake_up_bit(&gl->gl_flags, GLF_DEMOTE);
446 }
447
448 static void wait_on_demote(struct gfs2_glock *gl)
449 {
450         might_sleep();
451         wait_on_bit(&gl->gl_flags, GLF_DEMOTE, just_schedule, TASK_UNINTERRUPTIBLE);
452 }
453
454 /**
455  * rq_mutex - process a mutex request in the queue
456  * @gh: the glock holder
457  *
458  * Returns: 1 if the queue is blocked
459  */
460
461 static int rq_mutex(struct gfs2_holder *gh)
462 {
463         struct gfs2_glock *gl = gh->gh_gl;
464
465         list_del_init(&gh->gh_list);
466         /*  gh->gh_error never examined.  */
467         set_bit(GLF_LOCK, &gl->gl_flags);
468         clear_bit(HIF_WAIT, &gh->gh_iflags);
469         smp_mb();
470         wake_up_bit(&gh->gh_iflags, HIF_WAIT);
471
472         return 1;
473 }
474
475 /**
476  * rq_promote - process a promote request in the queue
477  * @gh: the glock holder
478  *
479  * Acquire a new inter-node lock, or change a lock state to more restrictive.
480  *
481  * Returns: 1 if the queue is blocked
482  */
483
484 static int rq_promote(struct gfs2_holder *gh)
485 {
486         struct gfs2_glock *gl = gh->gh_gl;
487         struct gfs2_sbd *sdp = gl->gl_sbd;
488
489         if (!relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
490                 if (list_empty(&gl->gl_holders)) {
491                         gl->gl_req_gh = gh;
492                         set_bit(GLF_LOCK, &gl->gl_flags);
493                         spin_unlock(&gl->gl_spin);
494
495                         if (atomic_read(&sdp->sd_reclaim_count) >
496                             gfs2_tune_get(sdp, gt_reclaim_limit) &&
497                             !(gh->gh_flags & LM_FLAG_PRIORITY)) {
498                                 gfs2_reclaim_glock(sdp);
499                                 gfs2_reclaim_glock(sdp);
500                         }
501
502                         gfs2_glock_xmote_th(gh->gh_gl, gh);
503                         spin_lock(&gl->gl_spin);
504                 }
505                 return 1;
506         }
507
508         if (list_empty(&gl->gl_holders)) {
509                 set_bit(HIF_FIRST, &gh->gh_iflags);
510                 set_bit(GLF_LOCK, &gl->gl_flags);
511         } else {
512                 struct gfs2_holder *next_gh;
513                 if (gh->gh_state == LM_ST_EXCLUSIVE)
514                         return 1;
515                 next_gh = list_entry(gl->gl_holders.next, struct gfs2_holder,
516                                      gh_list);
517                 if (next_gh->gh_state == LM_ST_EXCLUSIVE)
518                          return 1;
519         }
520
521         list_move_tail(&gh->gh_list, &gl->gl_holders);
522         gh->gh_error = 0;
523         set_bit(HIF_HOLDER, &gh->gh_iflags);
524
525         gfs2_holder_wake(gh);
526
527         return 0;
528 }
529
530 /**
531  * rq_demote - process a demote request in the queue
532  * @gh: the glock holder
533  *
534  * Returns: 1 if the queue is blocked
535  */
536
537 static int rq_demote(struct gfs2_glock *gl)
538 {
539         if (!list_empty(&gl->gl_holders))
540                 return 1;
541
542         if (gl->gl_state == gl->gl_demote_state ||
543             gl->gl_state == LM_ST_UNLOCKED) {
544                 gfs2_demote_wake(gl);
545                 return 0;
546         }
547         set_bit(GLF_LOCK, &gl->gl_flags);
548         spin_unlock(&gl->gl_spin);
549         if (gl->gl_demote_state == LM_ST_UNLOCKED ||
550             gl->gl_state != LM_ST_EXCLUSIVE)
551                 gfs2_glock_drop_th(gl);
552         else
553                 gfs2_glock_xmote_th(gl, NULL);
554         spin_lock(&gl->gl_spin);
555
556         return 0;
557 }
558
559 /**
560  * run_queue - process holder structures on a glock
561  * @gl: the glock
562  *
563  */
564 static void run_queue(struct gfs2_glock *gl)
565 {
566         struct gfs2_holder *gh;
567         int blocked = 1;
568
569         for (;;) {
570                 if (test_bit(GLF_LOCK, &gl->gl_flags))
571                         break;
572
573                 if (!list_empty(&gl->gl_waiters1)) {
574                         gh = list_entry(gl->gl_waiters1.next,
575                                         struct gfs2_holder, gh_list);
576
577                         if (test_bit(HIF_MUTEX, &gh->gh_iflags))
578                                 blocked = rq_mutex(gh);
579                         else
580                                 gfs2_assert_warn(gl->gl_sbd, 0);
581
582                 } else if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
583                         blocked = rq_demote(gl);
584                 } else if (!list_empty(&gl->gl_waiters3)) {
585                         gh = list_entry(gl->gl_waiters3.next,
586                                         struct gfs2_holder, gh_list);
587
588                         if (test_bit(HIF_PROMOTE, &gh->gh_iflags))
589                                 blocked = rq_promote(gh);
590                         else
591                                 gfs2_assert_warn(gl->gl_sbd, 0);
592
593                 } else
594                         break;
595
596                 if (blocked)
597                         break;
598         }
599 }
600
601 /**
602  * gfs2_glmutex_lock - acquire a local lock on a glock
603  * @gl: the glock
604  *
605  * Gives caller exclusive access to manipulate a glock structure.
606  */
607
608 static void gfs2_glmutex_lock(struct gfs2_glock *gl)
609 {
610         struct gfs2_holder gh;
611
612         gfs2_holder_init(gl, 0, 0, &gh);
613         set_bit(HIF_MUTEX, &gh.gh_iflags);
614         if (test_and_set_bit(HIF_WAIT, &gh.gh_iflags))
615                 BUG();
616
617         spin_lock(&gl->gl_spin);
618         if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
619                 list_add_tail(&gh.gh_list, &gl->gl_waiters1);
620         } else {
621                 gl->gl_owner_pid = current->pid;
622                 gl->gl_ip = (unsigned long)__builtin_return_address(0);
623                 clear_bit(HIF_WAIT, &gh.gh_iflags);
624                 smp_mb();
625                 wake_up_bit(&gh.gh_iflags, HIF_WAIT);
626         }
627         spin_unlock(&gl->gl_spin);
628
629         wait_on_holder(&gh);
630         gfs2_holder_uninit(&gh);
631 }
632
633 /**
634  * gfs2_glmutex_trylock - try to acquire a local lock on a glock
635  * @gl: the glock
636  *
637  * Returns: 1 if the glock is acquired
638  */
639
640 static int gfs2_glmutex_trylock(struct gfs2_glock *gl)
641 {
642         int acquired = 1;
643
644         spin_lock(&gl->gl_spin);
645         if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
646                 acquired = 0;
647         } else {
648                 gl->gl_owner_pid = current->pid;
649                 gl->gl_ip = (unsigned long)__builtin_return_address(0);
650         }
651         spin_unlock(&gl->gl_spin);
652
653         return acquired;
654 }
655
656 /**
657  * gfs2_glmutex_unlock - release a local lock on a glock
658  * @gl: the glock
659  *
660  */
661
662 static void gfs2_glmutex_unlock(struct gfs2_glock *gl)
663 {
664         spin_lock(&gl->gl_spin);
665         clear_bit(GLF_LOCK, &gl->gl_flags);
666         gl->gl_owner_pid = 0;
667         gl->gl_ip = 0;
668         run_queue(gl);
669         BUG_ON(!spin_is_locked(&gl->gl_spin));
670         spin_unlock(&gl->gl_spin);
671 }
672
673 /**
674  * handle_callback - process a demote request
675  * @gl: the glock
676  * @state: the state the caller wants us to change to
677  *
678  * There are only two requests that we are going to see in actual
679  * practise: LM_ST_SHARED and LM_ST_UNLOCKED
680  */
681
682 static void handle_callback(struct gfs2_glock *gl, unsigned int state, int remote)
683 {
684         spin_lock(&gl->gl_spin);
685         if (test_and_set_bit(GLF_DEMOTE, &gl->gl_flags) == 0) {
686                 gl->gl_demote_state = state;
687                 gl->gl_demote_time = jiffies;
688                 if (remote && gl->gl_ops->go_type == LM_TYPE_IOPEN &&
689                     gl->gl_object) {
690                         struct inode *inode = igrab(gl->gl_object);
691                         spin_unlock(&gl->gl_spin);
692                         if (inode) {
693                                 d_prune_aliases(inode);
694                                 iput(inode);
695                         }
696                         return;
697                 }
698         } else if (gl->gl_demote_state != LM_ST_UNLOCKED) {
699                 gl->gl_demote_state = state;
700         }
701         spin_unlock(&gl->gl_spin);
702 }
703
704 /**
705  * state_change - record that the glock is now in a different state
706  * @gl: the glock
707  * @new_state the new state
708  *
709  */
710
711 static void state_change(struct gfs2_glock *gl, unsigned int new_state)
712 {
713         int held1, held2;
714
715         held1 = (gl->gl_state != LM_ST_UNLOCKED);
716         held2 = (new_state != LM_ST_UNLOCKED);
717
718         if (held1 != held2) {
719                 if (held2)
720                         gfs2_glock_hold(gl);
721                 else
722                         gfs2_glock_put(gl);
723         }
724
725         gl->gl_state = new_state;
726 }
727
728 /**
729  * xmote_bh - Called after the lock module is done acquiring a lock
730  * @gl: The glock in question
731  * @ret: the int returned from the lock module
732  *
733  */
734
735 static void xmote_bh(struct gfs2_glock *gl, unsigned int ret)
736 {
737         struct gfs2_sbd *sdp = gl->gl_sbd;
738         const struct gfs2_glock_operations *glops = gl->gl_ops;
739         struct gfs2_holder *gh = gl->gl_req_gh;
740         int prev_state = gl->gl_state;
741         int op_done = 1;
742
743         gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
744         gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
745         gfs2_assert_warn(sdp, !(ret & LM_OUT_ASYNC));
746
747         state_change(gl, ret & LM_OUT_ST_MASK);
748
749         if (prev_state != LM_ST_UNLOCKED && !(ret & LM_OUT_CACHEABLE)) {
750                 if (glops->go_inval)
751                         glops->go_inval(gl, DIO_METADATA);
752         } else if (gl->gl_state == LM_ST_DEFERRED) {
753                 /* We might not want to do this here.
754                    Look at moving to the inode glops. */
755                 if (glops->go_inval)
756                         glops->go_inval(gl, 0);
757         }
758
759         /*  Deal with each possible exit condition  */
760
761         if (!gh) {
762                 gl->gl_stamp = jiffies;
763                 if (ret & LM_OUT_CANCELED)
764                         op_done = 0;
765                 else
766                         gfs2_demote_wake(gl);
767         } else {
768                 spin_lock(&gl->gl_spin);
769                 list_del_init(&gh->gh_list);
770                 gh->gh_error = -EIO;
771                 if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) 
772                         goto out;
773                 gh->gh_error = GLR_CANCELED;
774                 if (ret & LM_OUT_CANCELED) 
775                         goto out;
776                 if (relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
777                         list_add_tail(&gh->gh_list, &gl->gl_holders);
778                         gh->gh_error = 0;
779                         set_bit(HIF_HOLDER, &gh->gh_iflags);
780                         set_bit(HIF_FIRST, &gh->gh_iflags);
781                         op_done = 0;
782                         goto out;
783                 }
784                 gh->gh_error = GLR_TRYFAILED;
785                 if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))
786                         goto out;
787                 gh->gh_error = -EINVAL;
788                 if (gfs2_assert_withdraw(sdp, 0) == -1)
789                         fs_err(sdp, "ret = 0x%.8X\n", ret);
790 out:
791                 spin_unlock(&gl->gl_spin);
792         }
793
794         if (glops->go_xmote_bh)
795                 glops->go_xmote_bh(gl);
796
797         if (op_done) {
798                 spin_lock(&gl->gl_spin);
799                 gl->gl_req_gh = NULL;
800                 gl->gl_req_bh = NULL;
801                 clear_bit(GLF_LOCK, &gl->gl_flags);
802                 run_queue(gl);
803                 spin_unlock(&gl->gl_spin);
804         }
805
806         gfs2_glock_put(gl);
807
808         if (gh)
809                 gfs2_holder_wake(gh);
810 }
811
812 /**
813  * gfs2_glock_xmote_th - Call into the lock module to acquire or change a glock
814  * @gl: The glock in question
815  * @state: the requested state
816  * @flags: modifier flags to the lock call
817  *
818  */
819
820 void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh)
821 {
822         struct gfs2_sbd *sdp = gl->gl_sbd;
823         int flags = gh ? gh->gh_flags : 0;
824         unsigned state = gh ? gh->gh_state : gl->gl_demote_state;
825         const struct gfs2_glock_operations *glops = gl->gl_ops;
826         int lck_flags = flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB |
827                                  LM_FLAG_NOEXP | LM_FLAG_ANY |
828                                  LM_FLAG_PRIORITY);
829         unsigned int lck_ret;
830
831         if (glops->go_xmote_th)
832                 glops->go_xmote_th(gl);
833
834         gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
835         gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
836         gfs2_assert_warn(sdp, state != LM_ST_UNLOCKED);
837         gfs2_assert_warn(sdp, state != gl->gl_state);
838
839         gfs2_glock_hold(gl);
840         gl->gl_req_bh = xmote_bh;
841
842         lck_ret = gfs2_lm_lock(sdp, gl->gl_lock, gl->gl_state, state, lck_flags);
843
844         if (gfs2_assert_withdraw(sdp, !(lck_ret & LM_OUT_ERROR)))
845                 return;
846
847         if (lck_ret & LM_OUT_ASYNC)
848                 gfs2_assert_warn(sdp, lck_ret == LM_OUT_ASYNC);
849         else
850                 xmote_bh(gl, lck_ret);
851 }
852
853 /**
854  * drop_bh - Called after a lock module unlock completes
855  * @gl: the glock
856  * @ret: the return status
857  *
858  * Doesn't wake up the process waiting on the struct gfs2_holder (if any)
859  * Doesn't drop the reference on the glock the top half took out
860  *
861  */
862
863 static void drop_bh(struct gfs2_glock *gl, unsigned int ret)
864 {
865         struct gfs2_sbd *sdp = gl->gl_sbd;
866         const struct gfs2_glock_operations *glops = gl->gl_ops;
867         struct gfs2_holder *gh = gl->gl_req_gh;
868
869         gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
870         gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
871         gfs2_assert_warn(sdp, !ret);
872
873         state_change(gl, LM_ST_UNLOCKED);
874         gfs2_demote_wake(gl);
875
876         if (glops->go_inval)
877                 glops->go_inval(gl, DIO_METADATA);
878
879         if (gh) {
880                 spin_lock(&gl->gl_spin);
881                 list_del_init(&gh->gh_list);
882                 gh->gh_error = 0;
883                 spin_unlock(&gl->gl_spin);
884         }
885
886         spin_lock(&gl->gl_spin);
887         gl->gl_req_gh = NULL;
888         gl->gl_req_bh = NULL;
889         clear_bit(GLF_LOCK, &gl->gl_flags);
890         run_queue(gl);
891         spin_unlock(&gl->gl_spin);
892
893         gfs2_glock_put(gl);
894
895         if (gh)
896                 gfs2_holder_wake(gh);
897 }
898
899 /**
900  * gfs2_glock_drop_th - call into the lock module to unlock a lock
901  * @gl: the glock
902  *
903  */
904
905 static void gfs2_glock_drop_th(struct gfs2_glock *gl)
906 {
907         struct gfs2_sbd *sdp = gl->gl_sbd;
908         const struct gfs2_glock_operations *glops = gl->gl_ops;
909         unsigned int ret;
910
911         if (glops->go_drop_th)
912                 glops->go_drop_th(gl);
913
914         gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
915         gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
916         gfs2_assert_warn(sdp, gl->gl_state != LM_ST_UNLOCKED);
917
918         gfs2_glock_hold(gl);
919         gl->gl_req_bh = drop_bh;
920
921         ret = gfs2_lm_unlock(sdp, gl->gl_lock, gl->gl_state);
922
923         if (gfs2_assert_withdraw(sdp, !(ret & LM_OUT_ERROR)))
924                 return;
925
926         if (!ret)
927                 drop_bh(gl, ret);
928         else
929                 gfs2_assert_warn(sdp, ret == LM_OUT_ASYNC);
930 }
931
932 /**
933  * do_cancels - cancel requests for locks stuck waiting on an expire flag
934  * @gh: the LM_FLAG_PRIORITY holder waiting to acquire the lock
935  *
936  * Don't cancel GL_NOCANCEL requests.
937  */
938
939 static void do_cancels(struct gfs2_holder *gh)
940 {
941         struct gfs2_glock *gl = gh->gh_gl;
942
943         spin_lock(&gl->gl_spin);
944
945         while (gl->gl_req_gh != gh &&
946                !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
947                !list_empty(&gh->gh_list)) {
948                 if (gl->gl_req_bh && !(gl->gl_req_gh &&
949                                      (gl->gl_req_gh->gh_flags & GL_NOCANCEL))) {
950                         spin_unlock(&gl->gl_spin);
951                         gfs2_lm_cancel(gl->gl_sbd, gl->gl_lock);
952                         msleep(100);
953                         spin_lock(&gl->gl_spin);
954                 } else {
955                         spin_unlock(&gl->gl_spin);
956                         msleep(100);
957                         spin_lock(&gl->gl_spin);
958                 }
959         }
960
961         spin_unlock(&gl->gl_spin);
962 }
963
964 /**
965  * glock_wait_internal - wait on a glock acquisition
966  * @gh: the glock holder
967  *
968  * Returns: 0 on success
969  */
970
971 static int glock_wait_internal(struct gfs2_holder *gh)
972 {
973         struct gfs2_glock *gl = gh->gh_gl;
974         struct gfs2_sbd *sdp = gl->gl_sbd;
975         const struct gfs2_glock_operations *glops = gl->gl_ops;
976
977         if (test_bit(HIF_ABORTED, &gh->gh_iflags))
978                 return -EIO;
979
980         if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
981                 spin_lock(&gl->gl_spin);
982                 if (gl->gl_req_gh != gh &&
983                     !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
984                     !list_empty(&gh->gh_list)) {
985                         list_del_init(&gh->gh_list);
986                         gh->gh_error = GLR_TRYFAILED;
987                         run_queue(gl);
988                         spin_unlock(&gl->gl_spin);
989                         return gh->gh_error;
990                 }
991                 spin_unlock(&gl->gl_spin);
992         }
993
994         if (gh->gh_flags & LM_FLAG_PRIORITY)
995                 do_cancels(gh);
996
997         wait_on_holder(gh);
998         if (gh->gh_error)
999                 return gh->gh_error;
1000
1001         gfs2_assert_withdraw(sdp, test_bit(HIF_HOLDER, &gh->gh_iflags));
1002         gfs2_assert_withdraw(sdp, relaxed_state_ok(gl->gl_state, gh->gh_state,
1003                                                    gh->gh_flags));
1004
1005         if (test_bit(HIF_FIRST, &gh->gh_iflags)) {
1006                 gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
1007
1008                 if (glops->go_lock) {
1009                         gh->gh_error = glops->go_lock(gh);
1010                         if (gh->gh_error) {
1011                                 spin_lock(&gl->gl_spin);
1012                                 list_del_init(&gh->gh_list);
1013                                 spin_unlock(&gl->gl_spin);
1014                         }
1015                 }
1016
1017                 spin_lock(&gl->gl_spin);
1018                 gl->gl_req_gh = NULL;
1019                 gl->gl_req_bh = NULL;
1020                 clear_bit(GLF_LOCK, &gl->gl_flags);
1021                 run_queue(gl);
1022                 spin_unlock(&gl->gl_spin);
1023         }
1024
1025         return gh->gh_error;
1026 }
1027
1028 static inline struct gfs2_holder *
1029 find_holder_by_owner(struct list_head *head, pid_t pid)
1030 {
1031         struct gfs2_holder *gh;
1032
1033         list_for_each_entry(gh, head, gh_list) {
1034                 if (gh->gh_owner_pid == pid)
1035                         return gh;
1036         }
1037
1038         return NULL;
1039 }
1040
1041 static void print_dbg(struct glock_iter *gi, const char *fmt, ...)
1042 {
1043         va_list args;
1044
1045         va_start(args, fmt);
1046         if (gi) {
1047                 vsprintf(gi->string, fmt, args);
1048                 seq_printf(gi->seq, gi->string);
1049         }
1050         else
1051                 vprintk(fmt, args);
1052         va_end(args);
1053 }
1054
1055 /**
1056  * add_to_queue - Add a holder to the wait queue (but look for recursion)
1057  * @gh: the holder structure to add
1058  *
1059  */
1060
1061 static void add_to_queue(struct gfs2_holder *gh)
1062 {
1063         struct gfs2_glock *gl = gh->gh_gl;
1064         struct gfs2_holder *existing;
1065
1066         BUG_ON(!gh->gh_owner_pid);
1067         if (test_and_set_bit(HIF_WAIT, &gh->gh_iflags))
1068                 BUG();
1069
1070         existing = find_holder_by_owner(&gl->gl_holders, gh->gh_owner_pid);
1071         if (existing) {
1072                 print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1073                 printk(KERN_INFO "pid : %d\n", existing->gh_owner_pid);
1074                 printk(KERN_INFO "lock type : %d lock state : %d\n",
1075                                 existing->gh_gl->gl_name.ln_type, existing->gh_gl->gl_state);
1076                 print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1077                 printk(KERN_INFO "pid : %d\n", gh->gh_owner_pid);
1078                 printk(KERN_INFO "lock type : %d lock state : %d\n",
1079                                 gl->gl_name.ln_type, gl->gl_state);
1080                 BUG();
1081         }
1082
1083         existing = find_holder_by_owner(&gl->gl_waiters3, gh->gh_owner_pid);
1084         if (existing) {
1085                 print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1086                 print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1087                 BUG();
1088         }
1089
1090         if (gh->gh_flags & LM_FLAG_PRIORITY)
1091                 list_add(&gh->gh_list, &gl->gl_waiters3);
1092         else
1093                 list_add_tail(&gh->gh_list, &gl->gl_waiters3);
1094 }
1095
1096 /**
1097  * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
1098  * @gh: the holder structure
1099  *
1100  * if (gh->gh_flags & GL_ASYNC), this never returns an error
1101  *
1102  * Returns: 0, GLR_TRYFAILED, or errno on failure
1103  */
1104
1105 int gfs2_glock_nq(struct gfs2_holder *gh)
1106 {
1107         struct gfs2_glock *gl = gh->gh_gl;
1108         struct gfs2_sbd *sdp = gl->gl_sbd;
1109         int error = 0;
1110
1111 restart:
1112         if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
1113                 set_bit(HIF_ABORTED, &gh->gh_iflags);
1114                 return -EIO;
1115         }
1116
1117         set_bit(HIF_PROMOTE, &gh->gh_iflags);
1118
1119         spin_lock(&gl->gl_spin);
1120         add_to_queue(gh);
1121         run_queue(gl);
1122         spin_unlock(&gl->gl_spin);
1123
1124         if (!(gh->gh_flags & GL_ASYNC)) {
1125                 error = glock_wait_internal(gh);
1126                 if (error == GLR_CANCELED) {
1127                         msleep(100);
1128                         goto restart;
1129                 }
1130         }
1131
1132         return error;
1133 }
1134
1135 /**
1136  * gfs2_glock_poll - poll to see if an async request has been completed
1137  * @gh: the holder
1138  *
1139  * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
1140  */
1141
1142 int gfs2_glock_poll(struct gfs2_holder *gh)
1143 {
1144         struct gfs2_glock *gl = gh->gh_gl;
1145         int ready = 0;
1146
1147         spin_lock(&gl->gl_spin);
1148
1149         if (test_bit(HIF_HOLDER, &gh->gh_iflags))
1150                 ready = 1;
1151         else if (list_empty(&gh->gh_list)) {
1152                 if (gh->gh_error == GLR_CANCELED) {
1153                         spin_unlock(&gl->gl_spin);
1154                         msleep(100);
1155                         if (gfs2_glock_nq(gh))
1156                                 return 1;
1157                         return 0;
1158                 } else
1159                         ready = 1;
1160         }
1161
1162         spin_unlock(&gl->gl_spin);
1163
1164         return ready;
1165 }
1166
1167 /**
1168  * gfs2_glock_wait - wait for a lock acquisition that ended in a GLR_ASYNC
1169  * @gh: the holder structure
1170  *
1171  * Returns: 0, GLR_TRYFAILED, or errno on failure
1172  */
1173
1174 int gfs2_glock_wait(struct gfs2_holder *gh)
1175 {
1176         int error;
1177
1178         error = glock_wait_internal(gh);
1179         if (error == GLR_CANCELED) {
1180                 msleep(100);
1181                 gh->gh_flags &= ~GL_ASYNC;
1182                 error = gfs2_glock_nq(gh);
1183         }
1184
1185         return error;
1186 }
1187
1188 /**
1189  * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
1190  * @gh: the glock holder
1191  *
1192  */
1193
1194 void gfs2_glock_dq(struct gfs2_holder *gh)
1195 {
1196         struct gfs2_glock *gl = gh->gh_gl;
1197         const struct gfs2_glock_operations *glops = gl->gl_ops;
1198
1199         if (gh->gh_flags & GL_NOCACHE)
1200                 handle_callback(gl, LM_ST_UNLOCKED, 0);
1201
1202         gfs2_glmutex_lock(gl);
1203
1204         spin_lock(&gl->gl_spin);
1205         list_del_init(&gh->gh_list);
1206
1207         if (list_empty(&gl->gl_holders)) {
1208                 spin_unlock(&gl->gl_spin);
1209
1210                 if (glops->go_unlock)
1211                         glops->go_unlock(gh);
1212
1213                 spin_lock(&gl->gl_spin);
1214                 gl->gl_stamp = jiffies;
1215         }
1216
1217         clear_bit(GLF_LOCK, &gl->gl_flags);
1218         run_queue(gl);
1219         spin_unlock(&gl->gl_spin);
1220 }
1221
1222 void gfs2_glock_dq_wait(struct gfs2_holder *gh)
1223 {
1224         struct gfs2_glock *gl = gh->gh_gl;
1225         gfs2_glock_dq(gh);
1226         wait_on_demote(gl);
1227 }
1228
/**
 * gfs2_glock_dq_uninit - dequeue a holder from a glock and uninitialize it
 * @gh: the holder structure
 *
 * Convenience wrapper: gfs2_glock_dq() followed by gfs2_holder_uninit().
 */

void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
{
	/* Release first, then tear the holder down */
	gfs2_glock_dq(gh);

	gfs2_holder_uninit(gh);
}
1240
1241 /**
1242  * gfs2_glock_nq_num - acquire a glock based on lock number
1243  * @sdp: the filesystem
1244  * @number: the lock number
1245  * @glops: the glock operations for the type of glock
1246  * @state: the state to acquire the glock in
1247  * @flags: modifier flags for the aquisition
1248  * @gh: the struct gfs2_holder
1249  *
1250  * Returns: errno
1251  */
1252
1253 int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
1254                       const struct gfs2_glock_operations *glops,
1255                       unsigned int state, int flags, struct gfs2_holder *gh)
1256 {
1257         struct gfs2_glock *gl;
1258         int error;
1259
1260         error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
1261         if (!error) {
1262                 error = gfs2_glock_nq_init(gl, state, flags, gh);
1263                 gfs2_glock_put(gl);
1264         }
1265
1266         return error;
1267 }
1268
1269 /**
1270  * glock_compare - Compare two struct gfs2_glock structures for sorting
1271  * @arg_a: the first structure
1272  * @arg_b: the second structure
1273  *
1274  */
1275
1276 static int glock_compare(const void *arg_a, const void *arg_b)
1277 {
1278         const struct gfs2_holder *gh_a = *(const struct gfs2_holder **)arg_a;
1279         const struct gfs2_holder *gh_b = *(const struct gfs2_holder **)arg_b;
1280         const struct lm_lockname *a = &gh_a->gh_gl->gl_name;
1281         const struct lm_lockname *b = &gh_b->gh_gl->gl_name;
1282
1283         if (a->ln_number > b->ln_number)
1284                 return 1;
1285         if (a->ln_number < b->ln_number)
1286                 return -1;
1287         BUG_ON(gh_a->gh_gl->gl_ops->go_type == gh_b->gh_gl->gl_ops->go_type);
1288         return 0;
1289 }
1290
1291 /**
1292  * nq_m_sync - synchonously acquire more than one glock in deadlock free order
1293  * @num_gh: the number of structures
1294  * @ghs: an array of struct gfs2_holder structures
1295  *
1296  * Returns: 0 on success (all glocks acquired),
1297  *          errno on failure (no glocks acquired)
1298  */
1299
1300 static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
1301                      struct gfs2_holder **p)
1302 {
1303         unsigned int x;
1304         int error = 0;
1305
1306         for (x = 0; x < num_gh; x++)
1307                 p[x] = &ghs[x];
1308
1309         sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);
1310
1311         for (x = 0; x < num_gh; x++) {
1312                 p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1313
1314                 error = gfs2_glock_nq(p[x]);
1315                 if (error) {
1316                         while (x--)
1317                                 gfs2_glock_dq(p[x]);
1318                         break;
1319                 }
1320         }
1321
1322         return error;
1323 }
1324
1325 /**
1326  * gfs2_glock_nq_m - acquire multiple glocks
1327  * @num_gh: the number of structures
1328  * @ghs: an array of struct gfs2_holder structures
1329  *
1330  * Figure out how big an impact this function has.  Either:
1331  * 1) Replace this code with code that calls gfs2_glock_prefetch()
1332  * 2) Forget async stuff and just call nq_m_sync()
1333  * 3) Leave it like it is
1334  *
1335  * Returns: 0 on success (all glocks acquired),
1336  *          errno on failure (no glocks acquired)
1337  */
1338
1339 int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1340 {
1341         int *e;
1342         unsigned int x;
1343         int borked = 0, serious = 0;
1344         int error = 0;
1345
1346         if (!num_gh)
1347                 return 0;
1348
1349         if (num_gh == 1) {
1350                 ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1351                 return gfs2_glock_nq(ghs);
1352         }
1353
1354         e = kcalloc(num_gh, sizeof(struct gfs2_holder *), GFP_KERNEL);
1355         if (!e)
1356                 return -ENOMEM;
1357
1358         for (x = 0; x < num_gh; x++) {
1359                 ghs[x].gh_flags |= LM_FLAG_TRY | GL_ASYNC;
1360                 error = gfs2_glock_nq(&ghs[x]);
1361                 if (error) {
1362                         borked = 1;
1363                         serious = error;
1364                         num_gh = x;
1365                         break;
1366                 }
1367         }
1368
1369         for (x = 0; x < num_gh; x++) {
1370                 error = e[x] = glock_wait_internal(&ghs[x]);
1371                 if (error) {
1372                         borked = 1;
1373                         if (error != GLR_TRYFAILED && error != GLR_CANCELED)
1374                                 serious = error;
1375                 }
1376         }
1377
1378         if (!borked) {
1379                 kfree(e);
1380                 return 0;
1381         }
1382
1383         for (x = 0; x < num_gh; x++)
1384                 if (!e[x])
1385                         gfs2_glock_dq(&ghs[x]);
1386
1387         if (serious)
1388                 error = serious;
1389         else {
1390                 for (x = 0; x < num_gh; x++)
1391                         gfs2_holder_reinit(ghs[x].gh_state, ghs[x].gh_flags,
1392                                           &ghs[x]);
1393                 error = nq_m_sync(num_gh, ghs, (struct gfs2_holder **)e);
1394         }
1395
1396         kfree(e);
1397
1398         return error;
1399 }
1400
1401 /**
1402  * gfs2_glock_dq_m - release multiple glocks
1403  * @num_gh: the number of structures
1404  * @ghs: an array of struct gfs2_holder structures
1405  *
1406  */
1407
1408 void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1409 {
1410         unsigned int x;
1411
1412         for (x = 0; x < num_gh; x++)
1413                 gfs2_glock_dq(&ghs[x]);
1414 }
1415
1416 /**
1417  * gfs2_glock_dq_uninit_m - release multiple glocks
1418  * @num_gh: the number of structures
1419  * @ghs: an array of struct gfs2_holder structures
1420  *
1421  */
1422
1423 void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
1424 {
1425         unsigned int x;
1426
1427         for (x = 0; x < num_gh; x++)
1428                 gfs2_glock_dq_uninit(&ghs[x]);
1429 }
1430
1431 /**
1432  * gfs2_lvb_hold - attach a LVB from a glock
1433  * @gl: The glock in question
1434  *
1435  */
1436
1437 int gfs2_lvb_hold(struct gfs2_glock *gl)
1438 {
1439         int error;
1440
1441         gfs2_glmutex_lock(gl);
1442
1443         if (!atomic_read(&gl->gl_lvb_count)) {
1444                 error = gfs2_lm_hold_lvb(gl->gl_sbd, gl->gl_lock, &gl->gl_lvb);
1445                 if (error) {
1446                         gfs2_glmutex_unlock(gl);
1447                         return error;
1448                 }
1449                 gfs2_glock_hold(gl);
1450         }
1451         atomic_inc(&gl->gl_lvb_count);
1452
1453         gfs2_glmutex_unlock(gl);
1454
1455         return 0;
1456 }
1457
1458 /**
1459  * gfs2_lvb_unhold - detach a LVB from a glock
1460  * @gl: The glock in question
1461  *
1462  */
1463
1464 void gfs2_lvb_unhold(struct gfs2_glock *gl)
1465 {
1466         gfs2_glock_hold(gl);
1467         gfs2_glmutex_lock(gl);
1468
1469         gfs2_assert(gl->gl_sbd, atomic_read(&gl->gl_lvb_count) > 0);
1470         if (atomic_dec_and_test(&gl->gl_lvb_count)) {
1471                 gfs2_lm_unhold_lvb(gl->gl_sbd, gl->gl_lock, gl->gl_lvb);
1472                 gl->gl_lvb = NULL;
1473                 gfs2_glock_put(gl);
1474         }
1475
1476         gfs2_glmutex_unlock(gl);
1477         gfs2_glock_put(gl);
1478 }
1479
1480 static void blocking_cb(struct gfs2_sbd *sdp, struct lm_lockname *name,
1481                         unsigned int state)
1482 {
1483         struct gfs2_glock *gl;
1484
1485         gl = gfs2_glock_find(sdp, name);
1486         if (!gl)
1487                 return;
1488
1489         handle_callback(gl, state, 1);
1490
1491         spin_lock(&gl->gl_spin);
1492         run_queue(gl);
1493         spin_unlock(&gl->gl_spin);
1494
1495         gfs2_glock_put(gl);
1496 }
1497
1498 /**
1499  * gfs2_glock_cb - Callback used by locking module
1500  * @sdp: Pointer to the superblock
1501  * @type: Type of callback
1502  * @data: Type dependent data pointer
1503  *
1504  * Called by the locking module when it wants to tell us something.
1505  * Either we need to drop a lock, one of our ASYNC requests completed, or
1506  * a journal from another client needs to be recovered.
1507  */
1508
1509 void gfs2_glock_cb(void *cb_data, unsigned int type, void *data)
1510 {
1511         struct gfs2_sbd *sdp = cb_data;
1512
1513         switch (type) {
1514         case LM_CB_NEED_E:
1515                 blocking_cb(sdp, data, LM_ST_UNLOCKED);
1516                 return;
1517
1518         case LM_CB_NEED_D:
1519                 blocking_cb(sdp, data, LM_ST_DEFERRED);
1520                 return;
1521
1522         case LM_CB_NEED_S:
1523                 blocking_cb(sdp, data, LM_ST_SHARED);
1524                 return;
1525
1526         case LM_CB_ASYNC: {
1527                 struct lm_async_cb *async = data;
1528                 struct gfs2_glock *gl;
1529
1530                 down_read(&gfs2_umount_flush_sem);
1531                 gl = gfs2_glock_find(sdp, &async->lc_name);
1532                 if (gfs2_assert_warn(sdp, gl))
1533                         return;
1534                 if (!gfs2_assert_warn(sdp, gl->gl_req_bh))
1535                         gl->gl_req_bh(gl, async->lc_ret);
1536                 gfs2_glock_put(gl);
1537                 up_read(&gfs2_umount_flush_sem);
1538                 return;
1539         }
1540
1541         case LM_CB_NEED_RECOVERY:
1542                 gfs2_jdesc_make_dirty(sdp, *(unsigned int *)data);
1543                 if (sdp->sd_recoverd_process)
1544                         wake_up_process(sdp->sd_recoverd_process);
1545                 return;
1546
1547         case LM_CB_DROPLOCKS:
1548                 gfs2_gl_hash_clear(sdp, NO_WAIT);
1549                 gfs2_quota_scan(sdp);
1550                 return;
1551
1552         default:
1553                 gfs2_assert_warn(sdp, 0);
1554                 return;
1555         }
1556 }
1557
1558 /**
1559  * demote_ok - Check to see if it's ok to unlock a glock
1560  * @gl: the glock
1561  *
1562  * Returns: 1 if it's ok
1563  */
1564
1565 static int demote_ok(struct gfs2_glock *gl)
1566 {
1567         const struct gfs2_glock_operations *glops = gl->gl_ops;
1568         int demote = 1;
1569
1570         if (test_bit(GLF_STICKY, &gl->gl_flags))
1571                 demote = 0;
1572         else if (glops->go_demote_ok)
1573                 demote = glops->go_demote_ok(gl);
1574
1575         return demote;
1576 }
1577
1578 /**
1579  * gfs2_glock_schedule_for_reclaim - Add a glock to the reclaim list
1580  * @gl: the glock
1581  *
1582  */
1583
1584 void gfs2_glock_schedule_for_reclaim(struct gfs2_glock *gl)
1585 {
1586         struct gfs2_sbd *sdp = gl->gl_sbd;
1587
1588         spin_lock(&sdp->sd_reclaim_lock);
1589         if (list_empty(&gl->gl_reclaim)) {
1590                 gfs2_glock_hold(gl);
1591                 list_add(&gl->gl_reclaim, &sdp->sd_reclaim_list);
1592                 atomic_inc(&sdp->sd_reclaim_count);
1593         }
1594         spin_unlock(&sdp->sd_reclaim_lock);
1595
1596         wake_up(&sdp->sd_reclaim_wq);
1597 }
1598
1599 /**
1600  * gfs2_reclaim_glock - process the next glock on the filesystem's reclaim list
1601  * @sdp: the filesystem
1602  *
1603  * Called from gfs2_glockd() glock reclaim daemon, or when promoting a
1604  * different glock and we notice that there are a lot of glocks in the
1605  * reclaim list.
1606  *
1607  */
1608
1609 void gfs2_reclaim_glock(struct gfs2_sbd *sdp)
1610 {
1611         struct gfs2_glock *gl;
1612
1613         spin_lock(&sdp->sd_reclaim_lock);
1614         if (list_empty(&sdp->sd_reclaim_list)) {
1615                 spin_unlock(&sdp->sd_reclaim_lock);
1616                 return;
1617         }
1618         gl = list_entry(sdp->sd_reclaim_list.next,
1619                         struct gfs2_glock, gl_reclaim);
1620         list_del_init(&gl->gl_reclaim);
1621         spin_unlock(&sdp->sd_reclaim_lock);
1622
1623         atomic_dec(&sdp->sd_reclaim_count);
1624         atomic_inc(&sdp->sd_reclaimed);
1625
1626         if (gfs2_glmutex_trylock(gl)) {
1627                 if (list_empty(&gl->gl_holders) &&
1628                     gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1629                         handle_callback(gl, LM_ST_UNLOCKED, 0);
1630                 gfs2_glmutex_unlock(gl);
1631         }
1632
1633         gfs2_glock_put(gl);
1634 }
1635
1636 /**
1637  * examine_bucket - Call a function for glock in a hash bucket
1638  * @examiner: the function
1639  * @sdp: the filesystem
1640  * @bucket: the bucket
1641  *
1642  * Returns: 1 if the bucket has entries
1643  */
1644
1645 static int examine_bucket(glock_examiner examiner, struct gfs2_sbd *sdp,
1646                           unsigned int hash)
1647 {
1648         struct gfs2_glock *gl, *prev = NULL;
1649         int has_entries = 0;
1650         struct hlist_head *head = &gl_hash_table[hash].hb_list;
1651
1652         read_lock(gl_lock_addr(hash));
1653         /* Can't use hlist_for_each_entry - don't want prefetch here */
1654         if (hlist_empty(head))
1655                 goto out;
1656         gl = list_entry(head->first, struct gfs2_glock, gl_list);
1657         while(1) {
1658                 if (gl->gl_sbd == sdp) {
1659                         gfs2_glock_hold(gl);
1660                         read_unlock(gl_lock_addr(hash));
1661                         if (prev)
1662                                 gfs2_glock_put(prev);
1663                         prev = gl;
1664                         examiner(gl);
1665                         has_entries = 1;
1666                         read_lock(gl_lock_addr(hash));
1667                 }
1668                 if (gl->gl_list.next == NULL)
1669                         break;
1670                 gl = list_entry(gl->gl_list.next, struct gfs2_glock, gl_list);
1671         }
1672 out:
1673         read_unlock(gl_lock_addr(hash));
1674         if (prev)
1675                 gfs2_glock_put(prev);
1676         return has_entries;
1677 }
1678
1679 /**
1680  * scan_glock - look at a glock and see if we can reclaim it
1681  * @gl: the glock to look at
1682  *
1683  */
1684
1685 static void scan_glock(struct gfs2_glock *gl)
1686 {
1687         if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object)
1688                 return;
1689
1690         if (gfs2_glmutex_trylock(gl)) {
1691                 if (list_empty(&gl->gl_holders) &&
1692                     gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1693                         goto out_schedule;
1694                 gfs2_glmutex_unlock(gl);
1695         }
1696         return;
1697
1698 out_schedule:
1699         gfs2_glmutex_unlock(gl);
1700         gfs2_glock_schedule_for_reclaim(gl);
1701 }
1702
1703 /**
1704  * gfs2_scand_internal - Look for glocks and inodes to toss from memory
1705  * @sdp: the filesystem
1706  *
1707  */
1708
1709 void gfs2_scand_internal(struct gfs2_sbd *sdp)
1710 {
1711         unsigned int x;
1712
1713         for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
1714                 examine_bucket(scan_glock, sdp, x);
1715 }
1716
1717 /**
1718  * clear_glock - look at a glock and see if we can free it from glock cache
1719  * @gl: the glock to look at
1720  *
1721  */
1722
1723 static void clear_glock(struct gfs2_glock *gl)
1724 {
1725         struct gfs2_sbd *sdp = gl->gl_sbd;
1726         int released;
1727
1728         spin_lock(&sdp->sd_reclaim_lock);
1729         if (!list_empty(&gl->gl_reclaim)) {
1730                 list_del_init(&gl->gl_reclaim);
1731                 atomic_dec(&sdp->sd_reclaim_count);
1732                 spin_unlock(&sdp->sd_reclaim_lock);
1733                 released = gfs2_glock_put(gl);
1734                 gfs2_assert(sdp, !released);
1735         } else {
1736                 spin_unlock(&sdp->sd_reclaim_lock);
1737         }
1738
1739         if (gfs2_glmutex_trylock(gl)) {
1740                 if (list_empty(&gl->gl_holders) &&
1741                     gl->gl_state != LM_ST_UNLOCKED)
1742                         handle_callback(gl, LM_ST_UNLOCKED, 0);
1743                 gfs2_glmutex_unlock(gl);
1744         }
1745 }
1746
1747 /**
1748  * gfs2_gl_hash_clear - Empty out the glock hash table
1749  * @sdp: the filesystem
1750  * @wait: wait until it's all gone
1751  *
1752  * Called when unmounting the filesystem, or when inter-node lock manager
1753  * requests DROPLOCKS because it is running out of capacity.
1754  */
1755
1756 void gfs2_gl_hash_clear(struct gfs2_sbd *sdp, int wait)
1757 {
1758         unsigned long t;
1759         unsigned int x;
1760         int cont;
1761
1762         t = jiffies;
1763
1764         for (;;) {
1765                 cont = 0;
1766                 for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1767                         if (examine_bucket(clear_glock, sdp, x))
1768                                 cont = 1;
1769                 }
1770
1771                 if (!wait || !cont)
1772                         break;
1773
1774                 if (time_after_eq(jiffies,
1775                                   t + gfs2_tune_get(sdp, gt_stall_secs) * HZ)) {
1776                         fs_warn(sdp, "Unmount seems to be stalled. "
1777                                      "Dumping lock state...\n");
1778                         gfs2_dump_lockstate(sdp);
1779                         t = jiffies;
1780                 }
1781
1782                 down_write(&gfs2_umount_flush_sem);
1783                 invalidate_inodes(sdp->sd_vfs);
1784                 up_write(&gfs2_umount_flush_sem);
1785                 msleep(10);
1786         }
1787 }
1788
1789 /*
1790  *  Diagnostic routines to help debug distributed deadlock
1791  */
1792
1793 static void gfs2_print_symbol(struct glock_iter *gi, const char *fmt,
1794                               unsigned long address)
1795 {
1796         char buffer[KSYM_SYMBOL_LEN];
1797
1798         sprint_symbol(buffer, address);
1799         print_dbg(gi, fmt, buffer);
1800 }
1801
1802 /**
1803  * dump_holder - print information about a glock holder
1804  * @str: a string naming the type of holder
1805  * @gh: the glock holder
1806  *
1807  * Returns: 0 on success, -ENOBUFS when we run out of space
1808  */
1809
1810 static int dump_holder(struct glock_iter *gi, char *str,
1811                        struct gfs2_holder *gh)
1812 {
1813         unsigned int x;
1814         struct task_struct *gh_owner;
1815
1816         print_dbg(gi, "  %s\n", str);
1817         if (gh->gh_owner_pid) {
1818                 print_dbg(gi, "    owner = %ld ", (long)gh->gh_owner_pid);
1819                 gh_owner = find_task_by_pid(gh->gh_owner_pid);
1820                 if (gh_owner)
1821                         print_dbg(gi, "(%s)\n", gh_owner->comm);
1822                 else
1823                         print_dbg(gi, "(ended)\n");
1824         } else
1825                 print_dbg(gi, "    owner = -1\n");
1826         print_dbg(gi, "    gh_state = %u\n", gh->gh_state);
1827         print_dbg(gi, "    gh_flags =");
1828         for (x = 0; x < 32; x++)
1829                 if (gh->gh_flags & (1 << x))
1830                         print_dbg(gi, " %u", x);
1831         print_dbg(gi, " \n");
1832         print_dbg(gi, "    error = %d\n", gh->gh_error);
1833         print_dbg(gi, "    gh_iflags =");
1834         for (x = 0; x < 32; x++)
1835                 if (test_bit(x, &gh->gh_iflags))
1836                         print_dbg(gi, " %u", x);
1837         print_dbg(gi, " \n");
1838         gfs2_print_symbol(gi, "    initialized at: %s\n", gh->gh_ip);
1839
1840         return 0;
1841 }
1842
1843 /**
1844  * dump_inode - print information about an inode
1845  * @ip: the inode
1846  *
1847  * Returns: 0 on success, -ENOBUFS when we run out of space
1848  */
1849
1850 static int dump_inode(struct glock_iter *gi, struct gfs2_inode *ip)
1851 {
1852         unsigned int x;
1853
1854         print_dbg(gi, "  Inode:\n");
1855         print_dbg(gi, "    num = %llu/%llu\n",
1856                   (unsigned long long)ip->i_no_formal_ino,
1857                   (unsigned long long)ip->i_no_addr);
1858         print_dbg(gi, "    type = %u\n", IF2DT(ip->i_inode.i_mode));
1859         print_dbg(gi, "    i_flags =");
1860         for (x = 0; x < 32; x++)
1861                 if (test_bit(x, &ip->i_flags))
1862                         print_dbg(gi, " %u", x);
1863         print_dbg(gi, " \n");
1864         return 0;
1865 }
1866
1867 /**
1868  * dump_glock - print information about a glock
1869  * @gl: the glock
1870  * @count: where we are in the buffer
1871  *
1872  * Returns: 0 on success, -ENOBUFS when we run out of space
1873  */
1874
1875 static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl)
1876 {
1877         struct gfs2_holder *gh;
1878         unsigned int x;
1879         int error = -ENOBUFS;
1880         struct task_struct *gl_owner;
1881
1882         spin_lock(&gl->gl_spin);
1883
1884         print_dbg(gi, "Glock 0x%p (%u, %llu)\n", gl, gl->gl_name.ln_type,
1885                    (unsigned long long)gl->gl_name.ln_number);
1886         print_dbg(gi, "  gl_flags =");
1887         for (x = 0; x < 32; x++) {
1888                 if (test_bit(x, &gl->gl_flags))
1889                         print_dbg(gi, " %u", x);
1890         }
1891         if (!test_bit(GLF_LOCK, &gl->gl_flags))
1892                 print_dbg(gi, " (unlocked)");
1893         print_dbg(gi, " \n");
1894         print_dbg(gi, "  gl_ref = %d\n", atomic_read(&gl->gl_ref));
1895         print_dbg(gi, "  gl_state = %u\n", gl->gl_state);
1896         if (gl->gl_owner_pid) {
1897                 gl_owner = find_task_by_pid(gl->gl_owner_pid);
1898                 if (gl_owner)
1899                         print_dbg(gi, "  gl_owner = pid %d (%s)\n",
1900                                   gl->gl_owner_pid, gl_owner->comm);
1901                 else
1902                         print_dbg(gi, "  gl_owner = %d (ended)\n",
1903                                   gl->gl_owner_pid);
1904         } else
1905                 print_dbg(gi, "  gl_owner = -1\n");
1906         print_dbg(gi, "  gl_ip = %lu\n", gl->gl_ip);
1907         print_dbg(gi, "  req_gh = %s\n", (gl->gl_req_gh) ? "yes" : "no");
1908         print_dbg(gi, "  req_bh = %s\n", (gl->gl_req_bh) ? "yes" : "no");
1909         print_dbg(gi, "  lvb_count = %d\n", atomic_read(&gl->gl_lvb_count));
1910         print_dbg(gi, "  object = %s\n", (gl->gl_object) ? "yes" : "no");
1911         print_dbg(gi, "  le = %s\n",
1912                    (list_empty(&gl->gl_le.le_list)) ? "no" : "yes");
1913         print_dbg(gi, "  reclaim = %s\n",
1914                    (list_empty(&gl->gl_reclaim)) ? "no" : "yes");
1915         if (gl->gl_aspace)
1916                 print_dbg(gi, "  aspace = 0x%p nrpages = %lu\n", gl->gl_aspace,
1917                            gl->gl_aspace->i_mapping->nrpages);
1918         else
1919                 print_dbg(gi, "  aspace = no\n");
1920         print_dbg(gi, "  ail = %d\n", atomic_read(&gl->gl_ail_count));
1921         if (gl->gl_req_gh) {
1922                 error = dump_holder(gi, "Request", gl->gl_req_gh);
1923                 if (error)
1924                         goto out;
1925         }
1926         list_for_each_entry(gh, &gl->gl_holders, gh_list) {
1927                 error = dump_holder(gi, "Holder", gh);
1928                 if (error)
1929                         goto out;
1930         }
1931         list_for_each_entry(gh, &gl->gl_waiters1, gh_list) {
1932                 error = dump_holder(gi, "Waiter1", gh);
1933                 if (error)
1934                         goto out;
1935         }
1936         list_for_each_entry(gh, &gl->gl_waiters3, gh_list) {
1937                 error = dump_holder(gi, "Waiter3", gh);
1938                 if (error)
1939                         goto out;
1940         }
1941         if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
1942                 print_dbg(gi, "  Demotion req to state %u (%llu uS ago)\n",
1943                           gl->gl_demote_state, (unsigned long long)
1944                           (jiffies - gl->gl_demote_time)*(1000000/HZ));
1945         }
1946         if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object) {
1947                 if (!test_bit(GLF_LOCK, &gl->gl_flags) &&
1948                         list_empty(&gl->gl_holders)) {
1949                         error = dump_inode(gi, gl->gl_object);
1950                         if (error)
1951                                 goto out;
1952                 } else {
1953                         error = -ENOBUFS;
1954                         print_dbg(gi, "  Inode: busy\n");
1955                 }
1956         }
1957
1958         error = 0;
1959
1960 out:
1961         spin_unlock(&gl->gl_spin);
1962         return error;
1963 }
1964
1965 /**
1966  * gfs2_dump_lockstate - print out the current lockstate
1967  * @sdp: the filesystem
1968  * @ub: the buffer to copy the information into
1969  *
1970  * If @ub is NULL, dump the lockstate to the console.
1971  *
1972  */
1973
1974 static int gfs2_dump_lockstate(struct gfs2_sbd *sdp)
1975 {
1976         struct gfs2_glock *gl;
1977         struct hlist_node *h;
1978         unsigned int x;
1979         int error = 0;
1980
1981         for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1982
1983                 read_lock(gl_lock_addr(x));
1984
1985                 hlist_for_each_entry(gl, h, &gl_hash_table[x].hb_list, gl_list) {
1986                         if (gl->gl_sbd != sdp)
1987                                 continue;
1988
1989                         error = dump_glock(NULL, gl);
1990                         if (error)
1991                                 break;
1992                 }
1993
1994                 read_unlock(gl_lock_addr(x));
1995
1996                 if (error)
1997                         break;
1998         }
1999
2000
2001         return error;
2002 }
2003
2004 int __init gfs2_glock_init(void)
2005 {
2006         unsigned i;
2007         for(i = 0; i < GFS2_GL_HASH_SIZE; i++) {
2008                 INIT_HLIST_HEAD(&gl_hash_table[i].hb_list);
2009         }
2010 #ifdef GL_HASH_LOCK_SZ
2011         for(i = 0; i < GL_HASH_LOCK_SZ; i++) {
2012                 rwlock_init(&gl_hash_locks[i]);
2013         }
2014 #endif
2015         return 0;
2016 }
2017
2018 static int gfs2_glock_iter_next(struct glock_iter *gi)
2019 {
2020         read_lock(gl_lock_addr(gi->hash));
2021         while (1) {
2022                 if (!gi->hb_list) {  /* If we don't have a hash bucket yet */
2023                         gi->hb_list = &gl_hash_table[gi->hash].hb_list;
2024                         if (hlist_empty(gi->hb_list)) {
2025                                 read_unlock(gl_lock_addr(gi->hash));
2026                                 gi->hash++;
2027                                 read_lock(gl_lock_addr(gi->hash));
2028                                 gi->hb_list = NULL;
2029                                 if (gi->hash >= GFS2_GL_HASH_SIZE) {
2030                                         read_unlock(gl_lock_addr(gi->hash));
2031                                         return 1;
2032                                 }
2033                                 else
2034                                         continue;
2035                         }
2036                         if (!hlist_empty(gi->hb_list)) {
2037                                 gi->gl = list_entry(gi->hb_list->first,
2038                                                     struct gfs2_glock,
2039                                                     gl_list);
2040                         }
2041                 } else {
2042                         if (gi->gl->gl_list.next == NULL) {
2043                                 read_unlock(gl_lock_addr(gi->hash));
2044                                 gi->hash++;
2045                                 read_lock(gl_lock_addr(gi->hash));
2046                                 gi->hb_list = NULL;
2047                                 continue;
2048                         }
2049                         gi->gl = list_entry(gi->gl->gl_list.next,
2050                                             struct gfs2_glock, gl_list);
2051                 }
2052                 if (gi->gl)
2053                         break;
2054         }
2055         read_unlock(gl_lock_addr(gi->hash));
2056         return 0;
2057 }
2058
/**
 * gfs2_glock_iter_free - release a glock iterator
 * @gi: the iterator to free (allocated by gfs2_glock_iter_init())
 */
static void gfs2_glock_iter_free(struct glock_iter *gi)
{
        /* The iterator is a single kmalloc'ed object. */
        kfree(gi);
}
2063
2064 static struct glock_iter *gfs2_glock_iter_init(struct gfs2_sbd *sdp)
2065 {
2066         struct glock_iter *gi;
2067
2068         gi = kmalloc(sizeof (*gi), GFP_KERNEL);
2069         if (!gi)
2070                 return NULL;
2071
2072         gi->sdp = sdp;
2073         gi->hash = 0;
2074         gi->gl = NULL;
2075         gi->hb_list = NULL;
2076         gi->seq = NULL;
2077         memset(gi->string, 0, sizeof(gi->string));
2078
2079         if (gfs2_glock_iter_next(gi)) {
2080                 gfs2_glock_iter_free(gi);
2081                 return NULL;
2082         }
2083
2084         return gi;
2085 }
2086
2087 static void *gfs2_glock_seq_start(struct seq_file *file, loff_t *pos)
2088 {
2089         struct glock_iter *gi;
2090         loff_t n = *pos;
2091
2092         gi = gfs2_glock_iter_init(file->private);
2093         if (!gi)
2094                 return NULL;
2095
2096         while (n--) {
2097                 if (gfs2_glock_iter_next(gi)) {
2098                         gfs2_glock_iter_free(gi);
2099                         return NULL;
2100                 }
2101         }
2102
2103         return gi;
2104 }
2105
2106 static void *gfs2_glock_seq_next(struct seq_file *file, void *iter_ptr,
2107                                  loff_t *pos)
2108 {
2109         struct glock_iter *gi = iter_ptr;
2110
2111         (*pos)++;
2112
2113         if (gfs2_glock_iter_next(gi)) {
2114                 gfs2_glock_iter_free(gi);
2115                 return NULL;
2116         }
2117
2118         return gi;
2119 }
2120
/**
 * gfs2_glock_seq_stop - seq_file ->stop: release the iterator
 * @file: the seq_file (unused)
 * @iter_ptr: the value last returned by ->start or ->next; may be NULL
 *
 * gfs2_glock_seq_start() allocates a new iterator on every call, and
 * both ->start and ->next free it themselves before returning NULL. A
 * non-NULL @iter_ptr therefore means the traversal was cut short (for
 * example because the seq_file buffer filled up) and the iterator is
 * still allocated; free it here so it is not leaked.
 */
static void gfs2_glock_seq_stop(struct seq_file *file, void *iter_ptr)
{
        struct glock_iter *gi = iter_ptr;

        if (gi)
                gfs2_glock_iter_free(gi);
}
2125
2126 static int gfs2_glock_seq_show(struct seq_file *file, void *iter_ptr)
2127 {
2128         struct glock_iter *gi = iter_ptr;
2129
2130         gi->seq = file;
2131         dump_glock(gi, gi->gl);
2132
2133         return 0;
2134 }
2135
2136 static struct seq_operations gfs2_glock_seq_ops = {
2137         .start = gfs2_glock_seq_start,
2138         .next  = gfs2_glock_seq_next,
2139         .stop  = gfs2_glock_seq_stop,
2140         .show  = gfs2_glock_seq_show,
2141 };
2142
2143 static int gfs2_debugfs_open(struct inode *inode, struct file *file)
2144 {
2145         struct seq_file *seq;
2146         int ret;
2147
2148         ret = seq_open(file, &gfs2_glock_seq_ops);
2149         if (ret)
2150                 return ret;
2151
2152         seq = file->private_data;
2153         seq->private = inode->i_private;
2154
2155         return 0;
2156 }
2157
2158 static const struct file_operations gfs2_debug_fops = {
2159         .owner   = THIS_MODULE,
2160         .open    = gfs2_debugfs_open,
2161         .read    = seq_read,
2162         .llseek  = seq_lseek,
2163         .release = seq_release
2164 };
2165
2166 int gfs2_create_debugfs_file(struct gfs2_sbd *sdp)
2167 {
2168         sdp->debugfs_dir = debugfs_create_dir(sdp->sd_table_name, gfs2_root);
2169         if (!sdp->debugfs_dir)
2170                 return -ENOMEM;
2171         sdp->debugfs_dentry_glocks = debugfs_create_file("glocks",
2172                                                          S_IFREG | S_IRUGO,
2173                                                          sdp->debugfs_dir, sdp,
2174                                                          &gfs2_debug_fops);
2175         if (!sdp->debugfs_dentry_glocks)
2176                 return -ENOMEM;
2177
2178         return 0;
2179 }
2180
2181 void gfs2_delete_debugfs_file(struct gfs2_sbd *sdp)
2182 {
2183         if (sdp && sdp->debugfs_dir) {
2184                 if (sdp->debugfs_dentry_glocks) {
2185                         debugfs_remove(sdp->debugfs_dentry_glocks);
2186                         sdp->debugfs_dentry_glocks = NULL;
2187                 }
2188                 debugfs_remove(sdp->debugfs_dir);
2189                 sdp->debugfs_dir = NULL;
2190         }
2191 }
2192
2193 int gfs2_register_debugfs(void)
2194 {
2195         gfs2_root = debugfs_create_dir("gfs2", NULL);
2196         return gfs2_root ? 0 : -ENOMEM;
2197 }
2198
2199 void gfs2_unregister_debugfs(void)
2200 {
2201         debugfs_remove(gfs2_root);
2202         gfs2_root = NULL;
2203 }