3ad8fd36f8dae81431f7e8b7d31e4894028f50c3
[firefly-linux-kernel-4.4.55.git] / fs / gfs2 / glock.c
1 /*
2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
3  * Copyright (C) 2004-2008 Red Hat, Inc.  All rights reserved.
4  *
5  * This copyrighted material is made available to anyone wishing to use,
6  * modify, copy, or redistribute it subject to the terms and conditions
7  * of the GNU General Public License version 2.
8  */
9
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/buffer_head.h>
14 #include <linux/delay.h>
15 #include <linux/sort.h>
16 #include <linux/jhash.h>
17 #include <linux/kallsyms.h>
18 #include <linux/gfs2_ondisk.h>
19 #include <linux/list.h>
20 #include <linux/wait.h>
21 #include <linux/module.h>
22 #include <asm/uaccess.h>
23 #include <linux/seq_file.h>
24 #include <linux/debugfs.h>
25 #include <linux/kthread.h>
26 #include <linux/freezer.h>
27 #include <linux/workqueue.h>
28 #include <linux/jiffies.h>
29 #include <linux/rcupdate.h>
30 #include <linux/rculist_bl.h>
31 #include <linux/bit_spinlock.h>
32 #include <linux/percpu.h>
33
34 #include "gfs2.h"
35 #include "incore.h"
36 #include "glock.h"
37 #include "glops.h"
38 #include "inode.h"
39 #include "lops.h"
40 #include "meta_io.h"
41 #include "quota.h"
42 #include "super.h"
43 #include "util.h"
44 #include "bmap.h"
45 #define CREATE_TRACE_POINTS
46 #include "trace_gfs2.h"
47
48 struct gfs2_glock_iter {
49         int hash;                       /* hash bucket index           */
50         unsigned nhash;                 /* Index within current bucket */
51         struct gfs2_sbd *sdp;           /* incore superblock           */
52         struct gfs2_glock *gl;          /* current glock struct        */
53         loff_t last_pos;                /* last position               */
54 };
55
56 typedef void (*glock_examiner) (struct gfs2_glock * gl);
57
58 static void do_xmote(struct gfs2_glock *gl, struct gfs2_holder *gh, unsigned int target);
59
60 static struct dentry *gfs2_root;
61 static struct workqueue_struct *glock_workqueue;
62 struct workqueue_struct *gfs2_delete_workqueue;
63 static LIST_HEAD(lru_list);
64 static atomic_t lru_count = ATOMIC_INIT(0);
65 static DEFINE_SPINLOCK(lru_lock);
66
67 #define GFS2_GL_HASH_SHIFT      15
68 #define GFS2_GL_HASH_SIZE       (1 << GFS2_GL_HASH_SHIFT)
69 #define GFS2_GL_HASH_MASK       (GFS2_GL_HASH_SIZE - 1)
70
71 static struct hlist_bl_head gl_hash_table[GFS2_GL_HASH_SIZE];
72 static struct dentry *gfs2_root;
73
74 /**
75  * gl_hash() - Turn glock number into hash bucket number
76  * @lock: The glock number
77  *
78  * Returns: The number of the corresponding hash bucket
79  */
80
81 static unsigned int gl_hash(const struct gfs2_sbd *sdp,
82                             const struct lm_lockname *name)
83 {
84         unsigned int h;
85
86         h = jhash(&name->ln_number, sizeof(u64), 0);
87         h = jhash(&name->ln_type, sizeof(unsigned int), h);
88         h = jhash(&sdp, sizeof(struct gfs2_sbd *), h);
89         h &= GFS2_GL_HASH_MASK;
90
91         return h;
92 }
93
94 static inline void spin_lock_bucket(unsigned int hash)
95 {
96         hlist_bl_lock(&gl_hash_table[hash]);
97 }
98
99 static inline void spin_unlock_bucket(unsigned int hash)
100 {
101         hlist_bl_unlock(&gl_hash_table[hash]);
102 }
103
104 static void gfs2_glock_dealloc(struct rcu_head *rcu)
105 {
106         struct gfs2_glock *gl = container_of(rcu, struct gfs2_glock, gl_rcu);
107
108         if (gl->gl_ops->go_flags & GLOF_ASPACE) {
109                 kmem_cache_free(gfs2_glock_aspace_cachep, gl);
110         } else {
111                 kfree(gl->gl_lksb.sb_lvbptr);
112                 kmem_cache_free(gfs2_glock_cachep, gl);
113         }
114 }
115
116 void gfs2_glock_free(struct gfs2_glock *gl)
117 {
118         struct gfs2_sbd *sdp = gl->gl_sbd;
119
120         call_rcu(&gl->gl_rcu, gfs2_glock_dealloc);
121         if (atomic_dec_and_test(&sdp->sd_glock_disposal))
122                 wake_up(&sdp->sd_glock_wait);
123 }
124
125 /**
126  * gfs2_glock_hold() - increment reference count on glock
127  * @gl: The glock to hold
128  *
129  */
130
131 void gfs2_glock_hold(struct gfs2_glock *gl)
132 {
133         GLOCK_BUG_ON(gl, atomic_read(&gl->gl_ref) == 0);
134         atomic_inc(&gl->gl_ref);
135 }
136
137 /**
138  * demote_ok - Check to see if it's ok to unlock a glock
139  * @gl: the glock
140  *
141  * Returns: 1 if it's ok
142  */
143
144 static int demote_ok(const struct gfs2_glock *gl)
145 {
146         const struct gfs2_glock_operations *glops = gl->gl_ops;
147
148         if (gl->gl_state == LM_ST_UNLOCKED)
149                 return 0;
150         if (!list_empty(&gl->gl_holders))
151                 return 0;
152         if (glops->go_demote_ok)
153                 return glops->go_demote_ok(gl);
154         return 1;
155 }
156
157
158 void gfs2_glock_add_to_lru(struct gfs2_glock *gl)
159 {
160         spin_lock(&lru_lock);
161
162         if (!list_empty(&gl->gl_lru))
163                 list_del_init(&gl->gl_lru);
164         else
165                 atomic_inc(&lru_count);
166
167         list_add_tail(&gl->gl_lru, &lru_list);
168         set_bit(GLF_LRU, &gl->gl_flags);
169         spin_unlock(&lru_lock);
170 }
171
172 static void __gfs2_glock_remove_from_lru(struct gfs2_glock *gl)
173 {
174         if (!list_empty(&gl->gl_lru)) {
175                 list_del_init(&gl->gl_lru);
176                 atomic_dec(&lru_count);
177                 clear_bit(GLF_LRU, &gl->gl_flags);
178         }
179 }
180
181 static void gfs2_glock_remove_from_lru(struct gfs2_glock *gl)
182 {
183         spin_lock(&lru_lock);
184         __gfs2_glock_remove_from_lru(gl);
185         spin_unlock(&lru_lock);
186 }
187
188 /**
189  * gfs2_glock_put_nolock() - Decrement reference count on glock
190  * @gl: The glock to put
191  *
192  * This function should only be used if the caller has its own reference
193  * to the glock, in addition to the one it is dropping.
194  */
195
196 void gfs2_glock_put_nolock(struct gfs2_glock *gl)
197 {
198         if (atomic_dec_and_test(&gl->gl_ref))
199                 GLOCK_BUG_ON(gl, 1);
200 }
201
202 /**
203  * gfs2_glock_put() - Decrement reference count on glock
204  * @gl: The glock to put
205  *
206  */
207
208 void gfs2_glock_put(struct gfs2_glock *gl)
209 {
210         struct gfs2_sbd *sdp = gl->gl_sbd;
211         struct address_space *mapping = gfs2_glock2aspace(gl);
212
213         if (atomic_dec_and_lock(&gl->gl_ref, &lru_lock)) {
214                 __gfs2_glock_remove_from_lru(gl);
215                 spin_unlock(&lru_lock);
216                 spin_lock_bucket(gl->gl_hash);
217                 hlist_bl_del_rcu(&gl->gl_list);
218                 spin_unlock_bucket(gl->gl_hash);
219                 GLOCK_BUG_ON(gl, !list_empty(&gl->gl_holders));
220                 GLOCK_BUG_ON(gl, mapping && mapping->nrpages);
221                 trace_gfs2_glock_put(gl);
222                 sdp->sd_lockstruct.ls_ops->lm_put_lock(gl);
223         }
224 }
225
226 /**
227  * search_bucket() - Find struct gfs2_glock by lock number
228  * @bucket: the bucket to search
229  * @name: The lock name
230  *
231  * Returns: NULL, or the struct gfs2_glock with the requested number
232  */
233
234 static struct gfs2_glock *search_bucket(unsigned int hash,
235                                         const struct gfs2_sbd *sdp,
236                                         const struct lm_lockname *name)
237 {
238         struct gfs2_glock *gl;
239         struct hlist_bl_node *h;
240
241         hlist_bl_for_each_entry_rcu(gl, h, &gl_hash_table[hash], gl_list) {
242                 if (!lm_name_equal(&gl->gl_name, name))
243                         continue;
244                 if (gl->gl_sbd != sdp)
245                         continue;
246                 if (atomic_inc_not_zero(&gl->gl_ref))
247                         return gl;
248         }
249
250         return NULL;
251 }
252
253 /**
254  * may_grant - check if its ok to grant a new lock
255  * @gl: The glock
256  * @gh: The lock request which we wish to grant
257  *
258  * Returns: true if its ok to grant the lock
259  */
260
261 static inline int may_grant(const struct gfs2_glock *gl, const struct gfs2_holder *gh)
262 {
263         const struct gfs2_holder *gh_head = list_entry(gl->gl_holders.next, const struct gfs2_holder, gh_list);
264         if ((gh->gh_state == LM_ST_EXCLUSIVE ||
265              gh_head->gh_state == LM_ST_EXCLUSIVE) && gh != gh_head)
266                 return 0;
267         if (gl->gl_state == gh->gh_state)
268                 return 1;
269         if (gh->gh_flags & GL_EXACT)
270                 return 0;
271         if (gl->gl_state == LM_ST_EXCLUSIVE) {
272                 if (gh->gh_state == LM_ST_SHARED && gh_head->gh_state == LM_ST_SHARED)
273                         return 1;
274                 if (gh->gh_state == LM_ST_DEFERRED && gh_head->gh_state == LM_ST_DEFERRED)
275                         return 1;
276         }
277         if (gl->gl_state != LM_ST_UNLOCKED && (gh->gh_flags & LM_FLAG_ANY))
278                 return 1;
279         return 0;
280 }
281
282 static void gfs2_holder_wake(struct gfs2_holder *gh)
283 {
284         clear_bit(HIF_WAIT, &gh->gh_iflags);
285         smp_mb__after_clear_bit();
286         wake_up_bit(&gh->gh_iflags, HIF_WAIT);
287 }
288
289 /**
290  * do_error - Something unexpected has happened during a lock request
291  *
292  */
293
294 static inline void do_error(struct gfs2_glock *gl, const int ret)
295 {
296         struct gfs2_holder *gh, *tmp;
297
298         list_for_each_entry_safe(gh, tmp, &gl->gl_holders, gh_list) {
299                 if (test_bit(HIF_HOLDER, &gh->gh_iflags))
300                         continue;
301                 if (ret & LM_OUT_ERROR)
302                         gh->gh_error = -EIO;
303                 else if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))
304                         gh->gh_error = GLR_TRYFAILED;
305                 else
306                         continue;
307                 list_del_init(&gh->gh_list);
308                 trace_gfs2_glock_queue(gh, 0);
309                 gfs2_holder_wake(gh);
310         }
311 }
312
313 /**
314  * do_promote - promote as many requests as possible on the current queue
315  * @gl: The glock
316  * 
317  * Returns: 1 if there is a blocked holder at the head of the list, or 2
318  *          if a type specific operation is underway.
319  */
320
321 static int do_promote(struct gfs2_glock *gl)
322 __releases(&gl->gl_spin)
323 __acquires(&gl->gl_spin)
324 {
325         const struct gfs2_glock_operations *glops = gl->gl_ops;
326         struct gfs2_holder *gh, *tmp;
327         int ret;
328
329 restart:
330         list_for_each_entry_safe(gh, tmp, &gl->gl_holders, gh_list) {
331                 if (test_bit(HIF_HOLDER, &gh->gh_iflags))
332                         continue;
333                 if (may_grant(gl, gh)) {
334                         if (gh->gh_list.prev == &gl->gl_holders &&
335                             glops->go_lock) {
336                                 spin_unlock(&gl->gl_spin);
337                                 /* FIXME: eliminate this eventually */
338                                 ret = glops->go_lock(gh);
339                                 spin_lock(&gl->gl_spin);
340                                 if (ret) {
341                                         if (ret == 1)
342                                                 return 2;
343                                         gh->gh_error = ret;
344                                         list_del_init(&gh->gh_list);
345                                         trace_gfs2_glock_queue(gh, 0);
346                                         gfs2_holder_wake(gh);
347                                         goto restart;
348                                 }
349                                 set_bit(HIF_HOLDER, &gh->gh_iflags);
350                                 trace_gfs2_promote(gh, 1);
351                                 gfs2_holder_wake(gh);
352                                 goto restart;
353                         }
354                         set_bit(HIF_HOLDER, &gh->gh_iflags);
355                         trace_gfs2_promote(gh, 0);
356                         gfs2_holder_wake(gh);
357                         continue;
358                 }
359                 if (gh->gh_list.prev == &gl->gl_holders)
360                         return 1;
361                 do_error(gl, 0);
362                 break;
363         }
364         return 0;
365 }
366
367 /**
368  * find_first_waiter - find the first gh that's waiting for the glock
369  * @gl: the glock
370  */
371
372 static inline struct gfs2_holder *find_first_waiter(const struct gfs2_glock *gl)
373 {
374         struct gfs2_holder *gh;
375
376         list_for_each_entry(gh, &gl->gl_holders, gh_list) {
377                 if (!test_bit(HIF_HOLDER, &gh->gh_iflags))
378                         return gh;
379         }
380         return NULL;
381 }
382
383 /**
384  * state_change - record that the glock is now in a different state
385  * @gl: the glock
386  * @new_state the new state
387  *
388  */
389
390 static void state_change(struct gfs2_glock *gl, unsigned int new_state)
391 {
392         int held1, held2;
393
394         held1 = (gl->gl_state != LM_ST_UNLOCKED);
395         held2 = (new_state != LM_ST_UNLOCKED);
396
397         if (held1 != held2) {
398                 if (held2)
399                         gfs2_glock_hold(gl);
400                 else
401                         gfs2_glock_put_nolock(gl);
402         }
403         if (held1 && held2 && list_empty(&gl->gl_holders))
404                 clear_bit(GLF_QUEUED, &gl->gl_flags);
405
406         if (new_state != gl->gl_target)
407                 /* shorten our minimum hold time */
408                 gl->gl_hold_time = max(gl->gl_hold_time - GL_GLOCK_HOLD_DECR,
409                                        GL_GLOCK_MIN_HOLD);
410         gl->gl_state = new_state;
411         gl->gl_tchange = jiffies;
412 }
413
414 static void gfs2_demote_wake(struct gfs2_glock *gl)
415 {
416         gl->gl_demote_state = LM_ST_EXCLUSIVE;
417         clear_bit(GLF_DEMOTE, &gl->gl_flags);
418         smp_mb__after_clear_bit();
419         wake_up_bit(&gl->gl_flags, GLF_DEMOTE);
420 }
421
422 /**
423  * finish_xmote - The DLM has replied to one of our lock requests
424  * @gl: The glock
425  * @ret: The status from the DLM
426  *
427  */
428
429 static void finish_xmote(struct gfs2_glock *gl, unsigned int ret)
430 {
431         const struct gfs2_glock_operations *glops = gl->gl_ops;
432         struct gfs2_holder *gh;
433         unsigned state = ret & LM_OUT_ST_MASK;
434         int rv;
435
436         spin_lock(&gl->gl_spin);
437         trace_gfs2_glock_state_change(gl, state);
438         state_change(gl, state);
439         gh = find_first_waiter(gl);
440
441         /* Demote to UN request arrived during demote to SH or DF */
442         if (test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags) &&
443             state != LM_ST_UNLOCKED && gl->gl_demote_state == LM_ST_UNLOCKED)
444                 gl->gl_target = LM_ST_UNLOCKED;
445
446         /* Check for state != intended state */
447         if (unlikely(state != gl->gl_target)) {
448                 if (gh && !test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags)) {
449                         /* move to back of queue and try next entry */
450                         if (ret & LM_OUT_CANCELED) {
451                                 if ((gh->gh_flags & LM_FLAG_PRIORITY) == 0)
452                                         list_move_tail(&gh->gh_list, &gl->gl_holders);
453                                 gh = find_first_waiter(gl);
454                                 gl->gl_target = gh->gh_state;
455                                 goto retry;
456                         }
457                         /* Some error or failed "try lock" - report it */
458                         if ((ret & LM_OUT_ERROR) ||
459                             (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))) {
460                                 gl->gl_target = gl->gl_state;
461                                 do_error(gl, ret);
462                                 goto out;
463                         }
464                 }
465                 switch(state) {
466                 /* Unlocked due to conversion deadlock, try again */
467                 case LM_ST_UNLOCKED:
468 retry:
469                         do_xmote(gl, gh, gl->gl_target);
470                         break;
471                 /* Conversion fails, unlock and try again */
472                 case LM_ST_SHARED:
473                 case LM_ST_DEFERRED:
474                         do_xmote(gl, gh, LM_ST_UNLOCKED);
475                         break;
476                 default: /* Everything else */
477                         printk(KERN_ERR "GFS2: wanted %u got %u\n", gl->gl_target, state);
478                         GLOCK_BUG_ON(gl, 1);
479                 }
480                 spin_unlock(&gl->gl_spin);
481                 return;
482         }
483
484         /* Fast path - we got what we asked for */
485         if (test_and_clear_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags))
486                 gfs2_demote_wake(gl);
487         if (state != LM_ST_UNLOCKED) {
488                 if (glops->go_xmote_bh) {
489                         spin_unlock(&gl->gl_spin);
490                         rv = glops->go_xmote_bh(gl, gh);
491                         spin_lock(&gl->gl_spin);
492                         if (rv) {
493                                 do_error(gl, rv);
494                                 goto out;
495                         }
496                 }
497                 rv = do_promote(gl);
498                 if (rv == 2)
499                         goto out_locked;
500         }
501 out:
502         clear_bit(GLF_LOCK, &gl->gl_flags);
503 out_locked:
504         spin_unlock(&gl->gl_spin);
505 }
506
507 /**
508  * do_xmote - Calls the DLM to change the state of a lock
509  * @gl: The lock state
510  * @gh: The holder (only for promotes)
511  * @target: The target lock state
512  *
513  */
514
515 static void do_xmote(struct gfs2_glock *gl, struct gfs2_holder *gh, unsigned int target)
516 __releases(&gl->gl_spin)
517 __acquires(&gl->gl_spin)
518 {
519         const struct gfs2_glock_operations *glops = gl->gl_ops;
520         struct gfs2_sbd *sdp = gl->gl_sbd;
521         unsigned int lck_flags = gh ? gh->gh_flags : 0;
522         int ret;
523
524         lck_flags &= (LM_FLAG_TRY | LM_FLAG_TRY_1CB | LM_FLAG_NOEXP |
525                       LM_FLAG_PRIORITY);
526         GLOCK_BUG_ON(gl, gl->gl_state == target);
527         GLOCK_BUG_ON(gl, gl->gl_state == gl->gl_target);
528         if ((target == LM_ST_UNLOCKED || target == LM_ST_DEFERRED) &&
529             glops->go_inval) {
530                 set_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags);
531                 do_error(gl, 0); /* Fail queued try locks */
532         }
533         gl->gl_req = target;
534         set_bit(GLF_BLOCKING, &gl->gl_flags);
535         if ((gl->gl_req == LM_ST_UNLOCKED) ||
536             (gl->gl_state == LM_ST_EXCLUSIVE) ||
537             (lck_flags & (LM_FLAG_TRY|LM_FLAG_TRY_1CB)))
538                 clear_bit(GLF_BLOCKING, &gl->gl_flags);
539         spin_unlock(&gl->gl_spin);
540         if (glops->go_sync)
541                 glops->go_sync(gl);
542         if (test_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags))
543                 glops->go_inval(gl, target == LM_ST_DEFERRED ? 0 : DIO_METADATA);
544         clear_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags);
545
546         gfs2_glock_hold(gl);
547         if (sdp->sd_lockstruct.ls_ops->lm_lock) {
548                 /* lock_dlm */
549                 ret = sdp->sd_lockstruct.ls_ops->lm_lock(gl, target, lck_flags);
550                 if (ret) {
551                         printk(KERN_ERR "GFS2: lm_lock ret %d\n", ret);
552                         GLOCK_BUG_ON(gl, 1);
553                 }
554         } else { /* lock_nolock */
555                 finish_xmote(gl, target);
556                 if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
557                         gfs2_glock_put(gl);
558         }
559
560         spin_lock(&gl->gl_spin);
561 }
562
563 /**
564  * find_first_holder - find the first "holder" gh
565  * @gl: the glock
566  */
567
568 static inline struct gfs2_holder *find_first_holder(const struct gfs2_glock *gl)
569 {
570         struct gfs2_holder *gh;
571
572         if (!list_empty(&gl->gl_holders)) {
573                 gh = list_entry(gl->gl_holders.next, struct gfs2_holder, gh_list);
574                 if (test_bit(HIF_HOLDER, &gh->gh_iflags))
575                         return gh;
576         }
577         return NULL;
578 }
579
580 /**
581  * run_queue - do all outstanding tasks related to a glock
582  * @gl: The glock in question
583  * @nonblock: True if we must not block in run_queue
584  *
585  */
586
587 static void run_queue(struct gfs2_glock *gl, const int nonblock)
588 __releases(&gl->gl_spin)
589 __acquires(&gl->gl_spin)
590 {
591         struct gfs2_holder *gh = NULL;
592         int ret;
593
594         if (test_and_set_bit(GLF_LOCK, &gl->gl_flags))
595                 return;
596
597         GLOCK_BUG_ON(gl, test_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags));
598
599         if (test_bit(GLF_DEMOTE, &gl->gl_flags) &&
600             gl->gl_demote_state != gl->gl_state) {
601                 if (find_first_holder(gl))
602                         goto out_unlock;
603                 if (nonblock)
604                         goto out_sched;
605                 set_bit(GLF_DEMOTE_IN_PROGRESS, &gl->gl_flags);
606                 GLOCK_BUG_ON(gl, gl->gl_demote_state == LM_ST_EXCLUSIVE);
607                 gl->gl_target = gl->gl_demote_state;
608         } else {
609                 if (test_bit(GLF_DEMOTE, &gl->gl_flags))
610                         gfs2_demote_wake(gl);
611                 ret = do_promote(gl);
612                 if (ret == 0)
613                         goto out_unlock;
614                 if (ret == 2)
615                         goto out;
616                 gh = find_first_waiter(gl);
617                 gl->gl_target = gh->gh_state;
618                 if (!(gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)))
619                         do_error(gl, 0); /* Fail queued try locks */
620         }
621         do_xmote(gl, gh, gl->gl_target);
622 out:
623         return;
624
625 out_sched:
626         clear_bit(GLF_LOCK, &gl->gl_flags);
627         smp_mb__after_clear_bit();
628         gfs2_glock_hold(gl);
629         if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
630                 gfs2_glock_put_nolock(gl);
631         return;
632
633 out_unlock:
634         clear_bit(GLF_LOCK, &gl->gl_flags);
635         smp_mb__after_clear_bit();
636         return;
637 }
638
639 static void delete_work_func(struct work_struct *work)
640 {
641         struct gfs2_glock *gl = container_of(work, struct gfs2_glock, gl_delete);
642         struct gfs2_sbd *sdp = gl->gl_sbd;
643         struct gfs2_inode *ip;
644         struct inode *inode;
645         u64 no_addr = gl->gl_name.ln_number;
646
647         ip = gl->gl_object;
648         /* Note: Unsafe to dereference ip as we don't hold right refs/locks */
649
650         if (ip)
651                 inode = gfs2_ilookup(sdp->sd_vfs, no_addr, 1);
652         else
653                 inode = gfs2_lookup_by_inum(sdp, no_addr, NULL, GFS2_BLKST_UNLINKED);
654         if (inode && !IS_ERR(inode)) {
655                 d_prune_aliases(inode);
656                 iput(inode);
657         }
658         gfs2_glock_put(gl);
659 }
660
661 static void glock_work_func(struct work_struct *work)
662 {
663         unsigned long delay = 0;
664         struct gfs2_glock *gl = container_of(work, struct gfs2_glock, gl_work.work);
665         int drop_ref = 0;
666
667         if (test_and_clear_bit(GLF_REPLY_PENDING, &gl->gl_flags)) {
668                 finish_xmote(gl, gl->gl_reply);
669                 drop_ref = 1;
670         }
671         spin_lock(&gl->gl_spin);
672         if (test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
673             gl->gl_state != LM_ST_UNLOCKED &&
674             gl->gl_demote_state != LM_ST_EXCLUSIVE) {
675                 unsigned long holdtime, now = jiffies;
676
677                 holdtime = gl->gl_tchange + gl->gl_hold_time;
678                 if (time_before(now, holdtime))
679                         delay = holdtime - now;
680
681                 if (!delay) {
682                         clear_bit(GLF_PENDING_DEMOTE, &gl->gl_flags);
683                         set_bit(GLF_DEMOTE, &gl->gl_flags);
684                 }
685         }
686         run_queue(gl, 0);
687         spin_unlock(&gl->gl_spin);
688         if (!delay)
689                 gfs2_glock_put(gl);
690         else {
691                 if (gl->gl_name.ln_type != LM_TYPE_INODE)
692                         delay = 0;
693                 if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
694                         gfs2_glock_put(gl);
695         }
696         if (drop_ref)
697                 gfs2_glock_put(gl);
698 }
699
700 /**
701  * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
702  * @sdp: The GFS2 superblock
703  * @number: the lock number
704  * @glops: The glock_operations to use
705  * @create: If 0, don't create the glock if it doesn't exist
706  * @glp: the glock is returned here
707  *
708  * This does not lock a glock, just finds/creates structures for one.
709  *
710  * Returns: errno
711  */
712
713 int gfs2_glock_get(struct gfs2_sbd *sdp, u64 number,
714                    const struct gfs2_glock_operations *glops, int create,
715                    struct gfs2_glock **glp)
716 {
717         struct super_block *s = sdp->sd_vfs;
718         struct lm_lockname name = { .ln_number = number, .ln_type = glops->go_type };
719         struct gfs2_glock *gl, *tmp;
720         unsigned int hash = gl_hash(sdp, &name);
721         struct address_space *mapping;
722         struct kmem_cache *cachep;
723
724         rcu_read_lock();
725         gl = search_bucket(hash, sdp, &name);
726         rcu_read_unlock();
727
728         *glp = gl;
729         if (gl)
730                 return 0;
731         if (!create)
732                 return -ENOENT;
733
734         if (glops->go_flags & GLOF_ASPACE)
735                 cachep = gfs2_glock_aspace_cachep;
736         else
737                 cachep = gfs2_glock_cachep;
738         gl = kmem_cache_alloc(cachep, GFP_KERNEL);
739         if (!gl)
740                 return -ENOMEM;
741
742         memset(&gl->gl_lksb, 0, sizeof(struct dlm_lksb));
743
744         if (glops->go_flags & GLOF_LVB) {
745                 gl->gl_lksb.sb_lvbptr = kzalloc(GFS2_MIN_LVB_SIZE, GFP_KERNEL);
746                 if (!gl->gl_lksb.sb_lvbptr) {
747                         kmem_cache_free(cachep, gl);
748                         return -ENOMEM;
749                 }
750         }
751
752         atomic_inc(&sdp->sd_glock_disposal);
753         gl->gl_sbd = sdp;
754         gl->gl_flags = 0;
755         gl->gl_name = name;
756         atomic_set(&gl->gl_ref, 1);
757         gl->gl_state = LM_ST_UNLOCKED;
758         gl->gl_target = LM_ST_UNLOCKED;
759         gl->gl_demote_state = LM_ST_EXCLUSIVE;
760         gl->gl_hash = hash;
761         gl->gl_ops = glops;
762         gl->gl_dstamp = ktime_set(0, 0);
763         preempt_disable();
764         /* We use the global stats to estimate the initial per-glock stats */
765         gl->gl_stats = this_cpu_ptr(sdp->sd_lkstats)->lkstats[glops->go_type];
766         preempt_enable();
767         gl->gl_stats.stats[GFS2_LKS_DCOUNT] = 0;
768         gl->gl_stats.stats[GFS2_LKS_QCOUNT] = 0;
769         gl->gl_tchange = jiffies;
770         gl->gl_object = NULL;
771         gl->gl_hold_time = GL_GLOCK_DFT_HOLD;
772         INIT_DELAYED_WORK(&gl->gl_work, glock_work_func);
773         INIT_WORK(&gl->gl_delete, delete_work_func);
774
775         mapping = gfs2_glock2aspace(gl);
776         if (mapping) {
777                 mapping->a_ops = &gfs2_meta_aops;
778                 mapping->host = s->s_bdev->bd_inode;
779                 mapping->flags = 0;
780                 mapping_set_gfp_mask(mapping, GFP_NOFS);
781                 mapping->private_data = NULL;
782                 mapping->backing_dev_info = s->s_bdi;
783                 mapping->writeback_index = 0;
784         }
785
786         spin_lock_bucket(hash);
787         tmp = search_bucket(hash, sdp, &name);
788         if (tmp) {
789                 spin_unlock_bucket(hash);
790                 kfree(gl->gl_lksb.sb_lvbptr);
791                 kmem_cache_free(cachep, gl);
792                 atomic_dec(&sdp->sd_glock_disposal);
793                 gl = tmp;
794         } else {
795                 hlist_bl_add_head_rcu(&gl->gl_list, &gl_hash_table[hash]);
796                 spin_unlock_bucket(hash);
797         }
798
799         *glp = gl;
800
801         return 0;
802 }
803
804 /**
805  * gfs2_holder_init - initialize a struct gfs2_holder in the default way
806  * @gl: the glock
807  * @state: the state we're requesting
808  * @flags: the modifier flags
809  * @gh: the holder structure
810  *
811  */
812
813 void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
814                       struct gfs2_holder *gh)
815 {
816         INIT_LIST_HEAD(&gh->gh_list);
817         gh->gh_gl = gl;
818         gh->gh_ip = (unsigned long)__builtin_return_address(0);
819         gh->gh_owner_pid = get_pid(task_pid(current));
820         gh->gh_state = state;
821         gh->gh_flags = flags;
822         gh->gh_error = 0;
823         gh->gh_iflags = 0;
824         gfs2_glock_hold(gl);
825 }
826
827 /**
828  * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
829  * @state: the state we're requesting
830  * @flags: the modifier flags
831  * @gh: the holder structure
832  *
833  * Don't mess with the glock.
834  *
835  */
836
837 void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
838 {
839         gh->gh_state = state;
840         gh->gh_flags = flags;
841         gh->gh_iflags = 0;
842         gh->gh_ip = (unsigned long)__builtin_return_address(0);
843         if (gh->gh_owner_pid)
844                 put_pid(gh->gh_owner_pid);
845         gh->gh_owner_pid = get_pid(task_pid(current));
846 }
847
848 /**
849  * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
850  * @gh: the holder structure
851  *
852  */
853
854 void gfs2_holder_uninit(struct gfs2_holder *gh)
855 {
856         put_pid(gh->gh_owner_pid);
857         gfs2_glock_put(gh->gh_gl);
858         gh->gh_gl = NULL;
859         gh->gh_ip = 0;
860 }
861
/**
 * gfs2_glock_holder_wait - sleep callback used while waiting for a holder
 * @word: unused
 *
 * Identical in behaviour to gfs2_glock_demote_wait. Both names show up
 * in the WCHAN field, so they are kept as separate functions in order
 * to be more informative to the user.
 *
 * Returns: always 0
 */

static int gfs2_glock_holder_wait(void *word)
{
	/* Yield the CPU; the waiter is woken by the bit wake-up. */
	schedule();

	return 0;
}
876
/*
 * Sleep callback with the same body as gfs2_glock_holder_wait; it has
 * its own name so that it can be told apart in the WCHAN field.
 * @word is unused. Always returns 0.
 */
static int gfs2_glock_demote_wait(void *word)
{
	schedule();

	return 0;
}
882
883 /**
884  * gfs2_glock_wait - wait on a glock acquisition
885  * @gh: the glock holder
886  *
887  * Returns: 0 on success
888  */
889
890 int gfs2_glock_wait(struct gfs2_holder *gh)
891 {
892         unsigned long time1 = jiffies;
893
894         might_sleep();
895         wait_on_bit(&gh->gh_iflags, HIF_WAIT, gfs2_glock_holder_wait, TASK_UNINTERRUPTIBLE);
896         if (time_after(jiffies, time1 + HZ)) /* have we waited > a second? */
897                 /* Lengthen the minimum hold time. */
898                 gh->gh_gl->gl_hold_time = min(gh->gh_gl->gl_hold_time +
899                                               GL_GLOCK_HOLD_INCR,
900                                               GL_GLOCK_MAX_HOLD);
901         return gh->gh_error;
902 }
903
904 /**
905  * handle_callback - process a demote request
906  * @gl: the glock
907  * @state: the state the caller wants us to change to
908  *
909  * There are only two requests that we are going to see in actual
910  * practise: LM_ST_SHARED and LM_ST_UNLOCKED
911  */
912
913 static void handle_callback(struct gfs2_glock *gl, unsigned int state,
914                             unsigned long delay)
915 {
916         int bit = delay ? GLF_PENDING_DEMOTE : GLF_DEMOTE;
917
918         set_bit(bit, &gl->gl_flags);
919         if (gl->gl_demote_state == LM_ST_EXCLUSIVE) {
920                 gl->gl_demote_state = state;
921                 gl->gl_demote_time = jiffies;
922         } else if (gl->gl_demote_state != LM_ST_UNLOCKED &&
923                         gl->gl_demote_state != state) {
924                 gl->gl_demote_state = LM_ST_UNLOCKED;
925         }
926         if (gl->gl_ops->go_callback)
927                 gl->gl_ops->go_callback(gl);
928         trace_gfs2_demote_rq(gl);
929 }
930
931 void gfs2_print_dbg(struct seq_file *seq, const char *fmt, ...)
932 {
933         struct va_format vaf;
934         va_list args;
935
936         va_start(args, fmt);
937
938         if (seq) {
939                 seq_vprintf(seq, fmt, args);
940         } else {
941                 vaf.fmt = fmt;
942                 vaf.va = &args;
943
944                 printk(KERN_ERR " %pV", &vaf);
945         }
946
947         va_end(args);
948 }
949
950 /**
951  * add_to_queue - Add a holder to the wait queue (but look for recursion)
952  * @gh: the holder structure to add
953  *
954  * Eventually we should move the recursive locking trap to a
955  * debugging option or something like that. This is the fast
956  * path and needs to have the minimum number of distractions.
957  * 
958  */
959
960 static inline void add_to_queue(struct gfs2_holder *gh)
961 __releases(&gl->gl_spin)
962 __acquires(&gl->gl_spin)
963 {
964         struct gfs2_glock *gl = gh->gh_gl;
965         struct gfs2_sbd *sdp = gl->gl_sbd;
966         struct list_head *insert_pt = NULL;
967         struct gfs2_holder *gh2;
968         int try_futile = 0;
969
970         BUG_ON(gh->gh_owner_pid == NULL);
971         if (test_and_set_bit(HIF_WAIT, &gh->gh_iflags))
972                 BUG();
973
974         if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
975                 if (test_bit(GLF_LOCK, &gl->gl_flags))
976                         try_futile = !may_grant(gl, gh);
977                 if (test_bit(GLF_INVALIDATE_IN_PROGRESS, &gl->gl_flags))
978                         goto fail;
979         }
980
981         list_for_each_entry(gh2, &gl->gl_holders, gh_list) {
982                 if (unlikely(gh2->gh_owner_pid == gh->gh_owner_pid &&
983                     (gh->gh_gl->gl_ops->go_type != LM_TYPE_FLOCK)))
984                         goto trap_recursive;
985                 if (try_futile &&
986                     !(gh2->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))) {
987 fail:
988                         gh->gh_error = GLR_TRYFAILED;
989                         gfs2_holder_wake(gh);
990                         return;
991                 }
992                 if (test_bit(HIF_HOLDER, &gh2->gh_iflags))
993                         continue;
994                 if (unlikely((gh->gh_flags & LM_FLAG_PRIORITY) && !insert_pt))
995                         insert_pt = &gh2->gh_list;
996         }
997         set_bit(GLF_QUEUED, &gl->gl_flags);
998         trace_gfs2_glock_queue(gh, 1);
999         gfs2_glstats_inc(gl, GFS2_LKS_QCOUNT);
1000         gfs2_sbstats_inc(gl, GFS2_LKS_QCOUNT);
1001         if (likely(insert_pt == NULL)) {
1002                 list_add_tail(&gh->gh_list, &gl->gl_holders);
1003                 if (unlikely(gh->gh_flags & LM_FLAG_PRIORITY))
1004                         goto do_cancel;
1005                 return;
1006         }
1007         list_add_tail(&gh->gh_list, insert_pt);
1008 do_cancel:
1009         gh = list_entry(gl->gl_holders.next, struct gfs2_holder, gh_list);
1010         if (!(gh->gh_flags & LM_FLAG_PRIORITY)) {
1011                 spin_unlock(&gl->gl_spin);
1012                 if (sdp->sd_lockstruct.ls_ops->lm_cancel)
1013                         sdp->sd_lockstruct.ls_ops->lm_cancel(gl);
1014                 spin_lock(&gl->gl_spin);
1015         }
1016         return;
1017
1018 trap_recursive:
1019         print_symbol(KERN_ERR "original: %s\n", gh2->gh_ip);
1020         printk(KERN_ERR "pid: %d\n", pid_nr(gh2->gh_owner_pid));
1021         printk(KERN_ERR "lock type: %d req lock state : %d\n",
1022                gh2->gh_gl->gl_name.ln_type, gh2->gh_state);
1023         print_symbol(KERN_ERR "new: %s\n", gh->gh_ip);
1024         printk(KERN_ERR "pid: %d\n", pid_nr(gh->gh_owner_pid));
1025         printk(KERN_ERR "lock type: %d req lock state : %d\n",
1026                gh->gh_gl->gl_name.ln_type, gh->gh_state);
1027         gfs2_dump_glock(NULL, gl);
1028         BUG();
1029 }
1030
1031 /**
1032  * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
1033  * @gh: the holder structure
1034  *
1035  * if (gh->gh_flags & GL_ASYNC), this never returns an error
1036  *
1037  * Returns: 0, GLR_TRYFAILED, or errno on failure
1038  */
1039
1040 int gfs2_glock_nq(struct gfs2_holder *gh)
1041 {
1042         struct gfs2_glock *gl = gh->gh_gl;
1043         struct gfs2_sbd *sdp = gl->gl_sbd;
1044         int error = 0;
1045
1046         if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
1047                 return -EIO;
1048
1049         if (test_bit(GLF_LRU, &gl->gl_flags))
1050                 gfs2_glock_remove_from_lru(gl);
1051
1052         spin_lock(&gl->gl_spin);
1053         add_to_queue(gh);
1054         if ((LM_FLAG_NOEXP & gh->gh_flags) &&
1055             test_and_clear_bit(GLF_FROZEN, &gl->gl_flags))
1056                 set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
1057         run_queue(gl, 1);
1058         spin_unlock(&gl->gl_spin);
1059
1060         if (!(gh->gh_flags & GL_ASYNC))
1061                 error = gfs2_glock_wait(gh);
1062
1063         return error;
1064 }
1065
1066 /**
1067  * gfs2_glock_poll - poll to see if an async request has been completed
1068  * @gh: the holder
1069  *
1070  * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
1071  */
1072
1073 int gfs2_glock_poll(struct gfs2_holder *gh)
1074 {
1075         return test_bit(HIF_WAIT, &gh->gh_iflags) ? 0 : 1;
1076 }
1077
1078 /**
1079  * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
1080  * @gh: the glock holder
1081  *
1082  */
1083
1084 void gfs2_glock_dq(struct gfs2_holder *gh)
1085 {
1086         struct gfs2_glock *gl = gh->gh_gl;
1087         const struct gfs2_glock_operations *glops = gl->gl_ops;
1088         unsigned delay = 0;
1089         int fast_path = 0;
1090
1091         spin_lock(&gl->gl_spin);
1092         if (gh->gh_flags & GL_NOCACHE)
1093                 handle_callback(gl, LM_ST_UNLOCKED, 0);
1094
1095         list_del_init(&gh->gh_list);
1096         if (find_first_holder(gl) == NULL) {
1097                 if (glops->go_unlock) {
1098                         GLOCK_BUG_ON(gl, test_and_set_bit(GLF_LOCK, &gl->gl_flags));
1099                         spin_unlock(&gl->gl_spin);
1100                         glops->go_unlock(gh);
1101                         spin_lock(&gl->gl_spin);
1102                         clear_bit(GLF_LOCK, &gl->gl_flags);
1103                 }
1104                 if (list_empty(&gl->gl_holders) &&
1105                     !test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
1106                     !test_bit(GLF_DEMOTE, &gl->gl_flags))
1107                         fast_path = 1;
1108         }
1109         if (!test_bit(GLF_LFLUSH, &gl->gl_flags) && demote_ok(gl))
1110                 gfs2_glock_add_to_lru(gl);
1111
1112         trace_gfs2_glock_queue(gh, 0);
1113         spin_unlock(&gl->gl_spin);
1114         if (likely(fast_path))
1115                 return;
1116
1117         gfs2_glock_hold(gl);
1118         if (test_bit(GLF_PENDING_DEMOTE, &gl->gl_flags) &&
1119             !test_bit(GLF_DEMOTE, &gl->gl_flags) &&
1120             gl->gl_name.ln_type == LM_TYPE_INODE)
1121                 delay = gl->gl_hold_time;
1122         if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
1123                 gfs2_glock_put(gl);
1124 }
1125
1126 void gfs2_glock_dq_wait(struct gfs2_holder *gh)
1127 {
1128         struct gfs2_glock *gl = gh->gh_gl;
1129         gfs2_glock_dq(gh);
1130         might_sleep();
1131         wait_on_bit(&gl->gl_flags, GLF_DEMOTE, gfs2_glock_demote_wait, TASK_UNINTERRUPTIBLE);
1132 }
1133
/**
 * gfs2_glock_dq_uninit - dequeue a holder from a glock and uninitialize it
 * @gh: the holder structure
 *
 * Shorthand for gfs2_glock_dq() followed by gfs2_holder_uninit().
 */

void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
{
	gfs2_glock_dq(gh);
	gfs2_holder_uninit(gh);
}
1145
1146 /**
1147  * gfs2_glock_nq_num - acquire a glock based on lock number
1148  * @sdp: the filesystem
1149  * @number: the lock number
1150  * @glops: the glock operations for the type of glock
1151  * @state: the state to acquire the glock in
1152  * @flags: modifier flags for the acquisition
1153  * @gh: the struct gfs2_holder
1154  *
1155  * Returns: errno
1156  */
1157
1158 int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
1159                       const struct gfs2_glock_operations *glops,
1160                       unsigned int state, int flags, struct gfs2_holder *gh)
1161 {
1162         struct gfs2_glock *gl;
1163         int error;
1164
1165         error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
1166         if (!error) {
1167                 error = gfs2_glock_nq_init(gl, state, flags, gh);
1168                 gfs2_glock_put(gl);
1169         }
1170
1171         return error;
1172 }
1173
1174 /**
1175  * glock_compare - Compare two struct gfs2_glock structures for sorting
1176  * @arg_a: the first structure
1177  * @arg_b: the second structure
1178  *
1179  */
1180
1181 static int glock_compare(const void *arg_a, const void *arg_b)
1182 {
1183         const struct gfs2_holder *gh_a = *(const struct gfs2_holder **)arg_a;
1184         const struct gfs2_holder *gh_b = *(const struct gfs2_holder **)arg_b;
1185         const struct lm_lockname *a = &gh_a->gh_gl->gl_name;
1186         const struct lm_lockname *b = &gh_b->gh_gl->gl_name;
1187
1188         if (a->ln_number > b->ln_number)
1189                 return 1;
1190         if (a->ln_number < b->ln_number)
1191                 return -1;
1192         BUG_ON(gh_a->gh_gl->gl_ops->go_type == gh_b->gh_gl->gl_ops->go_type);
1193         return 0;
1194 }
1195
1196 /**
1197  * nq_m_sync - synchonously acquire more than one glock in deadlock free order
1198  * @num_gh: the number of structures
1199  * @ghs: an array of struct gfs2_holder structures
1200  *
1201  * Returns: 0 on success (all glocks acquired),
1202  *          errno on failure (no glocks acquired)
1203  */
1204
1205 static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
1206                      struct gfs2_holder **p)
1207 {
1208         unsigned int x;
1209         int error = 0;
1210
1211         for (x = 0; x < num_gh; x++)
1212                 p[x] = &ghs[x];
1213
1214         sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);
1215
1216         for (x = 0; x < num_gh; x++) {
1217                 p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1218
1219                 error = gfs2_glock_nq(p[x]);
1220                 if (error) {
1221                         while (x--)
1222                                 gfs2_glock_dq(p[x]);
1223                         break;
1224                 }
1225         }
1226
1227         return error;
1228 }
1229
1230 /**
1231  * gfs2_glock_nq_m - acquire multiple glocks
1232  * @num_gh: the number of structures
1233  * @ghs: an array of struct gfs2_holder structures
1234  *
1235  *
1236  * Returns: 0 on success (all glocks acquired),
1237  *          errno on failure (no glocks acquired)
1238  */
1239
1240 int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1241 {
1242         struct gfs2_holder *tmp[4];
1243         struct gfs2_holder **pph = tmp;
1244         int error = 0;
1245
1246         switch(num_gh) {
1247         case 0:
1248                 return 0;
1249         case 1:
1250                 ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1251                 return gfs2_glock_nq(ghs);
1252         default:
1253                 if (num_gh <= 4)
1254                         break;
1255                 pph = kmalloc(num_gh * sizeof(struct gfs2_holder *), GFP_NOFS);
1256                 if (!pph)
1257                         return -ENOMEM;
1258         }
1259
1260         error = nq_m_sync(num_gh, ghs, pph);
1261
1262         if (pph != tmp)
1263                 kfree(pph);
1264
1265         return error;
1266 }
1267
1268 /**
1269  * gfs2_glock_dq_m - release multiple glocks
1270  * @num_gh: the number of structures
1271  * @ghs: an array of struct gfs2_holder structures
1272  *
1273  */
1274
1275 void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1276 {
1277         while (num_gh--)
1278                 gfs2_glock_dq(&ghs[num_gh]);
1279 }
1280
1281 /**
1282  * gfs2_glock_dq_uninit_m - release multiple glocks
1283  * @num_gh: the number of structures
1284  * @ghs: an array of struct gfs2_holder structures
1285  *
1286  */
1287
1288 void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
1289 {
1290         while (num_gh--)
1291                 gfs2_glock_dq_uninit(&ghs[num_gh]);
1292 }
1293
1294 void gfs2_glock_cb(struct gfs2_glock *gl, unsigned int state)
1295 {
1296         unsigned long delay = 0;
1297         unsigned long holdtime;
1298         unsigned long now = jiffies;
1299
1300         gfs2_glock_hold(gl);
1301         holdtime = gl->gl_tchange + gl->gl_hold_time;
1302         if (test_bit(GLF_QUEUED, &gl->gl_flags) &&
1303             gl->gl_name.ln_type == LM_TYPE_INODE) {
1304                 if (time_before(now, holdtime))
1305                         delay = holdtime - now;
1306                 if (test_bit(GLF_REPLY_PENDING, &gl->gl_flags))
1307                         delay = gl->gl_hold_time;
1308         }
1309
1310         spin_lock(&gl->gl_spin);
1311         handle_callback(gl, state, delay);
1312         spin_unlock(&gl->gl_spin);
1313         if (queue_delayed_work(glock_workqueue, &gl->gl_work, delay) == 0)
1314                 gfs2_glock_put(gl);
1315 }
1316
1317 /**
1318  * gfs2_should_freeze - Figure out if glock should be frozen
1319  * @gl: The glock in question
1320  *
1321  * Glocks are not frozen if (a) the result of the dlm operation is
1322  * an error, (b) the locking operation was an unlock operation or
1323  * (c) if there is a "noexp" flagged request anywhere in the queue
1324  *
1325  * Returns: 1 if freezing should occur, 0 otherwise
1326  */
1327
1328 static int gfs2_should_freeze(const struct gfs2_glock *gl)
1329 {
1330         const struct gfs2_holder *gh;
1331
1332         if (gl->gl_reply & ~LM_OUT_ST_MASK)
1333                 return 0;
1334         if (gl->gl_target == LM_ST_UNLOCKED)
1335                 return 0;
1336
1337         list_for_each_entry(gh, &gl->gl_holders, gh_list) {
1338                 if (test_bit(HIF_HOLDER, &gh->gh_iflags))
1339                         continue;
1340                 if (LM_FLAG_NOEXP & gh->gh_flags)
1341                         return 0;
1342         }
1343
1344         return 1;
1345 }
1346
1347 /**
1348  * gfs2_glock_complete - Callback used by locking
1349  * @gl: Pointer to the glock
1350  * @ret: The return value from the dlm
1351  *
1352  * The gl_reply field is under the gl_spin lock so that it is ok
1353  * to use a bitfield shared with other glock state fields.
1354  */
1355
1356 void gfs2_glock_complete(struct gfs2_glock *gl, int ret)
1357 {
1358         struct lm_lockstruct *ls = &gl->gl_sbd->sd_lockstruct;
1359
1360         spin_lock(&gl->gl_spin);
1361         gl->gl_reply = ret;
1362
1363         if (unlikely(test_bit(DFL_BLOCK_LOCKS, &ls->ls_recover_flags))) {
1364                 if (gfs2_should_freeze(gl)) {
1365                         set_bit(GLF_FROZEN, &gl->gl_flags);
1366                         spin_unlock(&gl->gl_spin);
1367                         return;
1368                 }
1369         }
1370
1371         spin_unlock(&gl->gl_spin);
1372         set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
1373         smp_wmb();
1374         gfs2_glock_hold(gl);
1375         if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1376                 gfs2_glock_put(gl);
1377 }
1378
1379 /**
1380  * gfs2_scan_glock_lru - Scan the LRU looking for locks to demote
1381  * @nr: The number of entries to scan
1382  *
1383  */
1384
1385 static void gfs2_scan_glock_lru(int nr)
1386 {
1387         struct gfs2_glock *gl;
1388         int may_demote;
1389         int nr_skipped = 0;
1390         LIST_HEAD(skipped);
1391
1392         spin_lock(&lru_lock);
1393         while(nr && !list_empty(&lru_list)) {
1394                 gl = list_entry(lru_list.next, struct gfs2_glock, gl_lru);
1395                 list_del_init(&gl->gl_lru);
1396                 clear_bit(GLF_LRU, &gl->gl_flags);
1397                 atomic_dec(&lru_count);
1398
1399                 /* Test for being demotable */
1400                 if (!test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
1401                         gfs2_glock_hold(gl);
1402                         spin_unlock(&lru_lock);
1403                         spin_lock(&gl->gl_spin);
1404                         may_demote = demote_ok(gl);
1405                         if (may_demote) {
1406                                 handle_callback(gl, LM_ST_UNLOCKED, 0);
1407                                 nr--;
1408                         }
1409                         clear_bit(GLF_LOCK, &gl->gl_flags);
1410                         smp_mb__after_clear_bit();
1411                         if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1412                                 gfs2_glock_put_nolock(gl);
1413                         spin_unlock(&gl->gl_spin);
1414                         spin_lock(&lru_lock);
1415                         continue;
1416                 }
1417                 nr_skipped++;
1418                 list_add(&gl->gl_lru, &skipped);
1419                 set_bit(GLF_LRU, &gl->gl_flags);
1420         }
1421         list_splice(&skipped, &lru_list);
1422         atomic_add(nr_skipped, &lru_count);
1423         spin_unlock(&lru_lock);
1424 }
1425
1426 static int gfs2_shrink_glock_memory(struct shrinker *shrink,
1427                                     struct shrink_control *sc)
1428 {
1429         if (sc->nr_to_scan) {
1430                 if (!(sc->gfp_mask & __GFP_FS))
1431                         return -1;
1432                 gfs2_scan_glock_lru(sc->nr_to_scan);
1433         }
1434
1435         return (atomic_read(&lru_count) / 100) * sysctl_vfs_cache_pressure;
1436 }
1437
1438 static struct shrinker glock_shrinker = {
1439         .shrink = gfs2_shrink_glock_memory,
1440         .seeks = DEFAULT_SEEKS,
1441 };
1442
1443 /**
1444  * examine_bucket - Call a function for glock in a hash bucket
1445  * @examiner: the function
1446  * @sdp: the filesystem
1447  * @bucket: the bucket
1448  *
1449  */
1450
1451 static void examine_bucket(glock_examiner examiner, const struct gfs2_sbd *sdp,
1452                           unsigned int hash)
1453 {
1454         struct gfs2_glock *gl;
1455         struct hlist_bl_head *head = &gl_hash_table[hash];
1456         struct hlist_bl_node *pos;
1457
1458         rcu_read_lock();
1459         hlist_bl_for_each_entry_rcu(gl, pos, head, gl_list) {
1460                 if ((gl->gl_sbd == sdp) && atomic_read(&gl->gl_ref))
1461                         examiner(gl);
1462         }
1463         rcu_read_unlock();
1464         cond_resched();
1465 }
1466
1467 static void glock_hash_walk(glock_examiner examiner, const struct gfs2_sbd *sdp)
1468 {
1469         unsigned x;
1470
1471         for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
1472                 examine_bucket(examiner, sdp, x);
1473 }
1474
1475
1476 /**
1477  * thaw_glock - thaw out a glock which has an unprocessed reply waiting
1478  * @gl: The glock to thaw
1479  *
1480  * N.B. When we freeze a glock, we leave a ref to the glock outstanding,
1481  * so this has to result in the ref count being dropped by one.
1482  */
1483
1484 static void thaw_glock(struct gfs2_glock *gl)
1485 {
1486         if (!test_and_clear_bit(GLF_FROZEN, &gl->gl_flags))
1487                 return;
1488         set_bit(GLF_REPLY_PENDING, &gl->gl_flags);
1489         gfs2_glock_hold(gl);
1490         if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1491                 gfs2_glock_put(gl);
1492 }
1493
1494 /**
1495  * clear_glock - look at a glock and see if we can free it from glock cache
1496  * @gl: the glock to look at
1497  *
1498  */
1499
1500 static void clear_glock(struct gfs2_glock *gl)
1501 {
1502         gfs2_glock_remove_from_lru(gl);
1503
1504         spin_lock(&gl->gl_spin);
1505         if (gl->gl_state != LM_ST_UNLOCKED)
1506                 handle_callback(gl, LM_ST_UNLOCKED, 0);
1507         spin_unlock(&gl->gl_spin);
1508         gfs2_glock_hold(gl);
1509         if (queue_delayed_work(glock_workqueue, &gl->gl_work, 0) == 0)
1510                 gfs2_glock_put(gl);
1511 }
1512
1513 /**
1514  * gfs2_glock_thaw - Thaw any frozen glocks
1515  * @sdp: The super block
1516  *
1517  */
1518
1519 void gfs2_glock_thaw(struct gfs2_sbd *sdp)
1520 {
1521         glock_hash_walk(thaw_glock, sdp);
1522 }
1523
1524 static int dump_glock(struct seq_file *seq, struct gfs2_glock *gl)
1525 {
1526         int ret;
1527         spin_lock(&gl->gl_spin);
1528         ret = gfs2_dump_glock(seq, gl);
1529         spin_unlock(&gl->gl_spin);
1530         return ret;
1531 }
1532
1533 static void dump_glock_func(struct gfs2_glock *gl)
1534 {
1535         dump_glock(NULL, gl);
1536 }
1537
1538 /**
1539  * gfs2_gl_hash_clear - Empty out the glock hash table
1540  * @sdp: the filesystem
1541  * @wait: wait until it's all gone
1542  *
1543  * Called when unmounting the filesystem.
1544  */
1545
1546 void gfs2_gl_hash_clear(struct gfs2_sbd *sdp)
1547 {
1548         set_bit(SDF_SKIP_DLM_UNLOCK, &sdp->sd_flags);
1549         glock_hash_walk(clear_glock, sdp);
1550         flush_workqueue(glock_workqueue);
1551         wait_event(sdp->sd_glock_wait, atomic_read(&sdp->sd_glock_disposal) == 0);
1552         glock_hash_walk(dump_glock_func, sdp);
1553 }
1554
1555 void gfs2_glock_finish_truncate(struct gfs2_inode *ip)
1556 {
1557         struct gfs2_glock *gl = ip->i_gl;
1558         int ret;
1559
1560         ret = gfs2_truncatei_resume(ip);
1561         gfs2_assert_withdraw(gl->gl_sbd, ret == 0);
1562
1563         spin_lock(&gl->gl_spin);
1564         clear_bit(GLF_LOCK, &gl->gl_flags);
1565         run_queue(gl, 1);
1566         spin_unlock(&gl->gl_spin);
1567 }
1568
1569 static const char *state2str(unsigned state)
1570 {
1571         switch(state) {
1572         case LM_ST_UNLOCKED:
1573                 return "UN";
1574         case LM_ST_SHARED:
1575                 return "SH";
1576         case LM_ST_DEFERRED:
1577                 return "DF";
1578         case LM_ST_EXCLUSIVE:
1579                 return "EX";
1580         }
1581         return "??";
1582 }
1583
1584 static const char *hflags2str(char *buf, unsigned flags, unsigned long iflags)
1585 {
1586         char *p = buf;
1587         if (flags & LM_FLAG_TRY)
1588                 *p++ = 't';
1589         if (flags & LM_FLAG_TRY_1CB)
1590                 *p++ = 'T';
1591         if (flags & LM_FLAG_NOEXP)
1592                 *p++ = 'e';
1593         if (flags & LM_FLAG_ANY)
1594                 *p++ = 'A';
1595         if (flags & LM_FLAG_PRIORITY)
1596                 *p++ = 'p';
1597         if (flags & GL_ASYNC)
1598                 *p++ = 'a';
1599         if (flags & GL_EXACT)
1600                 *p++ = 'E';
1601         if (flags & GL_NOCACHE)
1602                 *p++ = 'c';
1603         if (test_bit(HIF_HOLDER, &iflags))
1604                 *p++ = 'H';
1605         if (test_bit(HIF_WAIT, &iflags))
1606                 *p++ = 'W';
1607         if (test_bit(HIF_FIRST, &iflags))
1608                 *p++ = 'F';
1609         *p = 0;
1610         return buf;
1611 }
1612
1613 /**
1614  * dump_holder - print information about a glock holder
1615  * @seq: the seq_file struct
1616  * @gh: the glock holder
1617  *
1618  * Returns: 0 on success, -ENOBUFS when we run out of space
1619  */
1620
1621 static int dump_holder(struct seq_file *seq, const struct gfs2_holder *gh)
1622 {
1623         struct task_struct *gh_owner = NULL;
1624         char flags_buf[32];
1625
1626         if (gh->gh_owner_pid)
1627                 gh_owner = pid_task(gh->gh_owner_pid, PIDTYPE_PID);
1628         gfs2_print_dbg(seq, " H: s:%s f:%s e:%d p:%ld [%s] %pS\n",
1629                        state2str(gh->gh_state),
1630                        hflags2str(flags_buf, gh->gh_flags, gh->gh_iflags),
1631                        gh->gh_error,
1632                        gh->gh_owner_pid ? (long)pid_nr(gh->gh_owner_pid) : -1,
1633                        gh_owner ? gh_owner->comm : "(ended)",
1634                        (void *)gh->gh_ip);
1635         return 0;
1636 }
1637
1638 static const char *gflags2str(char *buf, const struct gfs2_glock *gl)
1639 {
1640         const unsigned long *gflags = &gl->gl_flags;
1641         char *p = buf;
1642
1643         if (test_bit(GLF_LOCK, gflags))
1644                 *p++ = 'l';
1645         if (test_bit(GLF_DEMOTE, gflags))
1646                 *p++ = 'D';
1647         if (test_bit(GLF_PENDING_DEMOTE, gflags))
1648                 *p++ = 'd';
1649         if (test_bit(GLF_DEMOTE_IN_PROGRESS, gflags))
1650                 *p++ = 'p';
1651         if (test_bit(GLF_DIRTY, gflags))
1652                 *p++ = 'y';
1653         if (test_bit(GLF_LFLUSH, gflags))
1654                 *p++ = 'f';
1655         if (test_bit(GLF_INVALIDATE_IN_PROGRESS, gflags))
1656                 *p++ = 'i';
1657         if (test_bit(GLF_REPLY_PENDING, gflags))
1658                 *p++ = 'r';
1659         if (test_bit(GLF_INITIAL, gflags))
1660                 *p++ = 'I';
1661         if (test_bit(GLF_FROZEN, gflags))
1662                 *p++ = 'F';
1663         if (test_bit(GLF_QUEUED, gflags))
1664                 *p++ = 'q';
1665         if (test_bit(GLF_LRU, gflags))
1666                 *p++ = 'L';
1667         if (gl->gl_object)
1668                 *p++ = 'o';
1669         if (test_bit(GLF_BLOCKING, gflags))
1670                 *p++ = 'b';
1671         *p = 0;
1672         return buf;
1673 }
1674
1675 /**
1676  * gfs2_dump_glock - print information about a glock
1677  * @seq: The seq_file struct
1678  * @gl: the glock
1679  *
1680  * The file format is as follows:
1681  * One line per object, capital letters are used to indicate objects
1682  * G = glock, I = Inode, R = rgrp, H = holder. Glocks are not indented,
1683  * other objects are indented by a single space and follow the glock to
1684  * which they are related. Fields are indicated by lower case letters
1685  * followed by a colon and the field value, except for strings which are in
1686  * [] so that its possible to see if they are composed of spaces for
1687  * example. The field's are n = number (id of the object), f = flags,
1688  * t = type, s = state, r = refcount, e = error, p = pid.
1689  *
1690  * Returns: 0 on success, -ENOBUFS when we run out of space
1691  */
1692
1693 int gfs2_dump_glock(struct seq_file *seq, const struct gfs2_glock *gl)
1694 {
1695         const struct gfs2_glock_operations *glops = gl->gl_ops;
1696         unsigned long long dtime;
1697         const struct gfs2_holder *gh;
1698         char gflags_buf[32];
1699         int error = 0;
1700
1701         dtime = jiffies - gl->gl_demote_time;
1702         dtime *= 1000000/HZ; /* demote time in uSec */
1703         if (!test_bit(GLF_DEMOTE, &gl->gl_flags))
1704                 dtime = 0;
1705         gfs2_print_dbg(seq, "G:  s:%s n:%u/%llx f:%s t:%s d:%s/%llu a:%d v:%d r:%d m:%ld\n",
1706                   state2str(gl->gl_state),
1707                   gl->gl_name.ln_type,
1708                   (unsigned long long)gl->gl_name.ln_number,
1709                   gflags2str(gflags_buf, gl),
1710                   state2str(gl->gl_target),
1711                   state2str(gl->gl_demote_state), dtime,
1712                   atomic_read(&gl->gl_ail_count),
1713                   atomic_read(&gl->gl_revokes),
1714                   atomic_read(&gl->gl_ref), gl->gl_hold_time);
1715
1716         list_for_each_entry(gh, &gl->gl_holders, gh_list) {
1717                 error = dump_holder(seq, gh);
1718                 if (error)
1719                         goto out;
1720         }
1721         if (gl->gl_state != LM_ST_UNLOCKED && glops->go_dump)
1722                 error = glops->go_dump(seq, gl);
1723 out:
1724         return error;
1725 }
1726
1727 static int gfs2_glstats_seq_show(struct seq_file *seq, void *iter_ptr)
1728 {
1729         struct gfs2_glock *gl = iter_ptr;
1730
1731         seq_printf(seq, "G: n:%u/%llx rtt:%lld/%lld rttb:%lld/%lld irt:%lld/%lld dcnt: %lld qcnt: %lld\n",
1732                    gl->gl_name.ln_type,
1733                    (unsigned long long)gl->gl_name.ln_number,
1734                    (long long)gl->gl_stats.stats[GFS2_LKS_SRTT],
1735                    (long long)gl->gl_stats.stats[GFS2_LKS_SRTTVAR],
1736                    (long long)gl->gl_stats.stats[GFS2_LKS_SRTTB],
1737                    (long long)gl->gl_stats.stats[GFS2_LKS_SRTTVARB],
1738                    (long long)gl->gl_stats.stats[GFS2_LKS_SIRT],
1739                    (long long)gl->gl_stats.stats[GFS2_LKS_SIRTVAR],
1740                    (long long)gl->gl_stats.stats[GFS2_LKS_DCOUNT],
1741                    (long long)gl->gl_stats.stats[GFS2_LKS_QCOUNT]);
1742         return 0;
1743 }
1744
/*
 * Row labels for the sbstats output. Entry 0 labels the header row;
 * entry N (N >= 1) labels the statistics stored at lkstats[N - 1].
 * Both the strings and the pointer table itself are read-only.
 */
static const char * const gfs2_gltype[] = {
	"type",
	"reserved",
	"nondisk",
	"inode",
	"rgrp",
	"meta",
	"iopen",
	"flock",
	"plock",
	"quota",
	"journal",
};
1758
1759 static const char *gfs2_stype[] = {
1760         [GFS2_LKS_SRTT]         = "srtt",
1761         [GFS2_LKS_SRTTVAR]      = "srttvar",
1762         [GFS2_LKS_SRTTB]        = "srttb",
1763         [GFS2_LKS_SRTTVARB]     = "srttvarb",
1764         [GFS2_LKS_SIRT]         = "sirt",
1765         [GFS2_LKS_SIRTVAR]      = "sirtvar",
1766         [GFS2_LKS_DCOUNT]       = "dlm",
1767         [GFS2_LKS_QCOUNT]       = "queue",
1768 };
1769
/* Number of sbstats rows: one per (glock type label, statistic) pair. */
#define GFS2_NR_SBSTATS (ARRAY_SIZE(gfs2_stype) * ARRAY_SIZE(gfs2_gltype))
1771
1772 static int gfs2_sbstats_seq_show(struct seq_file *seq, void *iter_ptr)
1773 {
1774         struct gfs2_glock_iter *gi = seq->private;
1775         struct gfs2_sbd *sdp = gi->sdp;
1776         unsigned index = gi->hash >> 3;
1777         unsigned subindex = gi->hash & 0x07;
1778         s64 value;
1779         int i;
1780
1781         if (index == 0 && subindex != 0)
1782                 return 0;
1783
1784         seq_printf(seq, "%-10s %8s:", gfs2_gltype[index],
1785                    (index == 0) ? "cpu": gfs2_stype[subindex]);
1786
1787         for_each_possible_cpu(i) {
1788                 const struct gfs2_pcpu_lkstats *lkstats = per_cpu_ptr(sdp->sd_lkstats, i);
1789                 if (index == 0) {
1790                         value = i;
1791                 } else {
1792                         value = lkstats->lkstats[index - 1].stats[subindex];
1793                 }
1794                 seq_printf(seq, " %15lld", (long long)value);
1795         }
1796         seq_putc(seq, '\n');
1797         return 0;
1798 }
1799
1800 int __init gfs2_glock_init(void)
1801 {
1802         unsigned i;
1803         for(i = 0; i < GFS2_GL_HASH_SIZE; i++) {
1804                 INIT_HLIST_BL_HEAD(&gl_hash_table[i]);
1805         }
1806
1807         glock_workqueue = alloc_workqueue("glock_workqueue", WQ_MEM_RECLAIM |
1808                                           WQ_HIGHPRI | WQ_FREEZABLE, 0);
1809         if (IS_ERR(glock_workqueue))
1810                 return PTR_ERR(glock_workqueue);
1811         gfs2_delete_workqueue = alloc_workqueue("delete_workqueue",
1812                                                 WQ_MEM_RECLAIM | WQ_FREEZABLE,
1813                                                 0);
1814         if (IS_ERR(gfs2_delete_workqueue)) {
1815                 destroy_workqueue(glock_workqueue);
1816                 return PTR_ERR(gfs2_delete_workqueue);
1817         }
1818
1819         register_shrinker(&glock_shrinker);
1820
1821         return 0;
1822 }
1823
1824 void gfs2_glock_exit(void)
1825 {
1826         unregister_shrinker(&glock_shrinker);
1827         destroy_workqueue(glock_workqueue);
1828         destroy_workqueue(gfs2_delete_workqueue);
1829 }
1830
1831 static inline struct gfs2_glock *glock_hash_chain(unsigned hash)
1832 {
1833         return hlist_bl_entry(hlist_bl_first_rcu(&gl_hash_table[hash]),
1834                               struct gfs2_glock, gl_list);
1835 }
1836
1837 static inline struct gfs2_glock *glock_hash_next(struct gfs2_glock *gl)
1838 {
1839         return hlist_bl_entry(rcu_dereference(gl->gl_list.next),
1840                               struct gfs2_glock, gl_list);
1841 }
1842
1843 static int gfs2_glock_iter_next(struct gfs2_glock_iter *gi)
1844 {
1845         struct gfs2_glock *gl;
1846
1847         do {
1848                 gl = gi->gl;
1849                 if (gl) {
1850                         gi->gl = glock_hash_next(gl);
1851                         gi->nhash++;
1852                 } else {
1853                         if (gi->hash >= GFS2_GL_HASH_SIZE) {
1854                                 rcu_read_unlock();
1855                                 return 1;
1856                         }
1857                         gi->gl = glock_hash_chain(gi->hash);
1858                         gi->nhash = 0;
1859                 }
1860                 while (gi->gl == NULL) {
1861                         gi->hash++;
1862                         if (gi->hash >= GFS2_GL_HASH_SIZE) {
1863                                 rcu_read_unlock();
1864                                 return 1;
1865                         }
1866                         gi->gl = glock_hash_chain(gi->hash);
1867                         gi->nhash = 0;
1868                 }
1869         /* Skip entries for other sb and dead entries */
1870         } while (gi->sdp != gi->gl->gl_sbd || atomic_read(&gi->gl->gl_ref) == 0);
1871
1872         return 0;
1873 }
1874
1875 static void *gfs2_glock_seq_start(struct seq_file *seq, loff_t *pos)
1876 {
1877         struct gfs2_glock_iter *gi = seq->private;
1878         loff_t n = *pos;
1879
1880         if (gi->last_pos <= *pos)
1881                 n = gi->nhash + (*pos - gi->last_pos);
1882         else
1883                 gi->hash = 0;
1884
1885         gi->nhash = 0;
1886         rcu_read_lock();
1887
1888         do {
1889                 if (gfs2_glock_iter_next(gi))
1890                         return NULL;
1891         } while (n--);
1892
1893         gi->last_pos = *pos;
1894         return gi->gl;
1895 }
1896
1897 static void *gfs2_glock_seq_next(struct seq_file *seq, void *iter_ptr,
1898                                  loff_t *pos)
1899 {
1900         struct gfs2_glock_iter *gi = seq->private;
1901
1902         (*pos)++;
1903         gi->last_pos = *pos;
1904         if (gfs2_glock_iter_next(gi))
1905                 return NULL;
1906
1907         return gi->gl;
1908 }
1909
1910 static void gfs2_glock_seq_stop(struct seq_file *seq, void *iter_ptr)
1911 {
1912         struct gfs2_glock_iter *gi = seq->private;
1913
1914         if (gi->gl)
1915                 rcu_read_unlock();
1916         gi->gl = NULL;
1917 }
1918
/**
 * gfs2_glock_seq_show - seq_file ->show for the glocks file
 * @seq: the seq_file to print into
 * @iter_ptr: the glock handed back by ->start/->next
 *
 * Returns: whatever dump_glock() returns
 */
static int gfs2_glock_seq_show(struct seq_file *seq, void *iter_ptr)
{
	struct gfs2_glock *gl = iter_ptr;

	return dump_glock(seq, gl);
}
1923
1924 static void *gfs2_sbstats_seq_start(struct seq_file *seq, loff_t *pos)
1925 {
1926         struct gfs2_glock_iter *gi = seq->private;
1927
1928         gi->hash = *pos;
1929         if (*pos >= GFS2_NR_SBSTATS)
1930                 return NULL;
1931         preempt_disable();
1932         return SEQ_START_TOKEN;
1933 }
1934
1935 static void *gfs2_sbstats_seq_next(struct seq_file *seq, void *iter_ptr,
1936                                    loff_t *pos)
1937 {
1938         struct gfs2_glock_iter *gi = seq->private;
1939         (*pos)++;
1940         gi->hash++;
1941         if (gi->hash >= GFS2_NR_SBSTATS) {
1942                 preempt_enable();
1943                 return NULL;
1944         }
1945         return SEQ_START_TOKEN;
1946 }
1947
/**
 * gfs2_sbstats_seq_stop - seq_file ->stop for the sbstats file
 * @seq: unused
 * @iter_ptr: unused
 *
 * Re-enables preemption; the counterpart of the preempt_disable() in
 * gfs2_sbstats_seq_start().
 */
static void gfs2_sbstats_seq_stop(struct seq_file *seq, void *iter_ptr)
{
	preempt_enable();
}
1952
1953 static const struct seq_operations gfs2_glock_seq_ops = {
1954         .start = gfs2_glock_seq_start,
1955         .next  = gfs2_glock_seq_next,
1956         .stop  = gfs2_glock_seq_stop,
1957         .show  = gfs2_glock_seq_show,
1958 };
1959
1960 static const struct seq_operations gfs2_glstats_seq_ops = {
1961         .start = gfs2_glock_seq_start,
1962         .next  = gfs2_glock_seq_next,
1963         .stop  = gfs2_glock_seq_stop,
1964         .show  = gfs2_glstats_seq_show,
1965 };
1966
1967 static const struct seq_operations gfs2_sbstats_seq_ops = {
1968         .start = gfs2_sbstats_seq_start,
1969         .next  = gfs2_sbstats_seq_next,
1970         .stop  = gfs2_sbstats_seq_stop,
1971         .show  = gfs2_sbstats_seq_show,
1972 };
1973
/*
 * Size used when pre-allocating seq_file buffers below: the smaller of
 * PAGE_SIZE << PAGE_ALLOC_COSTLY_ORDER and 64 KiB.
 */
#define GFS2_SEQ_GOODSIZE (min(PAGE_SIZE << PAGE_ALLOC_COSTLY_ORDER, 65536UL))
1975
1976 static int gfs2_glocks_open(struct inode *inode, struct file *file)
1977 {
1978         int ret = seq_open_private(file, &gfs2_glock_seq_ops,
1979                                    sizeof(struct gfs2_glock_iter));
1980         if (ret == 0) {
1981                 struct seq_file *seq = file->private_data;
1982                 struct gfs2_glock_iter *gi = seq->private;
1983                 gi->sdp = inode->i_private;
1984                 seq->buf = kmalloc(GFS2_SEQ_GOODSIZE, GFP_KERNEL | __GFP_NOWARN);
1985                 if (seq->buf)
1986                         seq->size = GFS2_SEQ_GOODSIZE;
1987         }
1988         return ret;
1989 }
1990
1991 static int gfs2_glstats_open(struct inode *inode, struct file *file)
1992 {
1993         int ret = seq_open_private(file, &gfs2_glstats_seq_ops,
1994                                    sizeof(struct gfs2_glock_iter));
1995         if (ret == 0) {
1996                 struct seq_file *seq = file->private_data;
1997                 struct gfs2_glock_iter *gi = seq->private;
1998                 gi->sdp = inode->i_private;
1999                 seq->buf = kmalloc(GFS2_SEQ_GOODSIZE, GFP_KERNEL | __GFP_NOWARN);
2000                 if (seq->buf)
2001                         seq->size = GFS2_SEQ_GOODSIZE;
2002         }
2003         return ret;
2004 }
2005
2006 static int gfs2_sbstats_open(struct inode *inode, struct file *file)
2007 {
2008         int ret = seq_open_private(file, &gfs2_sbstats_seq_ops,
2009                                    sizeof(struct gfs2_glock_iter));
2010         if (ret == 0) {
2011                 struct seq_file *seq = file->private_data;
2012                 struct gfs2_glock_iter *gi = seq->private;
2013                 gi->sdp = inode->i_private;
2014         }
2015         return ret;
2016 }
2017
2018 static const struct file_operations gfs2_glocks_fops = {
2019         .owner   = THIS_MODULE,
2020         .open    = gfs2_glocks_open,
2021         .read    = seq_read,
2022         .llseek  = seq_lseek,
2023         .release = seq_release_private,
2024 };
2025
2026 static const struct file_operations gfs2_glstats_fops = {
2027         .owner   = THIS_MODULE,
2028         .open    = gfs2_glstats_open,
2029         .read    = seq_read,
2030         .llseek  = seq_lseek,
2031         .release = seq_release_private,
2032 };
2033
2034 static const struct file_operations gfs2_sbstats_fops = {
2035         .owner   = THIS_MODULE,
2036         .open    = gfs2_sbstats_open,
2037         .read    = seq_read,
2038         .llseek  = seq_lseek,
2039         .release = seq_release_private,
2040 };
2041
2042 int gfs2_create_debugfs_file(struct gfs2_sbd *sdp)
2043 {
2044         sdp->debugfs_dir = debugfs_create_dir(sdp->sd_table_name, gfs2_root);
2045         if (!sdp->debugfs_dir)
2046                 return -ENOMEM;
2047         sdp->debugfs_dentry_glocks = debugfs_create_file("glocks",
2048                                                          S_IFREG | S_IRUGO,
2049                                                          sdp->debugfs_dir, sdp,
2050                                                          &gfs2_glocks_fops);
2051         if (!sdp->debugfs_dentry_glocks)
2052                 goto fail;
2053
2054         sdp->debugfs_dentry_glstats = debugfs_create_file("glstats",
2055                                                         S_IFREG | S_IRUGO,
2056                                                         sdp->debugfs_dir, sdp,
2057                                                         &gfs2_glstats_fops);
2058         if (!sdp->debugfs_dentry_glstats)
2059                 goto fail;
2060
2061         sdp->debugfs_dentry_sbstats = debugfs_create_file("sbstats",
2062                                                         S_IFREG | S_IRUGO,
2063                                                         sdp->debugfs_dir, sdp,
2064                                                         &gfs2_sbstats_fops);
2065         if (!sdp->debugfs_dentry_sbstats)
2066                 goto fail;
2067
2068         return 0;
2069 fail:
2070         gfs2_delete_debugfs_file(sdp);
2071         return -ENOMEM;
2072 }
2073
2074 void gfs2_delete_debugfs_file(struct gfs2_sbd *sdp)
2075 {
2076         if (sdp->debugfs_dir) {
2077                 if (sdp->debugfs_dentry_glocks) {
2078                         debugfs_remove(sdp->debugfs_dentry_glocks);
2079                         sdp->debugfs_dentry_glocks = NULL;
2080                 }
2081                 if (sdp->debugfs_dentry_glstats) {
2082                         debugfs_remove(sdp->debugfs_dentry_glstats);
2083                         sdp->debugfs_dentry_glstats = NULL;
2084                 }
2085                 if (sdp->debugfs_dentry_sbstats) {
2086                         debugfs_remove(sdp->debugfs_dentry_sbstats);
2087                         sdp->debugfs_dentry_sbstats = NULL;
2088                 }
2089                 debugfs_remove(sdp->debugfs_dir);
2090                 sdp->debugfs_dir = NULL;
2091         }
2092 }
2093
2094 int gfs2_register_debugfs(void)
2095 {
2096         gfs2_root = debugfs_create_dir("gfs2", NULL);
2097         return gfs2_root ? 0 : -ENOMEM;
2098 }
2099
2100 void gfs2_unregister_debugfs(void)
2101 {
2102         debugfs_remove(gfs2_root);
2103         gfs2_root = NULL;
2104 }