xref: /openbmc/linux/fs/gfs2/glock.c (revision 64c70b1c)
1 /*
2  * Copyright (C) Sistina Software, Inc.  1997-2003 All rights reserved.
3  * Copyright (C) 2004-2006 Red Hat, Inc.  All rights reserved.
4  *
5  * This copyrighted material is made available to anyone wishing to use,
6  * modify, copy, or redistribute it subject to the terms and conditions
7  * of the GNU General Public License version 2.
8  */
9 
10 #include <linux/sched.h>
11 #include <linux/slab.h>
12 #include <linux/spinlock.h>
13 #include <linux/completion.h>
14 #include <linux/buffer_head.h>
15 #include <linux/delay.h>
16 #include <linux/sort.h>
17 #include <linux/jhash.h>
18 #include <linux/kallsyms.h>
19 #include <linux/gfs2_ondisk.h>
20 #include <linux/list.h>
21 #include <linux/lm_interface.h>
22 #include <linux/wait.h>
23 #include <linux/module.h>
24 #include <linux/rwsem.h>
25 #include <asm/uaccess.h>
26 #include <linux/seq_file.h>
27 #include <linux/debugfs.h>
28 #include <linux/module.h>
29 #include <linux/kallsyms.h>
30 
31 #include "gfs2.h"
32 #include "incore.h"
33 #include "glock.h"
34 #include "glops.h"
35 #include "inode.h"
36 #include "lm.h"
37 #include "lops.h"
38 #include "meta_io.h"
39 #include "quota.h"
40 #include "super.h"
41 #include "util.h"
42 
43 struct gfs2_gl_hash_bucket {
44         struct hlist_head hb_list;
45 };
46 
47 struct glock_iter {
48 	int hash;                     /* hash bucket index         */
49 	struct gfs2_sbd *sdp;         /* incore superblock         */
50 	struct gfs2_glock *gl;        /* current glock struct      */
51 	struct hlist_head *hb_list;   /* current hash bucket ptr   */
52 	struct seq_file *seq;         /* sequence file for debugfs */
53 	char string[512];             /* scratch space             */
54 };
55 
56 typedef void (*glock_examiner) (struct gfs2_glock * gl);
57 
58 static int gfs2_dump_lockstate(struct gfs2_sbd *sdp);
59 static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl);
60 static void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh);
61 static void gfs2_glock_drop_th(struct gfs2_glock *gl);
62 static DECLARE_RWSEM(gfs2_umount_flush_sem);
63 static struct dentry *gfs2_root;
64 
65 #define GFS2_GL_HASH_SHIFT      15
66 #define GFS2_GL_HASH_SIZE       (1 << GFS2_GL_HASH_SHIFT)
67 #define GFS2_GL_HASH_MASK       (GFS2_GL_HASH_SIZE - 1)
68 
69 static struct gfs2_gl_hash_bucket gl_hash_table[GFS2_GL_HASH_SIZE];
70 static struct dentry *gfs2_root;
71 
72 /*
73  * Despite what you might think, the numbers below are not arbitrary :-)
74  * They are taken from the ipv4 routing hash code, which is well tested
75  * and thus should be nearly optimal. Later on we might tweek the numbers
76  * but for now this should be fine.
77  *
78  * The reason for putting the locks in a separate array from the list heads
79  * is that we can have fewer locks than list heads and save memory. We use
80  * the same hash function for both, but with a different hash mask.
81  */
82 #if defined(CONFIG_SMP) || defined(CONFIG_DEBUG_SPINLOCK) || \
83 	defined(CONFIG_PROVE_LOCKING)
84 
85 #ifdef CONFIG_LOCKDEP
86 # define GL_HASH_LOCK_SZ        256
87 #else
88 # if NR_CPUS >= 32
89 #  define GL_HASH_LOCK_SZ       4096
90 # elif NR_CPUS >= 16
91 #  define GL_HASH_LOCK_SZ       2048
92 # elif NR_CPUS >= 8
93 #  define GL_HASH_LOCK_SZ       1024
94 # elif NR_CPUS >= 4
95 #  define GL_HASH_LOCK_SZ       512
96 # else
97 #  define GL_HASH_LOCK_SZ       256
98 # endif
99 #endif
100 
101 /* We never want more locks than chains */
102 #if GFS2_GL_HASH_SIZE < GL_HASH_LOCK_SZ
103 # undef GL_HASH_LOCK_SZ
104 # define GL_HASH_LOCK_SZ GFS2_GL_HASH_SIZE
105 #endif
106 
107 static rwlock_t gl_hash_locks[GL_HASH_LOCK_SZ];
108 
109 static inline rwlock_t *gl_lock_addr(unsigned int x)
110 {
111 	return &gl_hash_locks[x & (GL_HASH_LOCK_SZ-1)];
112 }
113 #else /* not SMP, so no spinlocks required */
114 static inline rwlock_t *gl_lock_addr(unsigned int x)
115 {
116 	return NULL;
117 }
118 #endif
119 
120 /**
121  * relaxed_state_ok - is a requested lock compatible with the current lock mode?
122  * @actual: the current state of the lock
123  * @requested: the lock state that was requested by the caller
124  * @flags: the modifier flags passed in by the caller
125  *
126  * Returns: 1 if the locks are compatible, 0 otherwise
127  */
128 
129 static inline int relaxed_state_ok(unsigned int actual, unsigned requested,
130 				   int flags)
131 {
132 	if (actual == requested)
133 		return 1;
134 
135 	if (flags & GL_EXACT)
136 		return 0;
137 
138 	if (actual == LM_ST_EXCLUSIVE && requested == LM_ST_SHARED)
139 		return 1;
140 
141 	if (actual != LM_ST_UNLOCKED && (flags & LM_FLAG_ANY))
142 		return 1;
143 
144 	return 0;
145 }
146 
147 /**
148  * gl_hash() - Turn glock number into hash bucket number
149  * @lock: The glock number
150  *
151  * Returns: The number of the corresponding hash bucket
152  */
153 
154 static unsigned int gl_hash(const struct gfs2_sbd *sdp,
155 			    const struct lm_lockname *name)
156 {
157 	unsigned int h;
158 
159 	h = jhash(&name->ln_number, sizeof(u64), 0);
160 	h = jhash(&name->ln_type, sizeof(unsigned int), h);
161 	h = jhash(&sdp, sizeof(struct gfs2_sbd *), h);
162 	h &= GFS2_GL_HASH_MASK;
163 
164 	return h;
165 }
166 
167 /**
168  * glock_free() - Perform a few checks and then release struct gfs2_glock
169  * @gl: The glock to release
170  *
171  * Also calls lock module to release its internal structure for this glock.
172  *
173  */
174 
175 static void glock_free(struct gfs2_glock *gl)
176 {
177 	struct gfs2_sbd *sdp = gl->gl_sbd;
178 	struct inode *aspace = gl->gl_aspace;
179 
180 	gfs2_lm_put_lock(sdp, gl->gl_lock);
181 
182 	if (aspace)
183 		gfs2_aspace_put(aspace);
184 
185 	kmem_cache_free(gfs2_glock_cachep, gl);
186 }
187 
188 /**
189  * gfs2_glock_hold() - increment reference count on glock
190  * @gl: The glock to hold
191  *
192  */
193 
194 void gfs2_glock_hold(struct gfs2_glock *gl)
195 {
196 	atomic_inc(&gl->gl_ref);
197 }
198 
199 /**
200  * gfs2_glock_put() - Decrement reference count on glock
201  * @gl: The glock to put
202  *
203  */
204 
205 int gfs2_glock_put(struct gfs2_glock *gl)
206 {
207 	int rv = 0;
208 	struct gfs2_sbd *sdp = gl->gl_sbd;
209 
210 	write_lock(gl_lock_addr(gl->gl_hash));
211 	if (atomic_dec_and_test(&gl->gl_ref)) {
212 		hlist_del(&gl->gl_list);
213 		write_unlock(gl_lock_addr(gl->gl_hash));
214 		BUG_ON(spin_is_locked(&gl->gl_spin));
215 		gfs2_assert(sdp, gl->gl_state == LM_ST_UNLOCKED);
216 		gfs2_assert(sdp, list_empty(&gl->gl_reclaim));
217 		gfs2_assert(sdp, list_empty(&gl->gl_holders));
218 		gfs2_assert(sdp, list_empty(&gl->gl_waiters1));
219 		gfs2_assert(sdp, list_empty(&gl->gl_waiters3));
220 		glock_free(gl);
221 		rv = 1;
222 		goto out;
223 	}
224 	write_unlock(gl_lock_addr(gl->gl_hash));
225 out:
226 	return rv;
227 }
228 
229 /**
230  * search_bucket() - Find struct gfs2_glock by lock number
231  * @bucket: the bucket to search
232  * @name: The lock name
233  *
234  * Returns: NULL, or the struct gfs2_glock with the requested number
235  */
236 
237 static struct gfs2_glock *search_bucket(unsigned int hash,
238 					const struct gfs2_sbd *sdp,
239 					const struct lm_lockname *name)
240 {
241 	struct gfs2_glock *gl;
242 	struct hlist_node *h;
243 
244 	hlist_for_each_entry(gl, h, &gl_hash_table[hash].hb_list, gl_list) {
245 		if (!lm_name_equal(&gl->gl_name, name))
246 			continue;
247 		if (gl->gl_sbd != sdp)
248 			continue;
249 
250 		atomic_inc(&gl->gl_ref);
251 
252 		return gl;
253 	}
254 
255 	return NULL;
256 }
257 
258 /**
259  * gfs2_glock_find() - Find glock by lock number
260  * @sdp: The GFS2 superblock
261  * @name: The lock name
262  *
263  * Returns: NULL, or the struct gfs2_glock with the requested number
264  */
265 
266 static struct gfs2_glock *gfs2_glock_find(const struct gfs2_sbd *sdp,
267 					  const struct lm_lockname *name)
268 {
269 	unsigned int hash = gl_hash(sdp, name);
270 	struct gfs2_glock *gl;
271 
272 	read_lock(gl_lock_addr(hash));
273 	gl = search_bucket(hash, sdp, name);
274 	read_unlock(gl_lock_addr(hash));
275 
276 	return gl;
277 }
278 
279 /**
280  * gfs2_glock_get() - Get a glock, or create one if one doesn't exist
281  * @sdp: The GFS2 superblock
282  * @number: the lock number
283  * @glops: The glock_operations to use
284  * @create: If 0, don't create the glock if it doesn't exist
285  * @glp: the glock is returned here
286  *
287  * This does not lock a glock, just finds/creates structures for one.
288  *
289  * Returns: errno
290  */
291 
292 int gfs2_glock_get(struct gfs2_sbd *sdp, u64 number,
293 		   const struct gfs2_glock_operations *glops, int create,
294 		   struct gfs2_glock **glp)
295 {
296 	struct lm_lockname name = { .ln_number = number, .ln_type = glops->go_type };
297 	struct gfs2_glock *gl, *tmp;
298 	unsigned int hash = gl_hash(sdp, &name);
299 	int error;
300 
301 	read_lock(gl_lock_addr(hash));
302 	gl = search_bucket(hash, sdp, &name);
303 	read_unlock(gl_lock_addr(hash));
304 
305 	if (gl || !create) {
306 		*glp = gl;
307 		return 0;
308 	}
309 
310 	gl = kmem_cache_alloc(gfs2_glock_cachep, GFP_KERNEL);
311 	if (!gl)
312 		return -ENOMEM;
313 
314 	gl->gl_flags = 0;
315 	gl->gl_name = name;
316 	atomic_set(&gl->gl_ref, 1);
317 	gl->gl_state = LM_ST_UNLOCKED;
318 	gl->gl_hash = hash;
319 	gl->gl_owner_pid = 0;
320 	gl->gl_ip = 0;
321 	gl->gl_ops = glops;
322 	gl->gl_req_gh = NULL;
323 	gl->gl_req_bh = NULL;
324 	gl->gl_vn = 0;
325 	gl->gl_stamp = jiffies;
326 	gl->gl_object = NULL;
327 	gl->gl_sbd = sdp;
328 	gl->gl_aspace = NULL;
329 	lops_init_le(&gl->gl_le, &gfs2_glock_lops);
330 
331 	/* If this glock protects actual on-disk data or metadata blocks,
332 	   create a VFS inode to manage the pages/buffers holding them. */
333 	if (glops == &gfs2_inode_glops || glops == &gfs2_rgrp_glops) {
334 		gl->gl_aspace = gfs2_aspace_get(sdp);
335 		if (!gl->gl_aspace) {
336 			error = -ENOMEM;
337 			goto fail;
338 		}
339 	}
340 
341 	error = gfs2_lm_get_lock(sdp, &name, &gl->gl_lock);
342 	if (error)
343 		goto fail_aspace;
344 
345 	write_lock(gl_lock_addr(hash));
346 	tmp = search_bucket(hash, sdp, &name);
347 	if (tmp) {
348 		write_unlock(gl_lock_addr(hash));
349 		glock_free(gl);
350 		gl = tmp;
351 	} else {
352 		hlist_add_head(&gl->gl_list, &gl_hash_table[hash].hb_list);
353 		write_unlock(gl_lock_addr(hash));
354 	}
355 
356 	*glp = gl;
357 
358 	return 0;
359 
360 fail_aspace:
361 	if (gl->gl_aspace)
362 		gfs2_aspace_put(gl->gl_aspace);
363 fail:
364 	kmem_cache_free(gfs2_glock_cachep, gl);
365 	return error;
366 }
367 
368 /**
369  * gfs2_holder_init - initialize a struct gfs2_holder in the default way
370  * @gl: the glock
371  * @state: the state we're requesting
372  * @flags: the modifier flags
373  * @gh: the holder structure
374  *
375  */
376 
377 void gfs2_holder_init(struct gfs2_glock *gl, unsigned int state, unsigned flags,
378 		      struct gfs2_holder *gh)
379 {
380 	INIT_LIST_HEAD(&gh->gh_list);
381 	gh->gh_gl = gl;
382 	gh->gh_ip = (unsigned long)__builtin_return_address(0);
383 	gh->gh_owner_pid = current->pid;
384 	gh->gh_state = state;
385 	gh->gh_flags = flags;
386 	gh->gh_error = 0;
387 	gh->gh_iflags = 0;
388 	gfs2_glock_hold(gl);
389 }
390 
391 /**
392  * gfs2_holder_reinit - reinitialize a struct gfs2_holder so we can requeue it
393  * @state: the state we're requesting
394  * @flags: the modifier flags
395  * @gh: the holder structure
396  *
397  * Don't mess with the glock.
398  *
399  */
400 
401 void gfs2_holder_reinit(unsigned int state, unsigned flags, struct gfs2_holder *gh)
402 {
403 	gh->gh_state = state;
404 	gh->gh_flags = flags;
405 	gh->gh_iflags = 0;
406 	gh->gh_ip = (unsigned long)__builtin_return_address(0);
407 }
408 
409 /**
410  * gfs2_holder_uninit - uninitialize a holder structure (drop glock reference)
411  * @gh: the holder structure
412  *
413  */
414 
415 void gfs2_holder_uninit(struct gfs2_holder *gh)
416 {
417 	gfs2_glock_put(gh->gh_gl);
418 	gh->gh_gl = NULL;
419 	gh->gh_ip = 0;
420 }
421 
422 static void gfs2_holder_wake(struct gfs2_holder *gh)
423 {
424 	clear_bit(HIF_WAIT, &gh->gh_iflags);
425 	smp_mb__after_clear_bit();
426 	wake_up_bit(&gh->gh_iflags, HIF_WAIT);
427 }
428 
429 static int just_schedule(void *word)
430 {
431         schedule();
432         return 0;
433 }
434 
435 static void wait_on_holder(struct gfs2_holder *gh)
436 {
437 	might_sleep();
438 	wait_on_bit(&gh->gh_iflags, HIF_WAIT, just_schedule, TASK_UNINTERRUPTIBLE);
439 }
440 
441 static void gfs2_demote_wake(struct gfs2_glock *gl)
442 {
443         clear_bit(GLF_DEMOTE, &gl->gl_flags);
444         smp_mb__after_clear_bit();
445         wake_up_bit(&gl->gl_flags, GLF_DEMOTE);
446 }
447 
448 static void wait_on_demote(struct gfs2_glock *gl)
449 {
450 	might_sleep();
451 	wait_on_bit(&gl->gl_flags, GLF_DEMOTE, just_schedule, TASK_UNINTERRUPTIBLE);
452 }
453 
454 /**
455  * rq_mutex - process a mutex request in the queue
456  * @gh: the glock holder
457  *
458  * Returns: 1 if the queue is blocked
459  */
460 
461 static int rq_mutex(struct gfs2_holder *gh)
462 {
463 	struct gfs2_glock *gl = gh->gh_gl;
464 
465 	list_del_init(&gh->gh_list);
466 	/*  gh->gh_error never examined.  */
467 	set_bit(GLF_LOCK, &gl->gl_flags);
468 	clear_bit(HIF_WAIT, &gh->gh_iflags);
469 	smp_mb();
470 	wake_up_bit(&gh->gh_iflags, HIF_WAIT);
471 
472 	return 1;
473 }
474 
475 /**
476  * rq_promote - process a promote request in the queue
477  * @gh: the glock holder
478  *
479  * Acquire a new inter-node lock, or change a lock state to more restrictive.
480  *
481  * Returns: 1 if the queue is blocked
482  */
483 
484 static int rq_promote(struct gfs2_holder *gh)
485 {
486 	struct gfs2_glock *gl = gh->gh_gl;
487 	struct gfs2_sbd *sdp = gl->gl_sbd;
488 
489 	if (!relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
490 		if (list_empty(&gl->gl_holders)) {
491 			gl->gl_req_gh = gh;
492 			set_bit(GLF_LOCK, &gl->gl_flags);
493 			spin_unlock(&gl->gl_spin);
494 
495 			if (atomic_read(&sdp->sd_reclaim_count) >
496 			    gfs2_tune_get(sdp, gt_reclaim_limit) &&
497 			    !(gh->gh_flags & LM_FLAG_PRIORITY)) {
498 				gfs2_reclaim_glock(sdp);
499 				gfs2_reclaim_glock(sdp);
500 			}
501 
502 			gfs2_glock_xmote_th(gh->gh_gl, gh);
503 			spin_lock(&gl->gl_spin);
504 		}
505 		return 1;
506 	}
507 
508 	if (list_empty(&gl->gl_holders)) {
509 		set_bit(HIF_FIRST, &gh->gh_iflags);
510 		set_bit(GLF_LOCK, &gl->gl_flags);
511 	} else {
512 		struct gfs2_holder *next_gh;
513 		if (gh->gh_state == LM_ST_EXCLUSIVE)
514 			return 1;
515 		next_gh = list_entry(gl->gl_holders.next, struct gfs2_holder,
516 				     gh_list);
517 		if (next_gh->gh_state == LM_ST_EXCLUSIVE)
518 			 return 1;
519 	}
520 
521 	list_move_tail(&gh->gh_list, &gl->gl_holders);
522 	gh->gh_error = 0;
523 	set_bit(HIF_HOLDER, &gh->gh_iflags);
524 
525 	gfs2_holder_wake(gh);
526 
527 	return 0;
528 }
529 
530 /**
531  * rq_demote - process a demote request in the queue
532  * @gh: the glock holder
533  *
534  * Returns: 1 if the queue is blocked
535  */
536 
537 static int rq_demote(struct gfs2_glock *gl)
538 {
539 	if (!list_empty(&gl->gl_holders))
540 		return 1;
541 
542 	if (gl->gl_state == gl->gl_demote_state ||
543 	    gl->gl_state == LM_ST_UNLOCKED) {
544 		gfs2_demote_wake(gl);
545 		return 0;
546 	}
547 	set_bit(GLF_LOCK, &gl->gl_flags);
548 	spin_unlock(&gl->gl_spin);
549 	if (gl->gl_demote_state == LM_ST_UNLOCKED ||
550 	    gl->gl_state != LM_ST_EXCLUSIVE)
551 		gfs2_glock_drop_th(gl);
552 	else
553 		gfs2_glock_xmote_th(gl, NULL);
554 	spin_lock(&gl->gl_spin);
555 
556 	return 0;
557 }
558 
559 /**
560  * run_queue - process holder structures on a glock
561  * @gl: the glock
562  *
563  */
564 static void run_queue(struct gfs2_glock *gl)
565 {
566 	struct gfs2_holder *gh;
567 	int blocked = 1;
568 
569 	for (;;) {
570 		if (test_bit(GLF_LOCK, &gl->gl_flags))
571 			break;
572 
573 		if (!list_empty(&gl->gl_waiters1)) {
574 			gh = list_entry(gl->gl_waiters1.next,
575 					struct gfs2_holder, gh_list);
576 
577 			if (test_bit(HIF_MUTEX, &gh->gh_iflags))
578 				blocked = rq_mutex(gh);
579 			else
580 				gfs2_assert_warn(gl->gl_sbd, 0);
581 
582 		} else if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
583 			blocked = rq_demote(gl);
584 		} else if (!list_empty(&gl->gl_waiters3)) {
585 			gh = list_entry(gl->gl_waiters3.next,
586 					struct gfs2_holder, gh_list);
587 
588 			if (test_bit(HIF_PROMOTE, &gh->gh_iflags))
589 				blocked = rq_promote(gh);
590 			else
591 				gfs2_assert_warn(gl->gl_sbd, 0);
592 
593 		} else
594 			break;
595 
596 		if (blocked)
597 			break;
598 	}
599 }
600 
601 /**
602  * gfs2_glmutex_lock - acquire a local lock on a glock
603  * @gl: the glock
604  *
605  * Gives caller exclusive access to manipulate a glock structure.
606  */
607 
608 static void gfs2_glmutex_lock(struct gfs2_glock *gl)
609 {
610 	struct gfs2_holder gh;
611 
612 	gfs2_holder_init(gl, 0, 0, &gh);
613 	set_bit(HIF_MUTEX, &gh.gh_iflags);
614 	if (test_and_set_bit(HIF_WAIT, &gh.gh_iflags))
615 		BUG();
616 
617 	spin_lock(&gl->gl_spin);
618 	if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
619 		list_add_tail(&gh.gh_list, &gl->gl_waiters1);
620 	} else {
621 		gl->gl_owner_pid = current->pid;
622 		gl->gl_ip = (unsigned long)__builtin_return_address(0);
623 		clear_bit(HIF_WAIT, &gh.gh_iflags);
624 		smp_mb();
625 		wake_up_bit(&gh.gh_iflags, HIF_WAIT);
626 	}
627 	spin_unlock(&gl->gl_spin);
628 
629 	wait_on_holder(&gh);
630 	gfs2_holder_uninit(&gh);
631 }
632 
633 /**
634  * gfs2_glmutex_trylock - try to acquire a local lock on a glock
635  * @gl: the glock
636  *
637  * Returns: 1 if the glock is acquired
638  */
639 
640 static int gfs2_glmutex_trylock(struct gfs2_glock *gl)
641 {
642 	int acquired = 1;
643 
644 	spin_lock(&gl->gl_spin);
645 	if (test_and_set_bit(GLF_LOCK, &gl->gl_flags)) {
646 		acquired = 0;
647 	} else {
648 		gl->gl_owner_pid = current->pid;
649 		gl->gl_ip = (unsigned long)__builtin_return_address(0);
650 	}
651 	spin_unlock(&gl->gl_spin);
652 
653 	return acquired;
654 }
655 
656 /**
657  * gfs2_glmutex_unlock - release a local lock on a glock
658  * @gl: the glock
659  *
660  */
661 
662 static void gfs2_glmutex_unlock(struct gfs2_glock *gl)
663 {
664 	spin_lock(&gl->gl_spin);
665 	clear_bit(GLF_LOCK, &gl->gl_flags);
666 	gl->gl_owner_pid = 0;
667 	gl->gl_ip = 0;
668 	run_queue(gl);
669 	BUG_ON(!spin_is_locked(&gl->gl_spin));
670 	spin_unlock(&gl->gl_spin);
671 }
672 
673 /**
674  * handle_callback - process a demote request
675  * @gl: the glock
676  * @state: the state the caller wants us to change to
677  *
678  * There are only two requests that we are going to see in actual
679  * practise: LM_ST_SHARED and LM_ST_UNLOCKED
680  */
681 
682 static void handle_callback(struct gfs2_glock *gl, unsigned int state, int remote)
683 {
684 	spin_lock(&gl->gl_spin);
685 	if (test_and_set_bit(GLF_DEMOTE, &gl->gl_flags) == 0) {
686 		gl->gl_demote_state = state;
687 		gl->gl_demote_time = jiffies;
688 		if (remote && gl->gl_ops->go_type == LM_TYPE_IOPEN &&
689 		    gl->gl_object) {
690 			struct inode *inode = igrab(gl->gl_object);
691 			spin_unlock(&gl->gl_spin);
692 			if (inode) {
693 				d_prune_aliases(inode);
694 				iput(inode);
695 			}
696 			return;
697 		}
698 	} else if (gl->gl_demote_state != LM_ST_UNLOCKED) {
699 		gl->gl_demote_state = state;
700 	}
701 	spin_unlock(&gl->gl_spin);
702 }
703 
704 /**
705  * state_change - record that the glock is now in a different state
706  * @gl: the glock
707  * @new_state the new state
708  *
709  */
710 
711 static void state_change(struct gfs2_glock *gl, unsigned int new_state)
712 {
713 	int held1, held2;
714 
715 	held1 = (gl->gl_state != LM_ST_UNLOCKED);
716 	held2 = (new_state != LM_ST_UNLOCKED);
717 
718 	if (held1 != held2) {
719 		if (held2)
720 			gfs2_glock_hold(gl);
721 		else
722 			gfs2_glock_put(gl);
723 	}
724 
725 	gl->gl_state = new_state;
726 }
727 
728 /**
729  * xmote_bh - Called after the lock module is done acquiring a lock
730  * @gl: The glock in question
731  * @ret: the int returned from the lock module
732  *
733  */
734 
735 static void xmote_bh(struct gfs2_glock *gl, unsigned int ret)
736 {
737 	struct gfs2_sbd *sdp = gl->gl_sbd;
738 	const struct gfs2_glock_operations *glops = gl->gl_ops;
739 	struct gfs2_holder *gh = gl->gl_req_gh;
740 	int prev_state = gl->gl_state;
741 	int op_done = 1;
742 
743 	gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
744 	gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
745 	gfs2_assert_warn(sdp, !(ret & LM_OUT_ASYNC));
746 
747 	state_change(gl, ret & LM_OUT_ST_MASK);
748 
749 	if (prev_state != LM_ST_UNLOCKED && !(ret & LM_OUT_CACHEABLE)) {
750 		if (glops->go_inval)
751 			glops->go_inval(gl, DIO_METADATA);
752 	} else if (gl->gl_state == LM_ST_DEFERRED) {
753 		/* We might not want to do this here.
754 		   Look at moving to the inode glops. */
755 		if (glops->go_inval)
756 			glops->go_inval(gl, 0);
757 	}
758 
759 	/*  Deal with each possible exit condition  */
760 
761 	if (!gh) {
762 		gl->gl_stamp = jiffies;
763 		if (ret & LM_OUT_CANCELED)
764 			op_done = 0;
765 		else
766 			gfs2_demote_wake(gl);
767 	} else {
768 		spin_lock(&gl->gl_spin);
769 		list_del_init(&gh->gh_list);
770 		gh->gh_error = -EIO;
771 		if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags)))
772 			goto out;
773 		gh->gh_error = GLR_CANCELED;
774 		if (ret & LM_OUT_CANCELED)
775 			goto out;
776 		if (relaxed_state_ok(gl->gl_state, gh->gh_state, gh->gh_flags)) {
777 			list_add_tail(&gh->gh_list, &gl->gl_holders);
778 			gh->gh_error = 0;
779 			set_bit(HIF_HOLDER, &gh->gh_iflags);
780 			set_bit(HIF_FIRST, &gh->gh_iflags);
781 			op_done = 0;
782 			goto out;
783 		}
784 		gh->gh_error = GLR_TRYFAILED;
785 		if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB))
786 			goto out;
787 		gh->gh_error = -EINVAL;
788 		if (gfs2_assert_withdraw(sdp, 0) == -1)
789 			fs_err(sdp, "ret = 0x%.8X\n", ret);
790 out:
791 		spin_unlock(&gl->gl_spin);
792 	}
793 
794 	if (glops->go_xmote_bh)
795 		glops->go_xmote_bh(gl);
796 
797 	if (op_done) {
798 		spin_lock(&gl->gl_spin);
799 		gl->gl_req_gh = NULL;
800 		gl->gl_req_bh = NULL;
801 		clear_bit(GLF_LOCK, &gl->gl_flags);
802 		run_queue(gl);
803 		spin_unlock(&gl->gl_spin);
804 	}
805 
806 	gfs2_glock_put(gl);
807 
808 	if (gh)
809 		gfs2_holder_wake(gh);
810 }
811 
812 /**
813  * gfs2_glock_xmote_th - Call into the lock module to acquire or change a glock
814  * @gl: The glock in question
815  * @state: the requested state
816  * @flags: modifier flags to the lock call
817  *
818  */
819 
820 void gfs2_glock_xmote_th(struct gfs2_glock *gl, struct gfs2_holder *gh)
821 {
822 	struct gfs2_sbd *sdp = gl->gl_sbd;
823 	int flags = gh ? gh->gh_flags : 0;
824 	unsigned state = gh ? gh->gh_state : gl->gl_demote_state;
825 	const struct gfs2_glock_operations *glops = gl->gl_ops;
826 	int lck_flags = flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB |
827 				 LM_FLAG_NOEXP | LM_FLAG_ANY |
828 				 LM_FLAG_PRIORITY);
829 	unsigned int lck_ret;
830 
831 	if (glops->go_xmote_th)
832 		glops->go_xmote_th(gl);
833 
834 	gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
835 	gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
836 	gfs2_assert_warn(sdp, state != LM_ST_UNLOCKED);
837 	gfs2_assert_warn(sdp, state != gl->gl_state);
838 
839 	gfs2_glock_hold(gl);
840 	gl->gl_req_bh = xmote_bh;
841 
842 	lck_ret = gfs2_lm_lock(sdp, gl->gl_lock, gl->gl_state, state, lck_flags);
843 
844 	if (gfs2_assert_withdraw(sdp, !(lck_ret & LM_OUT_ERROR)))
845 		return;
846 
847 	if (lck_ret & LM_OUT_ASYNC)
848 		gfs2_assert_warn(sdp, lck_ret == LM_OUT_ASYNC);
849 	else
850 		xmote_bh(gl, lck_ret);
851 }
852 
853 /**
854  * drop_bh - Called after a lock module unlock completes
855  * @gl: the glock
856  * @ret: the return status
857  *
858  * Doesn't wake up the process waiting on the struct gfs2_holder (if any)
859  * Doesn't drop the reference on the glock the top half took out
860  *
861  */
862 
863 static void drop_bh(struct gfs2_glock *gl, unsigned int ret)
864 {
865 	struct gfs2_sbd *sdp = gl->gl_sbd;
866 	const struct gfs2_glock_operations *glops = gl->gl_ops;
867 	struct gfs2_holder *gh = gl->gl_req_gh;
868 
869 	gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
870 	gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
871 	gfs2_assert_warn(sdp, !ret);
872 
873 	state_change(gl, LM_ST_UNLOCKED);
874 	gfs2_demote_wake(gl);
875 
876 	if (glops->go_inval)
877 		glops->go_inval(gl, DIO_METADATA);
878 
879 	if (gh) {
880 		spin_lock(&gl->gl_spin);
881 		list_del_init(&gh->gh_list);
882 		gh->gh_error = 0;
883 		spin_unlock(&gl->gl_spin);
884 	}
885 
886 	spin_lock(&gl->gl_spin);
887 	gl->gl_req_gh = NULL;
888 	gl->gl_req_bh = NULL;
889 	clear_bit(GLF_LOCK, &gl->gl_flags);
890 	run_queue(gl);
891 	spin_unlock(&gl->gl_spin);
892 
893 	gfs2_glock_put(gl);
894 
895 	if (gh)
896 		gfs2_holder_wake(gh);
897 }
898 
899 /**
900  * gfs2_glock_drop_th - call into the lock module to unlock a lock
901  * @gl: the glock
902  *
903  */
904 
905 static void gfs2_glock_drop_th(struct gfs2_glock *gl)
906 {
907 	struct gfs2_sbd *sdp = gl->gl_sbd;
908 	const struct gfs2_glock_operations *glops = gl->gl_ops;
909 	unsigned int ret;
910 
911 	if (glops->go_drop_th)
912 		glops->go_drop_th(gl);
913 
914 	gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
915 	gfs2_assert_warn(sdp, list_empty(&gl->gl_holders));
916 	gfs2_assert_warn(sdp, gl->gl_state != LM_ST_UNLOCKED);
917 
918 	gfs2_glock_hold(gl);
919 	gl->gl_req_bh = drop_bh;
920 
921 	ret = gfs2_lm_unlock(sdp, gl->gl_lock, gl->gl_state);
922 
923 	if (gfs2_assert_withdraw(sdp, !(ret & LM_OUT_ERROR)))
924 		return;
925 
926 	if (!ret)
927 		drop_bh(gl, ret);
928 	else
929 		gfs2_assert_warn(sdp, ret == LM_OUT_ASYNC);
930 }
931 
932 /**
933  * do_cancels - cancel requests for locks stuck waiting on an expire flag
934  * @gh: the LM_FLAG_PRIORITY holder waiting to acquire the lock
935  *
936  * Don't cancel GL_NOCANCEL requests.
937  */
938 
939 static void do_cancels(struct gfs2_holder *gh)
940 {
941 	struct gfs2_glock *gl = gh->gh_gl;
942 
943 	spin_lock(&gl->gl_spin);
944 
945 	while (gl->gl_req_gh != gh &&
946 	       !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
947 	       !list_empty(&gh->gh_list)) {
948 		if (gl->gl_req_bh && !(gl->gl_req_gh &&
949 				     (gl->gl_req_gh->gh_flags & GL_NOCANCEL))) {
950 			spin_unlock(&gl->gl_spin);
951 			gfs2_lm_cancel(gl->gl_sbd, gl->gl_lock);
952 			msleep(100);
953 			spin_lock(&gl->gl_spin);
954 		} else {
955 			spin_unlock(&gl->gl_spin);
956 			msleep(100);
957 			spin_lock(&gl->gl_spin);
958 		}
959 	}
960 
961 	spin_unlock(&gl->gl_spin);
962 }
963 
964 /**
965  * glock_wait_internal - wait on a glock acquisition
966  * @gh: the glock holder
967  *
968  * Returns: 0 on success
969  */
970 
971 static int glock_wait_internal(struct gfs2_holder *gh)
972 {
973 	struct gfs2_glock *gl = gh->gh_gl;
974 	struct gfs2_sbd *sdp = gl->gl_sbd;
975 	const struct gfs2_glock_operations *glops = gl->gl_ops;
976 
977 	if (test_bit(HIF_ABORTED, &gh->gh_iflags))
978 		return -EIO;
979 
980 	if (gh->gh_flags & (LM_FLAG_TRY | LM_FLAG_TRY_1CB)) {
981 		spin_lock(&gl->gl_spin);
982 		if (gl->gl_req_gh != gh &&
983 		    !test_bit(HIF_HOLDER, &gh->gh_iflags) &&
984 		    !list_empty(&gh->gh_list)) {
985 			list_del_init(&gh->gh_list);
986 			gh->gh_error = GLR_TRYFAILED;
987 			run_queue(gl);
988 			spin_unlock(&gl->gl_spin);
989 			return gh->gh_error;
990 		}
991 		spin_unlock(&gl->gl_spin);
992 	}
993 
994 	if (gh->gh_flags & LM_FLAG_PRIORITY)
995 		do_cancels(gh);
996 
997 	wait_on_holder(gh);
998 	if (gh->gh_error)
999 		return gh->gh_error;
1000 
1001 	gfs2_assert_withdraw(sdp, test_bit(HIF_HOLDER, &gh->gh_iflags));
1002 	gfs2_assert_withdraw(sdp, relaxed_state_ok(gl->gl_state, gh->gh_state,
1003 						   gh->gh_flags));
1004 
1005 	if (test_bit(HIF_FIRST, &gh->gh_iflags)) {
1006 		gfs2_assert_warn(sdp, test_bit(GLF_LOCK, &gl->gl_flags));
1007 
1008 		if (glops->go_lock) {
1009 			gh->gh_error = glops->go_lock(gh);
1010 			if (gh->gh_error) {
1011 				spin_lock(&gl->gl_spin);
1012 				list_del_init(&gh->gh_list);
1013 				spin_unlock(&gl->gl_spin);
1014 			}
1015 		}
1016 
1017 		spin_lock(&gl->gl_spin);
1018 		gl->gl_req_gh = NULL;
1019 		gl->gl_req_bh = NULL;
1020 		clear_bit(GLF_LOCK, &gl->gl_flags);
1021 		run_queue(gl);
1022 		spin_unlock(&gl->gl_spin);
1023 	}
1024 
1025 	return gh->gh_error;
1026 }
1027 
1028 static inline struct gfs2_holder *
1029 find_holder_by_owner(struct list_head *head, pid_t pid)
1030 {
1031 	struct gfs2_holder *gh;
1032 
1033 	list_for_each_entry(gh, head, gh_list) {
1034 		if (gh->gh_owner_pid == pid)
1035 			return gh;
1036 	}
1037 
1038 	return NULL;
1039 }
1040 
1041 static void print_dbg(struct glock_iter *gi, const char *fmt, ...)
1042 {
1043 	va_list args;
1044 
1045 	va_start(args, fmt);
1046 	if (gi) {
1047 		vsprintf(gi->string, fmt, args);
1048 		seq_printf(gi->seq, gi->string);
1049 	}
1050 	else
1051 		vprintk(fmt, args);
1052 	va_end(args);
1053 }
1054 
1055 /**
1056  * add_to_queue - Add a holder to the wait queue (but look for recursion)
1057  * @gh: the holder structure to add
1058  *
1059  */
1060 
1061 static void add_to_queue(struct gfs2_holder *gh)
1062 {
1063 	struct gfs2_glock *gl = gh->gh_gl;
1064 	struct gfs2_holder *existing;
1065 
1066 	BUG_ON(!gh->gh_owner_pid);
1067 	if (test_and_set_bit(HIF_WAIT, &gh->gh_iflags))
1068 		BUG();
1069 
1070 	existing = find_holder_by_owner(&gl->gl_holders, gh->gh_owner_pid);
1071 	if (existing) {
1072 		print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1073 		printk(KERN_INFO "pid : %d\n", existing->gh_owner_pid);
1074 		printk(KERN_INFO "lock type : %d lock state : %d\n",
1075 				existing->gh_gl->gl_name.ln_type, existing->gh_gl->gl_state);
1076 		print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1077 		printk(KERN_INFO "pid : %d\n", gh->gh_owner_pid);
1078 		printk(KERN_INFO "lock type : %d lock state : %d\n",
1079 				gl->gl_name.ln_type, gl->gl_state);
1080 		BUG();
1081 	}
1082 
1083 	existing = find_holder_by_owner(&gl->gl_waiters3, gh->gh_owner_pid);
1084 	if (existing) {
1085 		print_symbol(KERN_WARNING "original: %s\n", existing->gh_ip);
1086 		print_symbol(KERN_WARNING "new: %s\n", gh->gh_ip);
1087 		BUG();
1088 	}
1089 
1090 	if (gh->gh_flags & LM_FLAG_PRIORITY)
1091 		list_add(&gh->gh_list, &gl->gl_waiters3);
1092 	else
1093 		list_add_tail(&gh->gh_list, &gl->gl_waiters3);
1094 }
1095 
1096 /**
1097  * gfs2_glock_nq - enqueue a struct gfs2_holder onto a glock (acquire a glock)
1098  * @gh: the holder structure
1099  *
1100  * if (gh->gh_flags & GL_ASYNC), this never returns an error
1101  *
1102  * Returns: 0, GLR_TRYFAILED, or errno on failure
1103  */
1104 
1105 int gfs2_glock_nq(struct gfs2_holder *gh)
1106 {
1107 	struct gfs2_glock *gl = gh->gh_gl;
1108 	struct gfs2_sbd *sdp = gl->gl_sbd;
1109 	int error = 0;
1110 
1111 restart:
1112 	if (unlikely(test_bit(SDF_SHUTDOWN, &sdp->sd_flags))) {
1113 		set_bit(HIF_ABORTED, &gh->gh_iflags);
1114 		return -EIO;
1115 	}
1116 
1117 	set_bit(HIF_PROMOTE, &gh->gh_iflags);
1118 
1119 	spin_lock(&gl->gl_spin);
1120 	add_to_queue(gh);
1121 	run_queue(gl);
1122 	spin_unlock(&gl->gl_spin);
1123 
1124 	if (!(gh->gh_flags & GL_ASYNC)) {
1125 		error = glock_wait_internal(gh);
1126 		if (error == GLR_CANCELED) {
1127 			msleep(100);
1128 			goto restart;
1129 		}
1130 	}
1131 
1132 	return error;
1133 }
1134 
1135 /**
1136  * gfs2_glock_poll - poll to see if an async request has been completed
1137  * @gh: the holder
1138  *
1139  * Returns: 1 if the request is ready to be gfs2_glock_wait()ed on
1140  */
1141 
1142 int gfs2_glock_poll(struct gfs2_holder *gh)
1143 {
1144 	struct gfs2_glock *gl = gh->gh_gl;
1145 	int ready = 0;
1146 
1147 	spin_lock(&gl->gl_spin);
1148 
1149 	if (test_bit(HIF_HOLDER, &gh->gh_iflags))
1150 		ready = 1;
1151 	else if (list_empty(&gh->gh_list)) {
1152 		if (gh->gh_error == GLR_CANCELED) {
1153 			spin_unlock(&gl->gl_spin);
1154 			msleep(100);
1155 			if (gfs2_glock_nq(gh))
1156 				return 1;
1157 			return 0;
1158 		} else
1159 			ready = 1;
1160 	}
1161 
1162 	spin_unlock(&gl->gl_spin);
1163 
1164 	return ready;
1165 }
1166 
1167 /**
1168  * gfs2_glock_wait - wait for a lock acquisition that ended in a GLR_ASYNC
1169  * @gh: the holder structure
1170  *
1171  * Returns: 0, GLR_TRYFAILED, or errno on failure
1172  */
1173 
1174 int gfs2_glock_wait(struct gfs2_holder *gh)
1175 {
1176 	int error;
1177 
1178 	error = glock_wait_internal(gh);
1179 	if (error == GLR_CANCELED) {
1180 		msleep(100);
1181 		gh->gh_flags &= ~GL_ASYNC;
1182 		error = gfs2_glock_nq(gh);
1183 	}
1184 
1185 	return error;
1186 }
1187 
1188 /**
1189  * gfs2_glock_dq - dequeue a struct gfs2_holder from a glock (release a glock)
1190  * @gh: the glock holder
1191  *
1192  */
1193 
1194 void gfs2_glock_dq(struct gfs2_holder *gh)
1195 {
1196 	struct gfs2_glock *gl = gh->gh_gl;
1197 	const struct gfs2_glock_operations *glops = gl->gl_ops;
1198 
1199 	if (gh->gh_flags & GL_NOCACHE)
1200 		handle_callback(gl, LM_ST_UNLOCKED, 0);
1201 
1202 	gfs2_glmutex_lock(gl);
1203 
1204 	spin_lock(&gl->gl_spin);
1205 	list_del_init(&gh->gh_list);
1206 
1207 	if (list_empty(&gl->gl_holders)) {
1208 		spin_unlock(&gl->gl_spin);
1209 
1210 		if (glops->go_unlock)
1211 			glops->go_unlock(gh);
1212 
1213 		spin_lock(&gl->gl_spin);
1214 		gl->gl_stamp = jiffies;
1215 	}
1216 
1217 	clear_bit(GLF_LOCK, &gl->gl_flags);
1218 	run_queue(gl);
1219 	spin_unlock(&gl->gl_spin);
1220 }
1221 
1222 void gfs2_glock_dq_wait(struct gfs2_holder *gh)
1223 {
1224 	struct gfs2_glock *gl = gh->gh_gl;
1225 	gfs2_glock_dq(gh);
1226 	wait_on_demote(gl);
1227 }
1228 
1229 /**
1230  * gfs2_glock_dq_uninit - dequeue a holder from a glock and initialize it
1231  * @gh: the holder structure
1232  *
1233  */
1234 
1235 void gfs2_glock_dq_uninit(struct gfs2_holder *gh)
1236 {
1237 	gfs2_glock_dq(gh);
1238 	gfs2_holder_uninit(gh);
1239 }
1240 
1241 /**
1242  * gfs2_glock_nq_num - acquire a glock based on lock number
1243  * @sdp: the filesystem
1244  * @number: the lock number
1245  * @glops: the glock operations for the type of glock
1246  * @state: the state to acquire the glock in
1247  * @flags: modifier flags for the aquisition
1248  * @gh: the struct gfs2_holder
1249  *
1250  * Returns: errno
1251  */
1252 
1253 int gfs2_glock_nq_num(struct gfs2_sbd *sdp, u64 number,
1254 		      const struct gfs2_glock_operations *glops,
1255 		      unsigned int state, int flags, struct gfs2_holder *gh)
1256 {
1257 	struct gfs2_glock *gl;
1258 	int error;
1259 
1260 	error = gfs2_glock_get(sdp, number, glops, CREATE, &gl);
1261 	if (!error) {
1262 		error = gfs2_glock_nq_init(gl, state, flags, gh);
1263 		gfs2_glock_put(gl);
1264 	}
1265 
1266 	return error;
1267 }
1268 
1269 /**
1270  * glock_compare - Compare two struct gfs2_glock structures for sorting
1271  * @arg_a: the first structure
1272  * @arg_b: the second structure
1273  *
1274  */
1275 
1276 static int glock_compare(const void *arg_a, const void *arg_b)
1277 {
1278 	const struct gfs2_holder *gh_a = *(const struct gfs2_holder **)arg_a;
1279 	const struct gfs2_holder *gh_b = *(const struct gfs2_holder **)arg_b;
1280 	const struct lm_lockname *a = &gh_a->gh_gl->gl_name;
1281 	const struct lm_lockname *b = &gh_b->gh_gl->gl_name;
1282 
1283 	if (a->ln_number > b->ln_number)
1284 		return 1;
1285 	if (a->ln_number < b->ln_number)
1286 		return -1;
1287 	BUG_ON(gh_a->gh_gl->gl_ops->go_type == gh_b->gh_gl->gl_ops->go_type);
1288 	return 0;
1289 }
1290 
1291 /**
1292  * nq_m_sync - synchonously acquire more than one glock in deadlock free order
1293  * @num_gh: the number of structures
1294  * @ghs: an array of struct gfs2_holder structures
1295  *
1296  * Returns: 0 on success (all glocks acquired),
1297  *          errno on failure (no glocks acquired)
1298  */
1299 
1300 static int nq_m_sync(unsigned int num_gh, struct gfs2_holder *ghs,
1301 		     struct gfs2_holder **p)
1302 {
1303 	unsigned int x;
1304 	int error = 0;
1305 
1306 	for (x = 0; x < num_gh; x++)
1307 		p[x] = &ghs[x];
1308 
1309 	sort(p, num_gh, sizeof(struct gfs2_holder *), glock_compare, NULL);
1310 
1311 	for (x = 0; x < num_gh; x++) {
1312 		p[x]->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1313 
1314 		error = gfs2_glock_nq(p[x]);
1315 		if (error) {
1316 			while (x--)
1317 				gfs2_glock_dq(p[x]);
1318 			break;
1319 		}
1320 	}
1321 
1322 	return error;
1323 }
1324 
1325 /**
1326  * gfs2_glock_nq_m - acquire multiple glocks
1327  * @num_gh: the number of structures
1328  * @ghs: an array of struct gfs2_holder structures
1329  *
1330  *
1331  * Returns: 0 on success (all glocks acquired),
1332  *          errno on failure (no glocks acquired)
1333  */
1334 
1335 int gfs2_glock_nq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1336 {
1337 	struct gfs2_holder *tmp[4];
1338 	struct gfs2_holder **pph = tmp;
1339 	int error = 0;
1340 
1341 	switch(num_gh) {
1342 	case 0:
1343 		return 0;
1344 	case 1:
1345 		ghs->gh_flags &= ~(LM_FLAG_TRY | GL_ASYNC);
1346 		return gfs2_glock_nq(ghs);
1347 	default:
1348 		if (num_gh <= 4)
1349 			break;
1350 		pph = kmalloc(num_gh * sizeof(struct gfs2_holder *), GFP_NOFS);
1351 		if (!pph)
1352 			return -ENOMEM;
1353 	}
1354 
1355 	error = nq_m_sync(num_gh, ghs, pph);
1356 
1357 	if (pph != tmp)
1358 		kfree(pph);
1359 
1360 	return error;
1361 }
1362 
1363 /**
1364  * gfs2_glock_dq_m - release multiple glocks
1365  * @num_gh: the number of structures
1366  * @ghs: an array of struct gfs2_holder structures
1367  *
1368  */
1369 
1370 void gfs2_glock_dq_m(unsigned int num_gh, struct gfs2_holder *ghs)
1371 {
1372 	unsigned int x;
1373 
1374 	for (x = 0; x < num_gh; x++)
1375 		gfs2_glock_dq(&ghs[x]);
1376 }
1377 
1378 /**
1379  * gfs2_glock_dq_uninit_m - release multiple glocks
1380  * @num_gh: the number of structures
1381  * @ghs: an array of struct gfs2_holder structures
1382  *
1383  */
1384 
1385 void gfs2_glock_dq_uninit_m(unsigned int num_gh, struct gfs2_holder *ghs)
1386 {
1387 	unsigned int x;
1388 
1389 	for (x = 0; x < num_gh; x++)
1390 		gfs2_glock_dq_uninit(&ghs[x]);
1391 }
1392 
1393 /**
1394  * gfs2_lvb_hold - attach a LVB from a glock
1395  * @gl: The glock in question
1396  *
1397  */
1398 
1399 int gfs2_lvb_hold(struct gfs2_glock *gl)
1400 {
1401 	int error;
1402 
1403 	gfs2_glmutex_lock(gl);
1404 
1405 	if (!atomic_read(&gl->gl_lvb_count)) {
1406 		error = gfs2_lm_hold_lvb(gl->gl_sbd, gl->gl_lock, &gl->gl_lvb);
1407 		if (error) {
1408 			gfs2_glmutex_unlock(gl);
1409 			return error;
1410 		}
1411 		gfs2_glock_hold(gl);
1412 	}
1413 	atomic_inc(&gl->gl_lvb_count);
1414 
1415 	gfs2_glmutex_unlock(gl);
1416 
1417 	return 0;
1418 }
1419 
1420 /**
1421  * gfs2_lvb_unhold - detach a LVB from a glock
1422  * @gl: The glock in question
1423  *
1424  */
1425 
1426 void gfs2_lvb_unhold(struct gfs2_glock *gl)
1427 {
1428 	gfs2_glock_hold(gl);
1429 	gfs2_glmutex_lock(gl);
1430 
1431 	gfs2_assert(gl->gl_sbd, atomic_read(&gl->gl_lvb_count) > 0);
1432 	if (atomic_dec_and_test(&gl->gl_lvb_count)) {
1433 		gfs2_lm_unhold_lvb(gl->gl_sbd, gl->gl_lock, gl->gl_lvb);
1434 		gl->gl_lvb = NULL;
1435 		gfs2_glock_put(gl);
1436 	}
1437 
1438 	gfs2_glmutex_unlock(gl);
1439 	gfs2_glock_put(gl);
1440 }
1441 
1442 static void blocking_cb(struct gfs2_sbd *sdp, struct lm_lockname *name,
1443 			unsigned int state)
1444 {
1445 	struct gfs2_glock *gl;
1446 
1447 	gl = gfs2_glock_find(sdp, name);
1448 	if (!gl)
1449 		return;
1450 
1451 	handle_callback(gl, state, 1);
1452 
1453 	spin_lock(&gl->gl_spin);
1454 	run_queue(gl);
1455 	spin_unlock(&gl->gl_spin);
1456 
1457 	gfs2_glock_put(gl);
1458 }
1459 
1460 /**
1461  * gfs2_glock_cb - Callback used by locking module
1462  * @sdp: Pointer to the superblock
1463  * @type: Type of callback
1464  * @data: Type dependent data pointer
1465  *
1466  * Called by the locking module when it wants to tell us something.
1467  * Either we need to drop a lock, one of our ASYNC requests completed, or
1468  * a journal from another client needs to be recovered.
1469  */
1470 
1471 void gfs2_glock_cb(void *cb_data, unsigned int type, void *data)
1472 {
1473 	struct gfs2_sbd *sdp = cb_data;
1474 
1475 	switch (type) {
1476 	case LM_CB_NEED_E:
1477 		blocking_cb(sdp, data, LM_ST_UNLOCKED);
1478 		return;
1479 
1480 	case LM_CB_NEED_D:
1481 		blocking_cb(sdp, data, LM_ST_DEFERRED);
1482 		return;
1483 
1484 	case LM_CB_NEED_S:
1485 		blocking_cb(sdp, data, LM_ST_SHARED);
1486 		return;
1487 
1488 	case LM_CB_ASYNC: {
1489 		struct lm_async_cb *async = data;
1490 		struct gfs2_glock *gl;
1491 
1492 		down_read(&gfs2_umount_flush_sem);
1493 		gl = gfs2_glock_find(sdp, &async->lc_name);
1494 		if (gfs2_assert_warn(sdp, gl))
1495 			return;
1496 		if (!gfs2_assert_warn(sdp, gl->gl_req_bh))
1497 			gl->gl_req_bh(gl, async->lc_ret);
1498 		gfs2_glock_put(gl);
1499 		up_read(&gfs2_umount_flush_sem);
1500 		return;
1501 	}
1502 
1503 	case LM_CB_NEED_RECOVERY:
1504 		gfs2_jdesc_make_dirty(sdp, *(unsigned int *)data);
1505 		if (sdp->sd_recoverd_process)
1506 			wake_up_process(sdp->sd_recoverd_process);
1507 		return;
1508 
1509 	case LM_CB_DROPLOCKS:
1510 		gfs2_gl_hash_clear(sdp, NO_WAIT);
1511 		gfs2_quota_scan(sdp);
1512 		return;
1513 
1514 	default:
1515 		gfs2_assert_warn(sdp, 0);
1516 		return;
1517 	}
1518 }
1519 
1520 /**
1521  * demote_ok - Check to see if it's ok to unlock a glock
1522  * @gl: the glock
1523  *
1524  * Returns: 1 if it's ok
1525  */
1526 
1527 static int demote_ok(struct gfs2_glock *gl)
1528 {
1529 	const struct gfs2_glock_operations *glops = gl->gl_ops;
1530 	int demote = 1;
1531 
1532 	if (test_bit(GLF_STICKY, &gl->gl_flags))
1533 		demote = 0;
1534 	else if (glops->go_demote_ok)
1535 		demote = glops->go_demote_ok(gl);
1536 
1537 	return demote;
1538 }
1539 
1540 /**
1541  * gfs2_glock_schedule_for_reclaim - Add a glock to the reclaim list
1542  * @gl: the glock
1543  *
1544  */
1545 
1546 void gfs2_glock_schedule_for_reclaim(struct gfs2_glock *gl)
1547 {
1548 	struct gfs2_sbd *sdp = gl->gl_sbd;
1549 
1550 	spin_lock(&sdp->sd_reclaim_lock);
1551 	if (list_empty(&gl->gl_reclaim)) {
1552 		gfs2_glock_hold(gl);
1553 		list_add(&gl->gl_reclaim, &sdp->sd_reclaim_list);
1554 		atomic_inc(&sdp->sd_reclaim_count);
1555 	}
1556 	spin_unlock(&sdp->sd_reclaim_lock);
1557 
1558 	wake_up(&sdp->sd_reclaim_wq);
1559 }
1560 
1561 /**
1562  * gfs2_reclaim_glock - process the next glock on the filesystem's reclaim list
1563  * @sdp: the filesystem
1564  *
1565  * Called from gfs2_glockd() glock reclaim daemon, or when promoting a
1566  * different glock and we notice that there are a lot of glocks in the
1567  * reclaim list.
1568  *
1569  */
1570 
1571 void gfs2_reclaim_glock(struct gfs2_sbd *sdp)
1572 {
1573 	struct gfs2_glock *gl;
1574 
1575 	spin_lock(&sdp->sd_reclaim_lock);
1576 	if (list_empty(&sdp->sd_reclaim_list)) {
1577 		spin_unlock(&sdp->sd_reclaim_lock);
1578 		return;
1579 	}
1580 	gl = list_entry(sdp->sd_reclaim_list.next,
1581 			struct gfs2_glock, gl_reclaim);
1582 	list_del_init(&gl->gl_reclaim);
1583 	spin_unlock(&sdp->sd_reclaim_lock);
1584 
1585 	atomic_dec(&sdp->sd_reclaim_count);
1586 	atomic_inc(&sdp->sd_reclaimed);
1587 
1588 	if (gfs2_glmutex_trylock(gl)) {
1589 		if (list_empty(&gl->gl_holders) &&
1590 		    gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1591 			handle_callback(gl, LM_ST_UNLOCKED, 0);
1592 		gfs2_glmutex_unlock(gl);
1593 	}
1594 
1595 	gfs2_glock_put(gl);
1596 }
1597 
1598 /**
1599  * examine_bucket - Call a function for glock in a hash bucket
1600  * @examiner: the function
1601  * @sdp: the filesystem
1602  * @bucket: the bucket
1603  *
1604  * Returns: 1 if the bucket has entries
1605  */
1606 
1607 static int examine_bucket(glock_examiner examiner, struct gfs2_sbd *sdp,
1608 			  unsigned int hash)
1609 {
1610 	struct gfs2_glock *gl, *prev = NULL;
1611 	int has_entries = 0;
1612 	struct hlist_head *head = &gl_hash_table[hash].hb_list;
1613 
1614 	read_lock(gl_lock_addr(hash));
1615 	/* Can't use hlist_for_each_entry - don't want prefetch here */
1616 	if (hlist_empty(head))
1617 		goto out;
1618 	gl = list_entry(head->first, struct gfs2_glock, gl_list);
1619 	while(1) {
1620 		if (gl->gl_sbd == sdp) {
1621 			gfs2_glock_hold(gl);
1622 			read_unlock(gl_lock_addr(hash));
1623 			if (prev)
1624 				gfs2_glock_put(prev);
1625 			prev = gl;
1626 			examiner(gl);
1627 			has_entries = 1;
1628 			read_lock(gl_lock_addr(hash));
1629 		}
1630 		if (gl->gl_list.next == NULL)
1631 			break;
1632 		gl = list_entry(gl->gl_list.next, struct gfs2_glock, gl_list);
1633 	}
1634 out:
1635 	read_unlock(gl_lock_addr(hash));
1636 	if (prev)
1637 		gfs2_glock_put(prev);
1638 	return has_entries;
1639 }
1640 
1641 /**
1642  * scan_glock - look at a glock and see if we can reclaim it
1643  * @gl: the glock to look at
1644  *
1645  */
1646 
1647 static void scan_glock(struct gfs2_glock *gl)
1648 {
1649 	if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object)
1650 		return;
1651 
1652 	if (gfs2_glmutex_trylock(gl)) {
1653 		if (list_empty(&gl->gl_holders) &&
1654 		    gl->gl_state != LM_ST_UNLOCKED && demote_ok(gl))
1655 			goto out_schedule;
1656 		gfs2_glmutex_unlock(gl);
1657 	}
1658 	return;
1659 
1660 out_schedule:
1661 	gfs2_glmutex_unlock(gl);
1662 	gfs2_glock_schedule_for_reclaim(gl);
1663 }
1664 
1665 /**
1666  * gfs2_scand_internal - Look for glocks and inodes to toss from memory
1667  * @sdp: the filesystem
1668  *
1669  */
1670 
1671 void gfs2_scand_internal(struct gfs2_sbd *sdp)
1672 {
1673 	unsigned int x;
1674 
1675 	for (x = 0; x < GFS2_GL_HASH_SIZE; x++)
1676 		examine_bucket(scan_glock, sdp, x);
1677 }
1678 
1679 /**
1680  * clear_glock - look at a glock and see if we can free it from glock cache
1681  * @gl: the glock to look at
1682  *
1683  */
1684 
1685 static void clear_glock(struct gfs2_glock *gl)
1686 {
1687 	struct gfs2_sbd *sdp = gl->gl_sbd;
1688 	int released;
1689 
1690 	spin_lock(&sdp->sd_reclaim_lock);
1691 	if (!list_empty(&gl->gl_reclaim)) {
1692 		list_del_init(&gl->gl_reclaim);
1693 		atomic_dec(&sdp->sd_reclaim_count);
1694 		spin_unlock(&sdp->sd_reclaim_lock);
1695 		released = gfs2_glock_put(gl);
1696 		gfs2_assert(sdp, !released);
1697 	} else {
1698 		spin_unlock(&sdp->sd_reclaim_lock);
1699 	}
1700 
1701 	if (gfs2_glmutex_trylock(gl)) {
1702 		if (list_empty(&gl->gl_holders) &&
1703 		    gl->gl_state != LM_ST_UNLOCKED)
1704 			handle_callback(gl, LM_ST_UNLOCKED, 0);
1705 		gfs2_glmutex_unlock(gl);
1706 	}
1707 }
1708 
1709 /**
1710  * gfs2_gl_hash_clear - Empty out the glock hash table
1711  * @sdp: the filesystem
1712  * @wait: wait until it's all gone
1713  *
1714  * Called when unmounting the filesystem, or when inter-node lock manager
1715  * requests DROPLOCKS because it is running out of capacity.
1716  */
1717 
1718 void gfs2_gl_hash_clear(struct gfs2_sbd *sdp, int wait)
1719 {
1720 	unsigned long t;
1721 	unsigned int x;
1722 	int cont;
1723 
1724 	t = jiffies;
1725 
1726 	for (;;) {
1727 		cont = 0;
1728 		for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1729 			if (examine_bucket(clear_glock, sdp, x))
1730 				cont = 1;
1731 		}
1732 
1733 		if (!wait || !cont)
1734 			break;
1735 
1736 		if (time_after_eq(jiffies,
1737 				  t + gfs2_tune_get(sdp, gt_stall_secs) * HZ)) {
1738 			fs_warn(sdp, "Unmount seems to be stalled. "
1739 				     "Dumping lock state...\n");
1740 			gfs2_dump_lockstate(sdp);
1741 			t = jiffies;
1742 		}
1743 
1744 		down_write(&gfs2_umount_flush_sem);
1745 		invalidate_inodes(sdp->sd_vfs);
1746 		up_write(&gfs2_umount_flush_sem);
1747 		msleep(10);
1748 	}
1749 }
1750 
1751 /*
1752  *  Diagnostic routines to help debug distributed deadlock
1753  */
1754 
1755 static void gfs2_print_symbol(struct glock_iter *gi, const char *fmt,
1756                               unsigned long address)
1757 {
1758 	char buffer[KSYM_SYMBOL_LEN];
1759 
1760 	sprint_symbol(buffer, address);
1761 	print_dbg(gi, fmt, buffer);
1762 }
1763 
1764 /**
1765  * dump_holder - print information about a glock holder
1766  * @str: a string naming the type of holder
1767  * @gh: the glock holder
1768  *
1769  * Returns: 0 on success, -ENOBUFS when we run out of space
1770  */
1771 
1772 static int dump_holder(struct glock_iter *gi, char *str,
1773 		       struct gfs2_holder *gh)
1774 {
1775 	unsigned int x;
1776 	struct task_struct *gh_owner;
1777 
1778 	print_dbg(gi, "  %s\n", str);
1779 	if (gh->gh_owner_pid) {
1780 		print_dbg(gi, "    owner = %ld ", (long)gh->gh_owner_pid);
1781 		gh_owner = find_task_by_pid(gh->gh_owner_pid);
1782 		if (gh_owner)
1783 			print_dbg(gi, "(%s)\n", gh_owner->comm);
1784 		else
1785 			print_dbg(gi, "(ended)\n");
1786 	} else
1787 		print_dbg(gi, "    owner = -1\n");
1788 	print_dbg(gi, "    gh_state = %u\n", gh->gh_state);
1789 	print_dbg(gi, "    gh_flags =");
1790 	for (x = 0; x < 32; x++)
1791 		if (gh->gh_flags & (1 << x))
1792 			print_dbg(gi, " %u", x);
1793 	print_dbg(gi, " \n");
1794 	print_dbg(gi, "    error = %d\n", gh->gh_error);
1795 	print_dbg(gi, "    gh_iflags =");
1796 	for (x = 0; x < 32; x++)
1797 		if (test_bit(x, &gh->gh_iflags))
1798 			print_dbg(gi, " %u", x);
1799 	print_dbg(gi, " \n");
1800         gfs2_print_symbol(gi, "    initialized at: %s\n", gh->gh_ip);
1801 
1802 	return 0;
1803 }
1804 
1805 /**
1806  * dump_inode - print information about an inode
1807  * @ip: the inode
1808  *
1809  * Returns: 0 on success, -ENOBUFS when we run out of space
1810  */
1811 
1812 static int dump_inode(struct glock_iter *gi, struct gfs2_inode *ip)
1813 {
1814 	unsigned int x;
1815 
1816 	print_dbg(gi, "  Inode:\n");
1817 	print_dbg(gi, "    num = %llu/%llu\n",
1818 		  (unsigned long long)ip->i_no_formal_ino,
1819 		  (unsigned long long)ip->i_no_addr);
1820 	print_dbg(gi, "    type = %u\n", IF2DT(ip->i_inode.i_mode));
1821 	print_dbg(gi, "    i_flags =");
1822 	for (x = 0; x < 32; x++)
1823 		if (test_bit(x, &ip->i_flags))
1824 			print_dbg(gi, " %u", x);
1825 	print_dbg(gi, " \n");
1826 	return 0;
1827 }
1828 
1829 /**
1830  * dump_glock - print information about a glock
1831  * @gl: the glock
1832  * @count: where we are in the buffer
1833  *
1834  * Returns: 0 on success, -ENOBUFS when we run out of space
1835  */
1836 
1837 static int dump_glock(struct glock_iter *gi, struct gfs2_glock *gl)
1838 {
1839 	struct gfs2_holder *gh;
1840 	unsigned int x;
1841 	int error = -ENOBUFS;
1842 	struct task_struct *gl_owner;
1843 
1844 	spin_lock(&gl->gl_spin);
1845 
1846 	print_dbg(gi, "Glock 0x%p (%u, %llu)\n", gl, gl->gl_name.ln_type,
1847 		   (unsigned long long)gl->gl_name.ln_number);
1848 	print_dbg(gi, "  gl_flags =");
1849 	for (x = 0; x < 32; x++) {
1850 		if (test_bit(x, &gl->gl_flags))
1851 			print_dbg(gi, " %u", x);
1852 	}
1853 	if (!test_bit(GLF_LOCK, &gl->gl_flags))
1854 		print_dbg(gi, " (unlocked)");
1855 	print_dbg(gi, " \n");
1856 	print_dbg(gi, "  gl_ref = %d\n", atomic_read(&gl->gl_ref));
1857 	print_dbg(gi, "  gl_state = %u\n", gl->gl_state);
1858 	if (gl->gl_owner_pid) {
1859 		gl_owner = find_task_by_pid(gl->gl_owner_pid);
1860 		if (gl_owner)
1861 			print_dbg(gi, "  gl_owner = pid %d (%s)\n",
1862 				  gl->gl_owner_pid, gl_owner->comm);
1863 		else
1864 			print_dbg(gi, "  gl_owner = %d (ended)\n",
1865 				  gl->gl_owner_pid);
1866 	} else
1867 		print_dbg(gi, "  gl_owner = -1\n");
1868 	print_dbg(gi, "  gl_ip = %lu\n", gl->gl_ip);
1869 	print_dbg(gi, "  req_gh = %s\n", (gl->gl_req_gh) ? "yes" : "no");
1870 	print_dbg(gi, "  req_bh = %s\n", (gl->gl_req_bh) ? "yes" : "no");
1871 	print_dbg(gi, "  lvb_count = %d\n", atomic_read(&gl->gl_lvb_count));
1872 	print_dbg(gi, "  object = %s\n", (gl->gl_object) ? "yes" : "no");
1873 	print_dbg(gi, "  le = %s\n",
1874 		   (list_empty(&gl->gl_le.le_list)) ? "no" : "yes");
1875 	print_dbg(gi, "  reclaim = %s\n",
1876 		   (list_empty(&gl->gl_reclaim)) ? "no" : "yes");
1877 	if (gl->gl_aspace)
1878 		print_dbg(gi, "  aspace = 0x%p nrpages = %lu\n", gl->gl_aspace,
1879 			   gl->gl_aspace->i_mapping->nrpages);
1880 	else
1881 		print_dbg(gi, "  aspace = no\n");
1882 	print_dbg(gi, "  ail = %d\n", atomic_read(&gl->gl_ail_count));
1883 	if (gl->gl_req_gh) {
1884 		error = dump_holder(gi, "Request", gl->gl_req_gh);
1885 		if (error)
1886 			goto out;
1887 	}
1888 	list_for_each_entry(gh, &gl->gl_holders, gh_list) {
1889 		error = dump_holder(gi, "Holder", gh);
1890 		if (error)
1891 			goto out;
1892 	}
1893 	list_for_each_entry(gh, &gl->gl_waiters1, gh_list) {
1894 		error = dump_holder(gi, "Waiter1", gh);
1895 		if (error)
1896 			goto out;
1897 	}
1898 	list_for_each_entry(gh, &gl->gl_waiters3, gh_list) {
1899 		error = dump_holder(gi, "Waiter3", gh);
1900 		if (error)
1901 			goto out;
1902 	}
1903 	if (test_bit(GLF_DEMOTE, &gl->gl_flags)) {
1904 		print_dbg(gi, "  Demotion req to state %u (%llu uS ago)\n",
1905 			  gl->gl_demote_state, (unsigned long long)
1906 			  (jiffies - gl->gl_demote_time)*(1000000/HZ));
1907 	}
1908 	if (gl->gl_ops == &gfs2_inode_glops && gl->gl_object) {
1909 		if (!test_bit(GLF_LOCK, &gl->gl_flags) &&
1910 			list_empty(&gl->gl_holders)) {
1911 			error = dump_inode(gi, gl->gl_object);
1912 			if (error)
1913 				goto out;
1914 		} else {
1915 			error = -ENOBUFS;
1916 			print_dbg(gi, "  Inode: busy\n");
1917 		}
1918 	}
1919 
1920 	error = 0;
1921 
1922 out:
1923 	spin_unlock(&gl->gl_spin);
1924 	return error;
1925 }
1926 
1927 /**
1928  * gfs2_dump_lockstate - print out the current lockstate
1929  * @sdp: the filesystem
1930  * @ub: the buffer to copy the information into
1931  *
1932  * If @ub is NULL, dump the lockstate to the console.
1933  *
1934  */
1935 
1936 static int gfs2_dump_lockstate(struct gfs2_sbd *sdp)
1937 {
1938 	struct gfs2_glock *gl;
1939 	struct hlist_node *h;
1940 	unsigned int x;
1941 	int error = 0;
1942 
1943 	for (x = 0; x < GFS2_GL_HASH_SIZE; x++) {
1944 
1945 		read_lock(gl_lock_addr(x));
1946 
1947 		hlist_for_each_entry(gl, h, &gl_hash_table[x].hb_list, gl_list) {
1948 			if (gl->gl_sbd != sdp)
1949 				continue;
1950 
1951 			error = dump_glock(NULL, gl);
1952 			if (error)
1953 				break;
1954 		}
1955 
1956 		read_unlock(gl_lock_addr(x));
1957 
1958 		if (error)
1959 			break;
1960 	}
1961 
1962 
1963 	return error;
1964 }
1965 
1966 int __init gfs2_glock_init(void)
1967 {
1968 	unsigned i;
1969 	for(i = 0; i < GFS2_GL_HASH_SIZE; i++) {
1970 		INIT_HLIST_HEAD(&gl_hash_table[i].hb_list);
1971 	}
1972 #ifdef GL_HASH_LOCK_SZ
1973 	for(i = 0; i < GL_HASH_LOCK_SZ; i++) {
1974 		rwlock_init(&gl_hash_locks[i]);
1975 	}
1976 #endif
1977 	return 0;
1978 }
1979 
1980 static int gfs2_glock_iter_next(struct glock_iter *gi)
1981 {
1982 	read_lock(gl_lock_addr(gi->hash));
1983 	while (1) {
1984 		if (!gi->hb_list) {  /* If we don't have a hash bucket yet */
1985 			gi->hb_list = &gl_hash_table[gi->hash].hb_list;
1986 			if (hlist_empty(gi->hb_list)) {
1987 				read_unlock(gl_lock_addr(gi->hash));
1988 				gi->hash++;
1989 				read_lock(gl_lock_addr(gi->hash));
1990 				gi->hb_list = NULL;
1991 				if (gi->hash >= GFS2_GL_HASH_SIZE) {
1992 					read_unlock(gl_lock_addr(gi->hash));
1993 					return 1;
1994 				}
1995 				else
1996 					continue;
1997 			}
1998 			if (!hlist_empty(gi->hb_list)) {
1999 				gi->gl = list_entry(gi->hb_list->first,
2000 						    struct gfs2_glock,
2001 						    gl_list);
2002 			}
2003 		} else {
2004 			if (gi->gl->gl_list.next == NULL) {
2005 				read_unlock(gl_lock_addr(gi->hash));
2006 				gi->hash++;
2007 				read_lock(gl_lock_addr(gi->hash));
2008 				gi->hb_list = NULL;
2009 				continue;
2010 			}
2011 			gi->gl = list_entry(gi->gl->gl_list.next,
2012 					    struct gfs2_glock, gl_list);
2013 		}
2014 		if (gi->gl)
2015 			break;
2016 	}
2017 	read_unlock(gl_lock_addr(gi->hash));
2018 	return 0;
2019 }
2020 
2021 static void gfs2_glock_iter_free(struct glock_iter *gi)
2022 {
2023 	kfree(gi);
2024 }
2025 
2026 static struct glock_iter *gfs2_glock_iter_init(struct gfs2_sbd *sdp)
2027 {
2028 	struct glock_iter *gi;
2029 
2030 	gi = kmalloc(sizeof (*gi), GFP_KERNEL);
2031 	if (!gi)
2032 		return NULL;
2033 
2034 	gi->sdp = sdp;
2035 	gi->hash = 0;
2036 	gi->gl = NULL;
2037 	gi->hb_list = NULL;
2038 	gi->seq = NULL;
2039 	memset(gi->string, 0, sizeof(gi->string));
2040 
2041 	if (gfs2_glock_iter_next(gi)) {
2042 		gfs2_glock_iter_free(gi);
2043 		return NULL;
2044 	}
2045 
2046 	return gi;
2047 }
2048 
2049 static void *gfs2_glock_seq_start(struct seq_file *file, loff_t *pos)
2050 {
2051 	struct glock_iter *gi;
2052 	loff_t n = *pos;
2053 
2054 	gi = gfs2_glock_iter_init(file->private);
2055 	if (!gi)
2056 		return NULL;
2057 
2058 	while (n--) {
2059 		if (gfs2_glock_iter_next(gi)) {
2060 			gfs2_glock_iter_free(gi);
2061 			return NULL;
2062 		}
2063 	}
2064 
2065 	return gi;
2066 }
2067 
2068 static void *gfs2_glock_seq_next(struct seq_file *file, void *iter_ptr,
2069 				 loff_t *pos)
2070 {
2071 	struct glock_iter *gi = iter_ptr;
2072 
2073 	(*pos)++;
2074 
2075 	if (gfs2_glock_iter_next(gi)) {
2076 		gfs2_glock_iter_free(gi);
2077 		return NULL;
2078 	}
2079 
2080 	return gi;
2081 }
2082 
2083 static void gfs2_glock_seq_stop(struct seq_file *file, void *iter_ptr)
2084 {
2085 	/* nothing for now */
2086 }
2087 
2088 static int gfs2_glock_seq_show(struct seq_file *file, void *iter_ptr)
2089 {
2090 	struct glock_iter *gi = iter_ptr;
2091 
2092 	gi->seq = file;
2093 	dump_glock(gi, gi->gl);
2094 
2095 	return 0;
2096 }
2097 
2098 static struct seq_operations gfs2_glock_seq_ops = {
2099 	.start = gfs2_glock_seq_start,
2100 	.next  = gfs2_glock_seq_next,
2101 	.stop  = gfs2_glock_seq_stop,
2102 	.show  = gfs2_glock_seq_show,
2103 };
2104 
2105 static int gfs2_debugfs_open(struct inode *inode, struct file *file)
2106 {
2107 	struct seq_file *seq;
2108 	int ret;
2109 
2110 	ret = seq_open(file, &gfs2_glock_seq_ops);
2111 	if (ret)
2112 		return ret;
2113 
2114 	seq = file->private_data;
2115 	seq->private = inode->i_private;
2116 
2117 	return 0;
2118 }
2119 
2120 static const struct file_operations gfs2_debug_fops = {
2121 	.owner   = THIS_MODULE,
2122 	.open    = gfs2_debugfs_open,
2123 	.read    = seq_read,
2124 	.llseek  = seq_lseek,
2125 	.release = seq_release
2126 };
2127 
2128 int gfs2_create_debugfs_file(struct gfs2_sbd *sdp)
2129 {
2130 	sdp->debugfs_dir = debugfs_create_dir(sdp->sd_table_name, gfs2_root);
2131 	if (!sdp->debugfs_dir)
2132 		return -ENOMEM;
2133 	sdp->debugfs_dentry_glocks = debugfs_create_file("glocks",
2134 							 S_IFREG | S_IRUGO,
2135 							 sdp->debugfs_dir, sdp,
2136 							 &gfs2_debug_fops);
2137 	if (!sdp->debugfs_dentry_glocks)
2138 		return -ENOMEM;
2139 
2140 	return 0;
2141 }
2142 
2143 void gfs2_delete_debugfs_file(struct gfs2_sbd *sdp)
2144 {
2145 	if (sdp && sdp->debugfs_dir) {
2146 		if (sdp->debugfs_dentry_glocks) {
2147 			debugfs_remove(sdp->debugfs_dentry_glocks);
2148 			sdp->debugfs_dentry_glocks = NULL;
2149 		}
2150 		debugfs_remove(sdp->debugfs_dir);
2151 		sdp->debugfs_dir = NULL;
2152 	}
2153 }
2154 
2155 int gfs2_register_debugfs(void)
2156 {
2157 	gfs2_root = debugfs_create_dir("gfs2", NULL);
2158 	return gfs2_root ? 0 : -ENOMEM;
2159 }
2160 
2161 void gfs2_unregister_debugfs(void)
2162 {
2163 	debugfs_remove(gfs2_root);
2164 	gfs2_root = NULL;
2165 }
2166